diff --git a/.gitignore b/.gitignore index ee5e45bf..41a71a83 100644 --- a/.gitignore +++ b/.gitignore @@ -6,6 +6,7 @@ # Temporary files, usually created by text editors (vim) *.swp *~ +.vscode # Created by setup.py sdist build/ diff --git a/pyperformance/data-files/benchmarks/bm_pathlib/run_benchmark.py b/pyperformance/data-files/benchmarks/bm_pathlib/run_benchmark.py index cda9b4be..ca221dc7 100644 --- a/pyperformance/data-files/benchmarks/bm_pathlib/run_benchmark.py +++ b/pyperformance/data-files/benchmarks/bm_pathlib/run_benchmark.py @@ -10,6 +10,7 @@ import pathlib import shutil import tempfile +from typing import Sequence import pyperf @@ -35,9 +36,7 @@ def setup(num_files): return tmp_path -def bench_pathlib(loops, tmp_path): - base_path = pathlib.Path(tmp_path) - +def warm_up_cache(base_path): # Warm up the filesystem cache and keep some objects in memory. path_objects = list(base_path.iterdir()) # FIXME: does this code really cache anything? @@ -45,22 +44,118 @@ def bench_pathlib(loops, tmp_path): p.stat() assert len(path_objects) == NUM_FILES, len(path_objects) + +def setup_single_benchmark(loops, tmp_path): + base_path = pathlib.Path(tmp_path) + warm_up_cache(base_path) range_it = range(loops) + + return base_path, range_it + + +def bench_pathlib_callable(loops, tmp_path, callable_): + base_path, range_it = setup_single_benchmark(loops, tmp_path) + t0 = pyperf.perf_counter() for _ in range_it: - # Do something simple with each path. - for p in base_path.iterdir(): - p.stat() - for p in base_path.glob("*.py"): - p.stat() - for p in base_path.iterdir(): - p.stat() - for p in base_path.glob("*.py"): - p.stat() + callable_(base_path) return pyperf.perf_counter() - t0 +def bench_pure_pathlib_callable(loops, paths, callable_): + range_it = range(loops) + + t0 = pyperf.perf_counter() + + for _ in range_it: + callable_(paths) + + return pyperf.perf_counter() - t0 + + +def do_simple_operations(base_path: pathlib.Path): + # Do something simple with each path. + for p in base_path.iterdir(): + p.stat() + for p in base_path.glob("*.py"): + p.stat() + for p in base_path.iterdir(): + p.stat() + for p in base_path.glob("*.py"): + p.stat() + + +def do_parent(paths: Sequence[pathlib.PurePath]): + for p in paths: + p.parent + + +def do_parents(paths: Sequence[pathlib.PurePath]): + # FIXME: this is not a good benchmark, because it creates a new list. However, otherwise it would be too slow + for p in paths[:300]: + list(p.parents) + + +def do_name(paths: Sequence[pathlib.PurePath]): + for p in paths: + p.name + + +def do_suffix(paths: Sequence[pathlib.PurePath]): + for p in paths: + p.suffix + + +def do_suffixes(paths: Sequence[pathlib.PurePath]): + for p in paths: + list(p.suffixes) + + +def do_stem(paths: Sequence[pathlib.PurePath]): + for p in paths: + p.stem + + +def do_parts(paths: Sequence[pathlib.PurePath]): + for p in paths: + list(p.parts) + + +def do_joinpath(paths: Sequence[pathlib.PurePath]): + for p in paths: + p.joinpath("foo") + + +def do_div(paths: Sequence[pathlib.PurePath]): + for p in paths: + p / "foo" + + +def do_with_name(paths: Sequence[pathlib.PurePath]): + for p in paths: + p.with_name("foo") + + +def do_with_suffix(paths: Sequence[pathlib.PurePath]): + for p in paths: + p.with_suffix(".py") + + +def do_relative_to(paths: Sequence[pathlib.PurePath]): + for p in paths: + p.relative_to("..") + + +def do_is_absolute(paths: Sequence[pathlib.PurePath]): + for p in paths: + p.is_absolute() + + +def do_is_reserved(paths: Sequence[pathlib.PurePath]): + for p in paths: + p.is_reserved() + if __name__ == "__main__": runner = pyperf.Runner() @@ -71,7 +166,24 @@ def bench_pathlib(loops, tmp_path): runner.metadata['pathlib_module'] = modname tmp_path = setup(NUM_FILES) + paths = tuple(pathlib.PurePath(*([f"foo{i}"] * i)) for i in range(NUM_FILES)) + try: - runner.bench_time_func('pathlib', bench_pathlib, tmp_path) + runner.bench_time_func('pathlib', bench_pathlib_callable, tmp_path, do_simple_operations) + runner.bench_time_func('pathlib_purepath_parent', bench_pure_pathlib_callable, paths, do_parent) + runner.bench_time_func('pathlib_purepath_parents', bench_pure_pathlib_callable, paths, do_parents) + runner.bench_time_func('pathlib_purepath_name', bench_pure_pathlib_callable, paths, do_name) + runner.bench_time_func('pathlib_purepath_suffix', bench_pure_pathlib_callable, paths, do_suffix) + runner.bench_time_func('pathlib_purepath_suffixes', bench_pure_pathlib_callable, paths, do_suffixes) + runner.bench_time_func('pathlib_purepath_stem', bench_pure_pathlib_callable, paths, do_stem) + runner.bench_time_func('pathlib_purepath_parts', bench_pure_pathlib_callable, paths, do_parts) + runner.bench_time_func('pathlib_purepath_joinpath', bench_pure_pathlib_callable, paths, do_joinpath) + runner.bench_time_func('pathlib_purepath_div', bench_pure_pathlib_callable, paths, do_div) + runner.bench_time_func('pathlib_purepath_with_name', bench_pure_pathlib_callable, paths, do_with_name) + runner.bench_time_func('pathlib_purepath_with_suffix', bench_pure_pathlib_callable, paths, do_with_suffix) + runner.bench_time_func('pathlib_purepath_relative_to', bench_pure_pathlib_callable, paths, do_relative_to) + runner.bench_time_func('pathlib_purepath_is_absolute', bench_pure_pathlib_callable, paths, do_is_absolute) + runner.bench_time_func('pathlib_purepath_is_reserved', bench_pure_pathlib_callable, paths, do_is_reserved) + finally: shutil.rmtree(tmp_path)