"""Benchmark some basic import use-cases. The assumption is made that this benchmark is run in a fresh interpreter and thus has no external changes made to import-related attributes in sys. """ from test.test_importlib import util import decimal import imp import importlib import importlib.machinery import json import os import py_compile import sys import tabnanny import timeit def bench(name, cleanup=lambda: None, *, seconds=1, repeat=3): """Bench the given statement as many times as necessary until total executions take one second.""" stmt = "__import__({!r})".format(name) timer = timeit.Timer(stmt) for x in range(repeat): total_time = 0 count = 0 while total_time < seconds: try: total_time += timer.timeit(1) finally: cleanup() count += 1 else: # One execution too far if total_time > seconds: count -= 1 yield count // seconds def from_cache(seconds, repeat): """sys.modules""" name = '' module = imp.new_module(name) module.__file__ = '' module.__package__ = '' with util.uncache(name): sys.modules[name] = module yield from bench(name, repeat=repeat, seconds=seconds) def builtin_mod(seconds, repeat): """Built-in module""" name = 'errno' if name in sys.modules: del sys.modules[name] # Relying on built-in importer being implicit. yield from bench(name, lambda: sys.modules.pop(name), repeat=repeat, seconds=seconds) def source_wo_bytecode(seconds, repeat): """Source w/o bytecode: small""" sys.dont_write_bytecode = True try: name = '__importlib_test_benchmark__' # Clears out sys.modules and puts an entry at the front of sys.path. with util.create_modules(name) as mapping: assert not os.path.exists(imp.cache_from_source(mapping[name])) sys.meta_path.append(importlib.machinery.PathFinder) loader = (importlib.machinery.SourceFileLoader, importlib.machinery.SOURCE_SUFFIXES) sys.path_hooks.append(importlib.machinery.FileFinder.path_hook(loader)) yield from bench(name, lambda: sys.modules.pop(name), repeat=repeat, seconds=seconds) finally: sys.dont_write_bytecode = False def _wo_bytecode(module): name = module.__name__ def benchmark_wo_bytecode(seconds, repeat): """Source w/o bytecode: {}""" bytecode_path = imp.cache_from_source(module.__file__) if os.path.exists(bytecode_path): os.unlink(bytecode_path) sys.dont_write_bytecode = True try: yield from bench(name, lambda: sys.modules.pop(name), repeat=repeat, seconds=seconds) finally: sys.dont_write_bytecode = False benchmark_wo_bytecode.__doc__ = benchmark_wo_bytecode.__doc__.format(name) return benchmark_wo_bytecode tabnanny_wo_bytecode = _wo_bytecode(tabnanny) decimal_wo_bytecode = _wo_bytecode(decimal) def source_writing_bytecode(seconds, repeat): """Source writing bytecode: small""" assert not sys.dont_write_bytecode name = '__importlib_test_benchmark__' with util.create_modules(name) as mapping: sys.meta_path.append(importlib.machinery.PathFinder) loader = (importlib.machinery.SourceFileLoader, importlib.machinery.SOURCE_SUFFIXES) sys.path_hooks.append(importlib.machinery.FileFinder.path_hook(loader)) def cleanup(): sys.modules.pop(name) os.unlink(imp.cache_from_source(mapping[name])) for result in bench(name, cleanup, repeat=repeat, seconds=seconds): assert not os.path.exists(imp.cache_from_source(mapping[name])) yield result def _writing_bytecode(module): name = module.__name__ def writing_bytecode_benchmark(seconds, repeat): """Source writing bytecode: {}""" assert not sys.dont_write_bytecode def cleanup(): sys.modules.pop(name) os.unlink(imp.cache_from_source(module.__file__)) yield from bench(name, cleanup, repeat=repeat, seconds=seconds) writing_bytecode_benchmark.__doc__ = ( writing_bytecode_benchmark.__doc__.format(name)) return writing_bytecode_benchmark tabnanny_writing_bytecode = _writing_bytecode(tabnanny) decimal_writing_bytecode = _writing_bytecode(decimal) def source_using_bytecode(seconds, repeat): """Source w/ bytecode: small""" name = '__importlib_test_benchmark__' with util.create_modules(name) as mapping: sys.meta_path.append(importlib.machinery.PathFinder) loader = (importlib.machinery.SourceFileLoader, importlib.machinery.SOURCE_SUFFIXES) sys.path_hooks.append(importlib.machinery.FileFinder.path_hook(loader)) py_compile.compile(mapping[name]) assert os.path.exists(imp.cache_from_source(mapping[name])) yield from bench(name, lambda: sys.modules.pop(name), repeat=repeat, seconds=seconds) def _using_bytecode(module): name = module.__name__ def using_bytecode_benchmark(seconds, repeat): """Source w/ bytecode: {}""" py_compile.compile(module.__file__) yield from bench(name, lambda: sys.modules.pop(name), repeat=repeat, seconds=seconds) using_bytecode_benchmark.__doc__ = ( using_bytecode_benchmark.__doc__.format(name)) return using_bytecode_benchmark tabnanny_using_bytecode = _using_bytecode(tabnanny) decimal_using_bytecode = _using_bytecode(decimal) def main(import_, options): if options.source_file: with options.source_file: prev_results = json.load(options.source_file) else: prev_results = {} __builtins__.__import__ = import_ benchmarks = (from_cache, builtin_mod, source_writing_bytecode, source_wo_bytecode, source_using_bytecode, tabnanny_writing_bytecode, tabnanny_wo_bytecode, tabnanny_using_bytecode, decimal_writing_bytecode, decimal_wo_bytecode, decimal_using_bytecode, ) if options.benchmark: for b in benchmarks: if b.__doc__ == options.benchmark: benchmarks = [b] break else: print('Unknown benchmark: {!r}'.format(options.benchmark), file=sys.stderr) sys.exit(1) seconds = 1 seconds_plural = 's' if seconds > 1 else '' repeat = 3 header = ('Measuring imports/second over {} second{}, best out of {}\n' 'Entire benchmark run should take about {} seconds\n' 'Using {!r} as __import__\n') print(header.format(seconds, seconds_plural, repeat, len(benchmarks) * seconds * repeat, __import__)) new_results = {} for benchmark in benchmarks: print(benchmark.__doc__, "[", end=' ') sys.stdout.flush() results = [] for result in benchmark(seconds=seconds, repeat=repeat): results.append(result) print(result, end=' ') sys.stdout.flush() assert not sys.dont_write_bytecode print("]", "best is", format(max(results), ',d')) new_results[benchmark.__doc__] = results if prev_results: print('\n\nComparing new vs. old\n') for benchmark in benchmarks: benchmark_name = benchmark.__doc__ old_result = max(prev_results[benchmark_name]) new_result = max(new_results[benchmark_name]) result = '{:,d} vs. {:,d} ({:%})'.format(new_result, old_result, new_result/old_result) print(benchmark_name, ':', result) if options.dest_file: with options.dest_file: json.dump(new_results, options.dest_file, indent=2) if __name__ == '__main__': import argparse parser = argparse.ArgumentParser() parser.add_argument('-b', '--builtin', dest='builtin', action='store_true', default=False, help="use the built-in __import__") parser.add_argument('-r', '--read', dest='source_file', type=argparse.FileType('r'), help='file to read benchmark data from to compare ' 'against') parser.add_argument('-w', '--write', dest='dest_file', type=argparse.FileType('w'), help='file to write benchmark data to') parser.add_argument('--benchmark', dest='benchmark', help='specific benchmark to run') options = parser.parse_args() import_ = __import__ if not options.builtin: import_ = importlib.__import__ main(import_, options)