Home | History | Annotate | Download | only in importbench
      1 """Benchmark some basic import use-cases.
      2 
      3 The assumption is made that this benchmark is run in a fresh interpreter and
      4 thus has no external changes made to import-related attributes in sys.
      5 
      6 """
      7 from test.test_importlib import util
      8 import decimal
      9 import imp
     10 import importlib
     11 import importlib.machinery
     12 import json
     13 import os
     14 import py_compile
     15 import sys
     16 import tabnanny
     17 import timeit
     18 
     19 
     20 def bench(name, cleanup=lambda: None, *, seconds=1, repeat=3):
     21     """Bench the given statement as many times as necessary until total
     22     executions take one second."""
     23     stmt = "__import__({!r})".format(name)
     24     timer = timeit.Timer(stmt)
     25     for x in range(repeat):
     26         total_time = 0
     27         count = 0
     28         while total_time < seconds:
     29             try:
     30                 total_time += timer.timeit(1)
     31             finally:
     32                 cleanup()
     33             count += 1
     34         else:
     35             # One execution too far
     36             if total_time > seconds:
     37                 count -= 1
     38         yield count // seconds
     39 
     40 def from_cache(seconds, repeat):
     41     """sys.modules"""
     42     name = '<benchmark import>'
     43     module = imp.new_module(name)
     44     module.__file__ = '<test>'
     45     module.__package__ = ''
     46     with util.uncache(name):
     47         sys.modules[name] = module
     48         yield from bench(name, repeat=repeat, seconds=seconds)
     49 
     50 
     51 def builtin_mod(seconds, repeat):
     52     """Built-in module"""
     53     name = 'errno'
     54     if name in sys.modules:
     55         del sys.modules[name]
     56     # Relying on built-in importer being implicit.
     57     yield from bench(name, lambda: sys.modules.pop(name), repeat=repeat,
     58                      seconds=seconds)
     59 
     60 
     61 def source_wo_bytecode(seconds, repeat):
     62     """Source w/o bytecode: small"""
     63     sys.dont_write_bytecode = True
     64     try:
     65         name = '__importlib_test_benchmark__'
     66         # Clears out sys.modules and puts an entry at the front of sys.path.
     67         with util.create_modules(name) as mapping:
     68             assert not os.path.exists(imp.cache_from_source(mapping[name]))
     69             sys.meta_path.append(importlib.machinery.PathFinder)
     70             loader = (importlib.machinery.SourceFileLoader,
     71                       importlib.machinery.SOURCE_SUFFIXES)
     72             sys.path_hooks.append(importlib.machinery.FileFinder.path_hook(loader))
     73             yield from bench(name, lambda: sys.modules.pop(name), repeat=repeat,
     74                              seconds=seconds)
     75     finally:
     76         sys.dont_write_bytecode = False
     77 
     78 
     79 def _wo_bytecode(module):
     80     name = module.__name__
     81     def benchmark_wo_bytecode(seconds, repeat):
     82         """Source w/o bytecode: {}"""
     83         bytecode_path = imp.cache_from_source(module.__file__)
     84         if os.path.exists(bytecode_path):
     85             os.unlink(bytecode_path)
     86         sys.dont_write_bytecode = True
     87         try:
     88             yield from bench(name, lambda: sys.modules.pop(name),
     89                              repeat=repeat, seconds=seconds)
     90         finally:
     91             sys.dont_write_bytecode = False
     92 
     93     benchmark_wo_bytecode.__doc__ = benchmark_wo_bytecode.__doc__.format(name)
     94     return benchmark_wo_bytecode
     95 
     96 tabnanny_wo_bytecode = _wo_bytecode(tabnanny)
     97 decimal_wo_bytecode = _wo_bytecode(decimal)
     98 
     99 
    100 def source_writing_bytecode(seconds, repeat):
    101     """Source writing bytecode: small"""
    102     assert not sys.dont_write_bytecode
    103     name = '__importlib_test_benchmark__'
    104     with util.create_modules(name) as mapping:
    105         sys.meta_path.append(importlib.machinery.PathFinder)
    106         loader = (importlib.machinery.SourceFileLoader,
    107                   importlib.machinery.SOURCE_SUFFIXES)
    108         sys.path_hooks.append(importlib.machinery.FileFinder.path_hook(loader))
    109         def cleanup():
    110             sys.modules.pop(name)
    111             os.unlink(imp.cache_from_source(mapping[name]))
    112         for result in bench(name, cleanup, repeat=repeat, seconds=seconds):
    113             assert not os.path.exists(imp.cache_from_source(mapping[name]))
    114             yield result
    115 
    116 
    117 def _writing_bytecode(module):
    118     name = module.__name__
    119     def writing_bytecode_benchmark(seconds, repeat):
    120         """Source writing bytecode: {}"""
    121         assert not sys.dont_write_bytecode
    122         def cleanup():
    123             sys.modules.pop(name)
    124             os.unlink(imp.cache_from_source(module.__file__))
    125         yield from bench(name, cleanup, repeat=repeat, seconds=seconds)
    126 
    127     writing_bytecode_benchmark.__doc__ = (
    128                                 writing_bytecode_benchmark.__doc__.format(name))
    129     return writing_bytecode_benchmark
    130 
    131 tabnanny_writing_bytecode = _writing_bytecode(tabnanny)
    132 decimal_writing_bytecode = _writing_bytecode(decimal)
    133 
    134 
    135 def source_using_bytecode(seconds, repeat):
    136     """Source w/ bytecode: small"""
    137     name = '__importlib_test_benchmark__'
    138     with util.create_modules(name) as mapping:
    139         sys.meta_path.append(importlib.machinery.PathFinder)
    140         loader = (importlib.machinery.SourceFileLoader,
    141                   importlib.machinery.SOURCE_SUFFIXES)
    142         sys.path_hooks.append(importlib.machinery.FileFinder.path_hook(loader))
    143         py_compile.compile(mapping[name])
    144         assert os.path.exists(imp.cache_from_source(mapping[name]))
    145         yield from bench(name, lambda: sys.modules.pop(name), repeat=repeat,
    146                          seconds=seconds)
    147 
    148 
    149 def _using_bytecode(module):
    150     name = module.__name__
    151     def using_bytecode_benchmark(seconds, repeat):
    152         """Source w/ bytecode: {}"""
    153         py_compile.compile(module.__file__)
    154         yield from bench(name, lambda: sys.modules.pop(name), repeat=repeat,
    155                          seconds=seconds)
    156 
    157     using_bytecode_benchmark.__doc__ = (
    158                                 using_bytecode_benchmark.__doc__.format(name))
    159     return using_bytecode_benchmark
    160 
    161 tabnanny_using_bytecode = _using_bytecode(tabnanny)
    162 decimal_using_bytecode = _using_bytecode(decimal)
    163 
    164 
    165 def main(import_, options):
    166     if options.source_file:
    167         with options.source_file:
    168             prev_results = json.load(options.source_file)
    169     else:
    170         prev_results = {}
    171     __builtins__.__import__ = import_
    172     benchmarks = (from_cache, builtin_mod,
    173                   source_writing_bytecode,
    174                   source_wo_bytecode, source_using_bytecode,
    175                   tabnanny_writing_bytecode,
    176                   tabnanny_wo_bytecode, tabnanny_using_bytecode,
    177                   decimal_writing_bytecode,
    178                   decimal_wo_bytecode, decimal_using_bytecode,
    179                 )
    180     if options.benchmark:
    181         for b in benchmarks:
    182             if b.__doc__ == options.benchmark:
    183                 benchmarks = [b]
    184                 break
    185         else:
    186             print('Unknown benchmark: {!r}'.format(options.benchmark,
    187                   file=sys.stderr))
    188             sys.exit(1)
    189     seconds = 1
    190     seconds_plural = 's' if seconds > 1 else ''
    191     repeat = 3
    192     header = ('Measuring imports/second over {} second{}, best out of {}\n'
    193               'Entire benchmark run should take about {} seconds\n'
    194               'Using {!r} as __import__\n')
    195     print(header.format(seconds, seconds_plural, repeat,
    196                         len(benchmarks) * seconds * repeat, __import__))
    197     new_results = {}
    198     for benchmark in benchmarks:
    199         print(benchmark.__doc__, "[", end=' ')
    200         sys.stdout.flush()
    201         results = []
    202         for result in benchmark(seconds=seconds, repeat=repeat):
    203             results.append(result)
    204             print(result, end=' ')
    205             sys.stdout.flush()
    206         assert not sys.dont_write_bytecode
    207         print("]", "best is", format(max(results), ',d'))
    208         new_results[benchmark.__doc__] = results
    209     if prev_results:
    210         print('\n\nComparing new vs. old\n')
    211         for benchmark in benchmarks:
    212             benchmark_name = benchmark.__doc__
    213             old_result = max(prev_results[benchmark_name])
    214             new_result = max(new_results[benchmark_name])
    215             result = '{:,d} vs. {:,d} ({:%})'.format(new_result,
    216                                                      old_result,
    217                                               new_result/old_result)
    218             print(benchmark_name, ':', result)
    219     if options.dest_file:
    220         with options.dest_file:
    221             json.dump(new_results, options.dest_file, indent=2)
    222 
    223 
    224 if __name__ == '__main__':
    225     import argparse
    226 
    227     parser = argparse.ArgumentParser()
    228     parser.add_argument('-b', '--builtin', dest='builtin', action='store_true',
    229                         default=False, help="use the built-in __import__")
    230     parser.add_argument('-r', '--read', dest='source_file',
    231                         type=argparse.FileType('r'),
    232                         help='file to read benchmark data from to compare '
    233                              'against')
    234     parser.add_argument('-w', '--write', dest='dest_file',
    235                         type=argparse.FileType('w'),
    236                         help='file to write benchmark data to')
    237     parser.add_argument('--benchmark', dest='benchmark',
    238                         help='specific benchmark to run')
    239     options = parser.parse_args()
    240     import_ = __import__
    241     if not options.builtin:
    242         import_ = importlib.__import__
    243 
    244     main(import_, options)
    245