timeit.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337
  1. #! /usr/bin/env python3
  2. """Tool for measuring execution time of small code snippets.
  3. This module avoids a number of common traps for measuring execution
  4. times. See also Tim Peters' introduction to the Algorithms chapter in
  5. the Python Cookbook, published by O'Reilly.
  6. Library usage: see the Timer class.
  7. Command line usage:
  8. python timeit.py [-n N] [-r N] [-s S] [-u U] [-t] [-c] [-p] [-v] [-h] [--] [statement]
  9. Options:
  10. -n/--number N: how many times to execute 'statement' (default: see below)
  11. -r/--repeat N: how many times to repeat the timer (default 3)
  12. -s/--setup S: statement to be executed once initially (default 'pass').
  13. Execution time of this setup statement is NOT timed.
  14. -p/--process: use time.process_time() (default is time.perf_counter())
  15. -t/--time: use time.time() (deprecated)
  16. -c/--clock: use time.clock() (deprecated)
  17. -v/--verbose: print raw timing results; repeat for more digits precision
  18. -u/--unit: set the output time unit (usec, msec, or sec)
  19. -h/--help: print this usage message and exit
  20. --: separate options from statement, use when statement starts with -
  21. statement: statement to be timed (default 'pass')
  22. A multi-line statement may be given by specifying each line as a
  23. separate argument; indented lines are possible by enclosing an
  24. argument in quotes and using leading spaces. Multiple -s options are
  25. treated similarly.
  26. If -n is not given, a suitable number of loops is calculated by trying
  27. successive powers of 10 until the total time is at least 0.2 seconds.
  28. Note: there is a certain baseline overhead associated with executing a
  29. pass statement. It differs between versions. The code here doesn't try
  30. to hide it, but you should be aware of it. The baseline overhead can be
  31. measured by invoking the program without arguments.
  32. Classes:
  33. Timer
  34. Functions:
  35. timeit(string, string) -> float
  36. repeat(string, string) -> list
  37. default_timer() -> float
  38. """
  39. import gc
  40. import sys
  41. import time
  42. import itertools
  43. __all__ = ["Timer", "timeit", "repeat", "default_timer"]
  44. dummy_src_name = "<timeit-src>"
  45. default_number = 1000000
  46. default_repeat = 3
  47. default_timer = time.perf_counter
  48. _globals = globals
  49. # Don't change the indentation of the template; the reindent() calls
  50. # in Timer.__init__() depend on setup being indented 4 spaces and stmt
  51. # being indented 8 spaces.
  52. template = """
  53. def inner(_it, _timer{init}):
  54. {setup}
  55. _t0 = _timer()
  56. for _i in _it:
  57. {stmt}
  58. _t1 = _timer()
  59. return _t1 - _t0
  60. """
  61. def reindent(src, indent):
  62. """Helper to reindent a multi-line statement."""
  63. return src.replace("\n", "\n" + " "*indent)
  64. class Timer:
  65. """Class for timing execution speed of small code snippets.
  66. The constructor takes a statement to be timed, an additional
  67. statement used for setup, and a timer function. Both statements
  68. default to 'pass'; the timer function is platform-dependent (see
  69. module doc string). If 'globals' is specified, the code will be
  70. executed within that namespace (as opposed to inside timeit's
  71. namespace).
  72. To measure the execution time of the first statement, use the
  73. timeit() method. The repeat() method is a convenience to call
  74. timeit() multiple times and return a list of results.
  75. The statements may contain newlines, as long as they don't contain
  76. multi-line string literals.
  77. """
  78. def __init__(self, stmt="pass", setup="pass", timer=default_timer,
  79. globals=None):
  80. """Constructor. See class doc string."""
  81. self.timer = timer
  82. local_ns = {}
  83. global_ns = _globals() if globals is None else globals
  84. init = ''
  85. if isinstance(setup, str):
  86. # Check that the code can be compiled outside a function
  87. compile(setup, dummy_src_name, "exec")
  88. stmtprefix = setup + '\n'
  89. setup = reindent(setup, 4)
  90. elif callable(setup):
  91. local_ns['_setup'] = setup
  92. init += ', _setup=_setup'
  93. stmtprefix = ''
  94. setup = '_setup()'
  95. else:
  96. raise ValueError("setup is neither a string nor callable")
  97. if isinstance(stmt, str):
  98. # Check that the code can be compiled outside a function
  99. compile(stmtprefix + stmt, dummy_src_name, "exec")
  100. stmt = reindent(stmt, 8)
  101. elif callable(stmt):
  102. local_ns['_stmt'] = stmt
  103. init += ', _stmt=_stmt'
  104. stmt = '_stmt()'
  105. else:
  106. raise ValueError("stmt is neither a string nor callable")
  107. src = template.format(stmt=stmt, setup=setup, init=init)
  108. self.src = src # Save for traceback display
  109. code = compile(src, dummy_src_name, "exec")
  110. exec(code, global_ns, local_ns)
  111. self.inner = local_ns["inner"]
  112. def print_exc(self, file=None):
  113. """Helper to print a traceback from the timed code.
  114. Typical use:
  115. t = Timer(...) # outside the try/except
  116. try:
  117. t.timeit(...) # or t.repeat(...)
  118. except:
  119. t.print_exc()
  120. The advantage over the standard traceback is that source lines
  121. in the compiled template will be displayed.
  122. The optional file argument directs where the traceback is
  123. sent; it defaults to sys.stderr.
  124. """
  125. import linecache, traceback
  126. if self.src is not None:
  127. linecache.cache[dummy_src_name] = (len(self.src),
  128. None,
  129. self.src.split("\n"),
  130. dummy_src_name)
  131. # else the source is already stored somewhere else
  132. traceback.print_exc(file=file)
  133. def timeit(self, number=default_number):
  134. """Time 'number' executions of the main statement.
  135. To be precise, this executes the setup statement once, and
  136. then returns the time it takes to execute the main statement
  137. a number of times, as a float measured in seconds. The
  138. argument is the number of times through the loop, defaulting
  139. to one million. The main statement, the setup statement and
  140. the timer function to be used are passed to the constructor.
  141. """
  142. it = itertools.repeat(None, number)
  143. gcold = gc.isenabled()
  144. gc.disable()
  145. try:
  146. timing = self.inner(it, self.timer)
  147. finally:
  148. if gcold:
  149. gc.enable()
  150. return timing
  151. def repeat(self, repeat=default_repeat, number=default_number):
  152. """Call timeit() a few times.
  153. This is a convenience function that calls the timeit()
  154. repeatedly, returning a list of results. The first argument
  155. specifies how many times to call timeit(), defaulting to 3;
  156. the second argument specifies the timer argument, defaulting
  157. to one million.
  158. Note: it's tempting to calculate mean and standard deviation
  159. from the result vector and report these. However, this is not
  160. very useful. In a typical case, the lowest value gives a
  161. lower bound for how fast your machine can run the given code
  162. snippet; higher values in the result vector are typically not
  163. caused by variability in Python's speed, but by other
  164. processes interfering with your timing accuracy. So the min()
  165. of the result is probably the only number you should be
  166. interested in. After that, you should look at the entire
  167. vector and apply common sense rather than statistics.
  168. """
  169. r = []
  170. for i in range(repeat):
  171. t = self.timeit(number)
  172. r.append(t)
  173. return r
  174. def timeit(stmt="pass", setup="pass", timer=default_timer,
  175. number=default_number, globals=None):
  176. """Convenience function to create Timer object and call timeit method."""
  177. return Timer(stmt, setup, timer, globals).timeit(number)
  178. def repeat(stmt="pass", setup="pass", timer=default_timer,
  179. repeat=default_repeat, number=default_number, globals=None):
  180. """Convenience function to create Timer object and call repeat method."""
  181. return Timer(stmt, setup, timer, globals).repeat(repeat, number)
  182. def main(args=None, *, _wrap_timer=None):
  183. """Main program, used when run as a script.
  184. The optional 'args' argument specifies the command line to be parsed,
  185. defaulting to sys.argv[1:].
  186. The return value is an exit code to be passed to sys.exit(); it
  187. may be None to indicate success.
  188. When an exception happens during timing, a traceback is printed to
  189. stderr and the return value is 1. Exceptions at other times
  190. (including the template compilation) are not caught.
  191. '_wrap_timer' is an internal interface used for unit testing. If it
  192. is not None, it must be a callable that accepts a timer function
  193. and returns another timer function (used for unit testing).
  194. """
  195. if args is None:
  196. args = sys.argv[1:]
  197. import getopt
  198. try:
  199. opts, args = getopt.getopt(args, "n:u:s:r:tcpvh",
  200. ["number=", "setup=", "repeat=",
  201. "time", "clock", "process",
  202. "verbose", "unit=", "help"])
  203. except getopt.error as err:
  204. print(err)
  205. print("use -h/--help for command line help")
  206. return 2
  207. timer = default_timer
  208. stmt = "\n".join(args) or "pass"
  209. number = 0 # auto-determine
  210. setup = []
  211. repeat = default_repeat
  212. verbose = 0
  213. time_unit = None
  214. units = {"usec": 1, "msec": 1e3, "sec": 1e6}
  215. precision = 3
  216. for o, a in opts:
  217. if o in ("-n", "--number"):
  218. number = int(a)
  219. if o in ("-s", "--setup"):
  220. setup.append(a)
  221. if o in ("-u", "--unit"):
  222. if a in units:
  223. time_unit = a
  224. else:
  225. print("Unrecognized unit. Please select usec, msec, or sec.",
  226. file=sys.stderr)
  227. return 2
  228. if o in ("-r", "--repeat"):
  229. repeat = int(a)
  230. if repeat <= 0:
  231. repeat = 1
  232. if o in ("-t", "--time"):
  233. timer = time.time
  234. if o in ("-c", "--clock"):
  235. timer = time.clock
  236. if o in ("-p", "--process"):
  237. timer = time.process_time
  238. if o in ("-v", "--verbose"):
  239. if verbose:
  240. precision += 1
  241. verbose += 1
  242. if o in ("-h", "--help"):
  243. print(__doc__, end=' ')
  244. return 0
  245. setup = "\n".join(setup) or "pass"
  246. # Include the current directory, so that local imports work (sys.path
  247. # contains the directory of this script, rather than the current
  248. # directory)
  249. import os
  250. sys.path.insert(0, os.curdir)
  251. if _wrap_timer is not None:
  252. timer = _wrap_timer(timer)
  253. t = Timer(stmt, setup, timer)
  254. if number == 0:
  255. # determine number so that 0.2 <= total time < 2.0
  256. for i in range(1, 10):
  257. number = 10**i
  258. try:
  259. x = t.timeit(number)
  260. except:
  261. t.print_exc()
  262. return 1
  263. if verbose:
  264. print("%d loops -> %.*g secs" % (number, precision, x))
  265. if x >= 0.2:
  266. break
  267. try:
  268. r = t.repeat(repeat, number)
  269. except:
  270. t.print_exc()
  271. return 1
  272. best = min(r)
  273. if verbose:
  274. print("raw times:", " ".join(["%.*g" % (precision, x) for x in r]))
  275. print("%d loops," % number, end=' ')
  276. usec = best * 1e6 / number
  277. if time_unit is not None:
  278. print("best of %d: %.*g %s per loop" % (repeat, precision,
  279. usec/units[time_unit], time_unit))
  280. else:
  281. if usec < 1000:
  282. print("best of %d: %.*g usec per loop" % (repeat, precision, usec))
  283. else:
  284. msec = usec / 1000
  285. if msec < 1000:
  286. print("best of %d: %.*g msec per loop" % (repeat,
  287. precision, msec))
  288. else:
  289. sec = msec / 1000
  290. print("best of %d: %.*g sec per loop" % (repeat,
  291. precision, sec))
  292. return None
  293. if __name__ == "__main__":
  294. sys.exit(main())