blob: 8815ac3d6ac0c040cd48e25f61e6a4e1a2db9db2 [file] [log] [blame]
Guido van Rossumf06ee5f1996-11-27 19:52:01 +00001#! /usr/bin/env python
Guido van Rossum81762581992-04-21 15:36:23 +00002#
Guido van Rossumb6775db1994-08-01 11:34:53 +00003# Class for profiling python code. rev 1.0 6/2/94
Guido van Rossum81762581992-04-21 15:36:23 +00004#
Guido van Rossumb6775db1994-08-01 11:34:53 +00005# Based on prior profile module by Sjoerd Mullender...
6# which was hacked somewhat by: Guido van Rossum
Guido van Rossumb6775db1994-08-01 11:34:53 +00007
Guido van Rossum54f22ed2000-02-04 15:10:34 +00008"""Class for profiling Python code."""
Guido van Rossumb6775db1994-08-01 11:34:53 +00009
10# Copyright 1994, by InfoSeek Corporation, all rights reserved.
11# Written by James Roskind
Tim Peters2344fae2001-01-15 00:50:52 +000012#
Guido van Rossumb6775db1994-08-01 11:34:53 +000013# Permission to use, copy, modify, and distribute this Python software
14# and its associated documentation for any purpose (subject to the
15# restriction in the following sentence) without fee is hereby granted,
16# provided that the above copyright notice appears in all copies, and
17# that both that copyright notice and this permission notice appear in
18# supporting documentation, and that the name of InfoSeek not be used in
19# advertising or publicity pertaining to distribution of the software
20# without specific, written prior permission. This permission is
21# explicitly restricted to the copying and modification of the software
22# to remain in Python, compiled Python, or other languages (such as C)
23# wherein the modified or derived code is exclusively imported into a
24# Python module.
Tim Peters2344fae2001-01-15 00:50:52 +000025#
Guido van Rossumb6775db1994-08-01 11:34:53 +000026# INFOSEEK CORPORATION DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS
27# SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND
28# FITNESS. IN NO EVENT SHALL INFOSEEK CORPORATION BE LIABLE FOR ANY
29# SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER
30# RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF
31# CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
32# CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
33
34
Guido van Rossum81762581992-04-21 15:36:23 +000035
36import sys
Guido van Rossum4e160981992-09-02 20:43:20 +000037import os
Guido van Rossumb6775db1994-08-01 11:34:53 +000038import time
Guido van Rossum4e160981992-09-02 20:43:20 +000039import marshal
Nicholas Bastin824b1b22004-03-23 18:44:39 +000040from optparse import OptionParser
Guido van Rossum81762581992-04-21 15:36:23 +000041
Guido van Rossum48713e82004-03-23 19:19:21 +000042__all__ = ["run", "runctx", "help", "Profile"]
Guido van Rossum81762581992-04-21 15:36:23 +000043
Tim Peters2344fae2001-01-15 00:50:52 +000044# Sample timer for use with
Guido van Rossumb6775db1994-08-01 11:34:53 +000045#i_count = 0
46#def integer_timer():
Tim Peters2344fae2001-01-15 00:50:52 +000047# global i_count
48# i_count = i_count + 1
49# return i_count
Guido van Rossumb6775db1994-08-01 11:34:53 +000050#itimes = integer_timer # replace with C coded timer returning integers
Guido van Rossum81762581992-04-21 15:36:23 +000051
Guido van Rossumb6775db1994-08-01 11:34:53 +000052#**************************************************************************
53# The following are the static member functions for the profiler class
54# Note that an instance of Profile() is *not* needed to call them.
55#**************************************************************************
Guido van Rossum81762581992-04-21 15:36:23 +000056
Nicholas Bastin824b1b22004-03-23 18:44:39 +000057def run(statement, filename=None, sort=-1):
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000058 """Run statement under profiler optionally saving results in filename
Guido van Rossum4e160981992-09-02 20:43:20 +000059
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000060 This function takes a single argument that can be passed to the
61 "exec" statement, and an optional file name. In all cases this
62 routine attempts to "exec" its first argument and gather profiling
63 statistics from the execution. If no file name is present, then this
64 function automatically prints a simple profiling report, sorted by the
65 standard name string (file/line/function-name) that is presented in
66 each line.
67 """
Tim Peters2344fae2001-01-15 00:50:52 +000068 prof = Profile()
69 try:
70 prof = prof.run(statement)
71 except SystemExit:
72 pass
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000073 if filename is not None:
74 prof.dump_stats(filename)
Tim Peters2344fae2001-01-15 00:50:52 +000075 else:
Nicholas Bastin824b1b22004-03-23 18:44:39 +000076 return prof.print_stats(sort)
Guido van Rossume61fa0a1993-10-22 13:56:35 +000077
Nicholas Bastin1eb4bfc2004-03-22 20:12:56 +000078def runctx(statement, globals, locals, filename=None):
79 """Run statement under profiler, supplying your own globals and locals,
80 optionally saving results in filename.
81
82 statement and filename have the same semantics as profile.run
83 """
84 prof = Profile()
85 try:
86 prof = prof.runctx(statement, globals, locals)
87 except SystemExit:
88 pass
89
90 if filename is not None:
91 prof.dump_stats(filename)
92 else:
93 return prof.print_stats()
94
Johannes Gijsbersc0b194a2005-01-10 09:07:22 +000095# Backwards compatibility.
Guido van Rossume61fa0a1993-10-22 13:56:35 +000096def help():
Johannes Gijsbersc0b194a2005-01-10 09:07:22 +000097 print "Documentation for the profile module can be found "
98 print "in the Python Library Reference, section 'The Python Profiler'."
Guido van Rossumb6775db1994-08-01 11:34:53 +000099
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000100if os.name == "mac":
Jack Jansen1bdcadd2001-06-19 20:11:36 +0000101 import MacOS
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000102 def _get_time_mac(timer=MacOS.GetTicks):
103 return timer() / 60.0
104
105if hasattr(os, "times"):
106 def _get_time_times(timer=os.times):
107 t = timer()
108 return t[0] + t[1]
109
110
Guido van Rossumb6775db1994-08-01 11:34:53 +0000111class Profile:
Tim Peters2344fae2001-01-15 00:50:52 +0000112 """Profiler class.
Guido van Rossum54f22ed2000-02-04 15:10:34 +0000113
Tim Peters2344fae2001-01-15 00:50:52 +0000114 self.cur is always a tuple. Each such tuple corresponds to a stack
115 frame that is currently active (self.cur[-2]). The following are the
116 definitions of its members. We use this external "parallel stack" to
117 avoid contaminating the program that we are profiling. (old profiler
118 used to write into the frames local dictionary!!) Derived classes
119 can change the definition of some entries, as long as they leave
Tim Petersdf5cfd82001-10-05 23:15:10 +0000120 [-2:] intact (frame and previous tuple). In case an internal error is
121 detected, the -3 element is used as the function name.
Guido van Rossum54f22ed2000-02-04 15:10:34 +0000122
Tim Petersdf5cfd82001-10-05 23:15:10 +0000123 [ 0] = Time that needs to be charged to the parent frame's function.
124 It is used so that a function call will not have to access the
125 timing data for the parent frame.
126 [ 1] = Total time spent in this frame's function, excluding time in
Tim Peters8d061ed2001-10-07 08:35:44 +0000127 subfunctions (this latter is tallied in cur[2]).
Tim Petersfb163782001-10-07 08:49:02 +0000128 [ 2] = Total time spent in subfunctions, excluding time executing the
Tim Peters8d061ed2001-10-07 08:35:44 +0000129 frame's function (this latter is tallied in cur[1]).
Tim Petersdf5cfd82001-10-05 23:15:10 +0000130 [-3] = Name of the function that corresponds to this frame.
Tim Peters8d061ed2001-10-07 08:35:44 +0000131 [-2] = Actual frame that we correspond to (used to sync exception handling).
132 [-1] = Our parent 6-tuple (corresponds to frame.f_back).
Guido van Rossum54f22ed2000-02-04 15:10:34 +0000133
Tim Peters2344fae2001-01-15 00:50:52 +0000134 Timing data for each function is stored as a 5-tuple in the dictionary
Tim Petersdf5cfd82001-10-05 23:15:10 +0000135 self.timings[]. The index is always the name stored in self.cur[-3].
Tim Peters2344fae2001-01-15 00:50:52 +0000136 The following are the definitions of the members:
Guido van Rossumb6775db1994-08-01 11:34:53 +0000137
Tim Peters2344fae2001-01-15 00:50:52 +0000138 [0] = The number of times this function was called, not counting direct
139 or indirect recursion,
140 [1] = Number of times this function appears on the stack, minus one
141 [2] = Total time spent internal to this function
142 [3] = Cumulative time that this function was present on the stack. In
143 non-recursive functions, this is the total execution time from start
144 to finish of each invocation of a function, including time spent in
145 all subfunctions.
Tim Peters6e221492001-10-07 04:02:36 +0000146 [4] = A dictionary indicating for each function name, the number of times
Tim Peters2344fae2001-01-15 00:50:52 +0000147 it was called by us.
148 """
Guido van Rossumb6775db1994-08-01 11:34:53 +0000149
Tim Peters659a6032001-10-09 20:51:19 +0000150 bias = 0 # calibration constant
151
152 def __init__(self, timer=None, bias=None):
Tim Peters2344fae2001-01-15 00:50:52 +0000153 self.timings = {}
154 self.cur = None
155 self.cmd = ""
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000156 self.c_func_name = ""
Guido van Rossumb6775db1994-08-01 11:34:53 +0000157
Tim Peters659a6032001-10-09 20:51:19 +0000158 if bias is None:
159 bias = self.bias
160 self.bias = bias # Materialize in local dict for lookup speed.
161
Raymond Hettinger16e3c422002-06-01 16:07:16 +0000162 if timer is None:
Tim Peters2344fae2001-01-15 00:50:52 +0000163 if os.name == 'mac':
Tim Peters2344fae2001-01-15 00:50:52 +0000164 self.timer = MacOS.GetTicks
165 self.dispatcher = self.trace_dispatch_mac
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000166 self.get_time = _get_time_mac
Tim Peters2344fae2001-01-15 00:50:52 +0000167 elif hasattr(time, 'clock'):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000168 self.timer = self.get_time = time.clock
Tim Peters2344fae2001-01-15 00:50:52 +0000169 self.dispatcher = self.trace_dispatch_i
170 elif hasattr(os, 'times'):
171 self.timer = os.times
172 self.dispatcher = self.trace_dispatch
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000173 self.get_time = _get_time_times
Tim Peters2344fae2001-01-15 00:50:52 +0000174 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000175 self.timer = self.get_time = time.time
Tim Peters2344fae2001-01-15 00:50:52 +0000176 self.dispatcher = self.trace_dispatch_i
177 else:
178 self.timer = timer
179 t = self.timer() # test out timer function
180 try:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000181 length = len(t)
182 except TypeError:
183 self.get_time = timer
184 self.dispatcher = self.trace_dispatch_i
185 else:
186 if length == 2:
Tim Peters2344fae2001-01-15 00:50:52 +0000187 self.dispatcher = self.trace_dispatch
188 else:
189 self.dispatcher = self.trace_dispatch_l
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000190 # This get_time() implementation needs to be defined
191 # here to capture the passed-in timer in the parameter
192 # list (for performance). Note that we can't assume
193 # the timer() result contains two values in all
194 # cases.
Raymond Hettinger97aa32b2003-10-22 16:49:01 +0000195 def get_time_timer(timer=timer, sum=sum):
196 return sum(timer())
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000197 self.get_time = get_time_timer
Tim Peters2344fae2001-01-15 00:50:52 +0000198 self.t = self.get_time()
199 self.simulate_call('profiler')
Guido van Rossumb6775db1994-08-01 11:34:53 +0000200
Tim Peters2344fae2001-01-15 00:50:52 +0000201 # Heavily optimized dispatch routine for os.times() timer
Guido van Rossumb6775db1994-08-01 11:34:53 +0000202
Tim Peters2344fae2001-01-15 00:50:52 +0000203 def trace_dispatch(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000204 timer = self.timer
205 t = timer()
Tim Peters659a6032001-10-09 20:51:19 +0000206 t = t[0] + t[1] - self.t - self.bias
Tim Peters2344fae2001-01-15 00:50:52 +0000207
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000208 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000209 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000210
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000211 if self.dispatch[event](self, frame,t):
212 t = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000213 self.t = t[0] + t[1]
214 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000215 r = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000216 self.t = r[0] + r[1] - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000217
Tim Peters6e221492001-10-07 04:02:36 +0000218 # Dispatch routine for best timer program (return = scalar, fastest if
219 # an integer but float works too -- and time.clock() relies on that).
Guido van Rossumb6775db1994-08-01 11:34:53 +0000220
Tim Peters2344fae2001-01-15 00:50:52 +0000221 def trace_dispatch_i(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000222 timer = self.timer
Tim Peters659a6032001-10-09 20:51:19 +0000223 t = timer() - self.t - self.bias
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000224
225 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000226 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000227
228 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000229 self.t = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000230 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000231 self.t = timer() - t # put back unrecorded delta
Guido van Rossumcbf3dd51997-10-08 15:23:02 +0000232
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000233 # Dispatch routine for macintosh (timer returns time in ticks of
234 # 1/60th second)
Tim Peters2344fae2001-01-15 00:50:52 +0000235
236 def trace_dispatch_mac(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000237 timer = self.timer
Tim Peters659a6032001-10-09 20:51:19 +0000238 t = timer()/60.0 - self.t - self.bias
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000239
240 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000241 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000242
Tim Peters659a6032001-10-09 20:51:19 +0000243 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000244 self.t = timer()/60.0
Tim Peters2344fae2001-01-15 00:50:52 +0000245 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000246 self.t = timer()/60.0 - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000247
Tim Peters2344fae2001-01-15 00:50:52 +0000248 # SLOW generic dispatch routine for timer returning lists of numbers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000249
Tim Peters2344fae2001-01-15 00:50:52 +0000250 def trace_dispatch_l(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000251 get_time = self.get_time
Tim Peters659a6032001-10-09 20:51:19 +0000252 t = get_time() - self.t - self.bias
Guido van Rossumb6775db1994-08-01 11:34:53 +0000253
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000254 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000255 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000256
Tim Peters659a6032001-10-09 20:51:19 +0000257 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000258 self.t = get_time()
Tim Peters2344fae2001-01-15 00:50:52 +0000259 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000260 self.t = get_time() - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000261
Tim Peters8d061ed2001-10-07 08:35:44 +0000262 # In the event handlers, the first 3 elements of self.cur are unpacked
263 # into vrbls w/ 3-letter names. The last two characters are meant to be
264 # mnemonic:
265 # _pt self.cur[0] "parent time" time to be charged to parent frame
266 # _it self.cur[1] "internal time" time spent directly in the function
267 # _et self.cur[2] "external time" time spent in subfunctions
Guido van Rossumb6775db1994-08-01 11:34:53 +0000268
Tim Peters2344fae2001-01-15 00:50:52 +0000269 def trace_dispatch_exception(self, frame, t):
Tim Peters8d061ed2001-10-07 08:35:44 +0000270 rpt, rit, ret, rfn, rframe, rcur = self.cur
Fred Drakea0bc9992001-10-03 21:12:32 +0000271 if (rframe is not frame) and rcur:
Tim Peters2344fae2001-01-15 00:50:52 +0000272 return self.trace_dispatch_return(rframe, t)
Tim Peters8d061ed2001-10-07 08:35:44 +0000273 self.cur = rpt, rit+t, ret, rfn, rframe, rcur
Guido van Rossumf137f752001-10-04 00:58:24 +0000274 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000275
276
Tim Peters2344fae2001-01-15 00:50:52 +0000277 def trace_dispatch_call(self, frame, t):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000278 if self.cur and frame.f_back is not self.cur[-2]:
Tim Peters8d061ed2001-10-07 08:35:44 +0000279 rpt, rit, ret, rfn, rframe, rcur = self.cur
Guido van Rossumf137f752001-10-04 00:58:24 +0000280 if not isinstance(rframe, Profile.fake_frame):
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000281 assert rframe.f_back is frame.f_back, ("Bad call", rfn,
282 rframe, rframe.f_back,
283 frame, frame.f_back)
Guido van Rossumf137f752001-10-04 00:58:24 +0000284 self.trace_dispatch_return(rframe, 0)
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000285 assert (self.cur is None or \
286 frame.f_back is self.cur[-2]), ("Bad call",
287 self.cur[-3])
Tim Peters2344fae2001-01-15 00:50:52 +0000288 fcode = frame.f_code
289 fn = (fcode.co_filename, fcode.co_firstlineno, fcode.co_name)
290 self.cur = (t, 0, 0, fn, frame, self.cur)
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000291 timings = self.timings
Raymond Hettinger54f02222002-06-01 14:18:47 +0000292 if fn in timings:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000293 cc, ns, tt, ct, callers = timings[fn]
294 timings[fn] = cc, ns + 1, tt, ct, callers
Tim Peters2344fae2001-01-15 00:50:52 +0000295 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000296 timings[fn] = 0, 0, 0, 0, {}
Tim Peters2344fae2001-01-15 00:50:52 +0000297 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000298
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000299 def trace_dispatch_c_call (self, frame, t):
300 fn = ("", 0, self.c_func_name)
301 self.cur = (t, 0, 0, fn, frame, self.cur)
302 timings = self.timings
303 if timings.has_key(fn):
304 cc, ns, tt, ct, callers = timings[fn]
305 timings[fn] = cc, ns+1, tt, ct, callers
306 else:
307 timings[fn] = 0, 0, 0, 0, {}
308 return 1
309
Tim Peters2344fae2001-01-15 00:50:52 +0000310 def trace_dispatch_return(self, frame, t):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000311 if frame is not self.cur[-2]:
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000312 assert frame is self.cur[-2].f_back, ("Bad return", self.cur[-3])
313 self.trace_dispatch_return(self.cur[-2], 0)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000314
Tim Peters8d061ed2001-10-07 08:35:44 +0000315 # Prefix "r" means part of the Returning or exiting frame.
316 # Prefix "p" means part of the Previous or Parent or older frame.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000317
Tim Peters8d061ed2001-10-07 08:35:44 +0000318 rpt, rit, ret, rfn, frame, rcur = self.cur
319 rit = rit + t
320 frame_total = rit + ret
Guido van Rossumb6775db1994-08-01 11:34:53 +0000321
Tim Peters8d061ed2001-10-07 08:35:44 +0000322 ppt, pit, pet, pfn, pframe, pcur = rcur
323 self.cur = ppt, pit + rpt, pet + frame_total, pfn, pframe, pcur
Guido van Rossumb6775db1994-08-01 11:34:53 +0000324
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000325 timings = self.timings
326 cc, ns, tt, ct, callers = timings[rfn]
Tim Peters2344fae2001-01-15 00:50:52 +0000327 if not ns:
Tim Peters8d061ed2001-10-07 08:35:44 +0000328 # This is the only occurrence of the function on the stack.
329 # Else this is a (directly or indirectly) recursive call, and
330 # its cumulative time will get updated when the topmost call to
331 # it returns.
332 ct = ct + frame_total
Tim Peters2344fae2001-01-15 00:50:52 +0000333 cc = cc + 1
Tim Peters8d061ed2001-10-07 08:35:44 +0000334
Raymond Hettinger54f02222002-06-01 14:18:47 +0000335 if pfn in callers:
Tim Peters2344fae2001-01-15 00:50:52 +0000336 callers[pfn] = callers[pfn] + 1 # hack: gather more
337 # stats such as the amount of time added to ct courtesy
338 # of this specific call, and the contribution to cc
339 # courtesy of this call.
340 else:
341 callers[pfn] = 1
Tim Peters8d061ed2001-10-07 08:35:44 +0000342
343 timings[rfn] = cc, ns - 1, tt + rit, ct, callers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000344
Tim Peters2344fae2001-01-15 00:50:52 +0000345 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000346
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000347
348 dispatch = {
349 "call": trace_dispatch_call,
350 "exception": trace_dispatch_exception,
351 "return": trace_dispatch_return,
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000352 "c_call": trace_dispatch_c_call,
353 "c_exception": trace_dispatch_exception,
354 "c_return": trace_dispatch_return,
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000355 }
356
357
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000358 # The next few functions play with self.cmd. By carefully preloading
Tim Peters2344fae2001-01-15 00:50:52 +0000359 # our parallel stack, we can force the profiled result to include
360 # an arbitrary string as the name of the calling function.
361 # We use self.cmd as that string, and the resulting stats look
362 # very nice :-).
Guido van Rossumb6775db1994-08-01 11:34:53 +0000363
Tim Peters2344fae2001-01-15 00:50:52 +0000364 def set_cmd(self, cmd):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000365 if self.cur[-1]: return # already set
Tim Peters2344fae2001-01-15 00:50:52 +0000366 self.cmd = cmd
367 self.simulate_call(cmd)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000368
Tim Peters2344fae2001-01-15 00:50:52 +0000369 class fake_code:
370 def __init__(self, filename, line, name):
371 self.co_filename = filename
372 self.co_line = line
373 self.co_name = name
374 self.co_firstlineno = 0
Guido van Rossumb6775db1994-08-01 11:34:53 +0000375
Tim Peters2344fae2001-01-15 00:50:52 +0000376 def __repr__(self):
377 return repr((self.co_filename, self.co_line, self.co_name))
Guido van Rossumb6775db1994-08-01 11:34:53 +0000378
Tim Peters2344fae2001-01-15 00:50:52 +0000379 class fake_frame:
380 def __init__(self, code, prior):
381 self.f_code = code
382 self.f_back = prior
Guido van Rossumb6775db1994-08-01 11:34:53 +0000383
Tim Peters2344fae2001-01-15 00:50:52 +0000384 def simulate_call(self, name):
385 code = self.fake_code('profile', 0, name)
386 if self.cur:
Tim Petersdf5cfd82001-10-05 23:15:10 +0000387 pframe = self.cur[-2]
Tim Peters2344fae2001-01-15 00:50:52 +0000388 else:
389 pframe = None
390 frame = self.fake_frame(code, pframe)
Fred Draked10ed8b2001-10-17 01:49:50 +0000391 self.dispatch['call'](self, frame, 0)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000392
Tim Peters2344fae2001-01-15 00:50:52 +0000393 # collect stats from pending stack, including getting final
394 # timings for self.cmd frame.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000395
Tim Peters2344fae2001-01-15 00:50:52 +0000396 def simulate_cmd_complete(self):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000397 get_time = self.get_time
398 t = get_time() - self.t
Tim Petersdf5cfd82001-10-05 23:15:10 +0000399 while self.cur[-1]:
Tim Peters2344fae2001-01-15 00:50:52 +0000400 # We *can* cause assertion errors here if
401 # dispatch_trace_return checks for a frame match!
Fred Draked10ed8b2001-10-17 01:49:50 +0000402 self.dispatch['return'](self, self.cur[-2], t)
Tim Peters2344fae2001-01-15 00:50:52 +0000403 t = 0
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000404 self.t = get_time() - t
Guido van Rossumb6775db1994-08-01 11:34:53 +0000405
406
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000407 def print_stats(self, sort=-1):
Tim Peters2344fae2001-01-15 00:50:52 +0000408 import pstats
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000409 pstats.Stats(self).strip_dirs().sort_stats(sort). \
Tim Peters2344fae2001-01-15 00:50:52 +0000410 print_stats()
Guido van Rossumb6775db1994-08-01 11:34:53 +0000411
Tim Peters2344fae2001-01-15 00:50:52 +0000412 def dump_stats(self, file):
413 f = open(file, 'wb')
414 self.create_stats()
415 marshal.dump(self.stats, f)
416 f.close()
417
418 def create_stats(self):
419 self.simulate_cmd_complete()
420 self.snapshot_stats()
421
422 def snapshot_stats(self):
423 self.stats = {}
Raymond Hettingere0d49722002-06-02 18:55:56 +0000424 for func, (cc, ns, tt, ct, callers) in self.timings.iteritems():
Tim Peters2344fae2001-01-15 00:50:52 +0000425 callers = callers.copy()
426 nc = 0
Raymond Hettingere0d49722002-06-02 18:55:56 +0000427 for callcnt in callers.itervalues():
428 nc += callcnt
Tim Peters2344fae2001-01-15 00:50:52 +0000429 self.stats[func] = cc, nc, tt, ct, callers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000430
431
Tim Peters2344fae2001-01-15 00:50:52 +0000432 # The following two methods can be called by clients to use
433 # a profiler to profile a statement, given as a string.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000434
Tim Peters2344fae2001-01-15 00:50:52 +0000435 def run(self, cmd):
436 import __main__
437 dict = __main__.__dict__
438 return self.runctx(cmd, dict, dict)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000439
Tim Peters2344fae2001-01-15 00:50:52 +0000440 def runctx(self, cmd, globals, locals):
441 self.set_cmd(cmd)
442 sys.setprofile(self.dispatcher)
443 try:
444 exec cmd in globals, locals
445 finally:
446 sys.setprofile(None)
447 return self
Guido van Rossumb6775db1994-08-01 11:34:53 +0000448
Tim Peters2344fae2001-01-15 00:50:52 +0000449 # This method is more useful to profile a single function call.
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000450 def runcall(self, func, *args, **kw):
Walter Dörwald70a6b492004-02-12 17:35:32 +0000451 self.set_cmd(repr(func))
Tim Peters2344fae2001-01-15 00:50:52 +0000452 sys.setprofile(self.dispatcher)
453 try:
Guido van Rossum68468eb2003-02-27 20:14:51 +0000454 return func(*args, **kw)
Tim Peters2344fae2001-01-15 00:50:52 +0000455 finally:
456 sys.setprofile(None)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000457
Tim Peters2344fae2001-01-15 00:50:52 +0000458
459 #******************************************************************
460 # The following calculates the overhead for using a profiler. The
461 # problem is that it takes a fair amount of time for the profiler
462 # to stop the stopwatch (from the time it receives an event).
463 # Similarly, there is a delay from the time that the profiler
464 # re-starts the stopwatch before the user's code really gets to
465 # continue. The following code tries to measure the difference on
Tim Peters659a6032001-10-09 20:51:19 +0000466 # a per-event basis.
467 #
468 # Note that this difference is only significant if there are a lot of
Tim Peters2344fae2001-01-15 00:50:52 +0000469 # events, and relatively little user code per event. For example,
470 # code with small functions will typically benefit from having the
471 # profiler calibrated for the current platform. This *could* be
472 # done on the fly during init() time, but it is not worth the
473 # effort. Also note that if too large a value specified, then
474 # execution time on some functions will actually appear as a
475 # negative number. It is *normal* for some functions (with very
476 # low call counts) to have such negative stats, even if the
477 # calibration figure is "correct."
478 #
479 # One alternative to profile-time calibration adjustments (i.e.,
480 # adding in the magic little delta during each event) is to track
481 # more carefully the number of events (and cumulatively, the number
482 # of events during sub functions) that are seen. If this were
483 # done, then the arithmetic could be done after the fact (i.e., at
484 # display time). Currently, we track only call/return events.
485 # These values can be deduced by examining the callees and callers
486 # vectors for each functions. Hence we *can* almost correct the
487 # internal time figure at print time (note that we currently don't
488 # track exception event processing counts). Unfortunately, there
489 # is currently no similar information for cumulative sub-function
490 # time. It would not be hard to "get all this info" at profiler
491 # time. Specifically, we would have to extend the tuples to keep
492 # counts of this in each frame, and then extend the defs of timing
493 # tuples to include the significant two figures. I'm a bit fearful
494 # that this additional feature will slow the heavily optimized
495 # event/time ratio (i.e., the profiler would run slower, fur a very
496 # low "value added" feature.)
Tim Peters2344fae2001-01-15 00:50:52 +0000497 #**************************************************************
498
Tim Peterscce092d2001-10-09 05:31:56 +0000499 def calibrate(self, m, verbose=0):
Tim Peters659a6032001-10-09 20:51:19 +0000500 if self.__class__ is not Profile:
501 raise TypeError("Subclasses must override .calibrate().")
502
503 saved_bias = self.bias
504 self.bias = 0
505 try:
Tim Peterse13cc922001-10-09 21:01:31 +0000506 return self._calibrate_inner(m, verbose)
Tim Peters659a6032001-10-09 20:51:19 +0000507 finally:
508 self.bias = saved_bias
509
Tim Peterse13cc922001-10-09 21:01:31 +0000510 def _calibrate_inner(self, m, verbose):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000511 get_time = self.get_time
Tim Peters2344fae2001-01-15 00:50:52 +0000512
Tim Peterscce092d2001-10-09 05:31:56 +0000513 # Set up a test case to be run with and without profiling. Include
514 # lots of calls, because we're trying to quantify stopwatch overhead.
515 # Do not raise any exceptions, though, because we want to know
516 # exactly how many profile events are generated (one call event, +
517 # one return event, per Python-level call).
Tim Peters2344fae2001-01-15 00:50:52 +0000518
Tim Peterscce092d2001-10-09 05:31:56 +0000519 def f1(n):
520 for i in range(n):
521 x = 1
Tim Peters2344fae2001-01-15 00:50:52 +0000522
Tim Peterscce092d2001-10-09 05:31:56 +0000523 def f(m, f1=f1):
524 for i in range(m):
525 f1(100)
Tim Peters2344fae2001-01-15 00:50:52 +0000526
Tim Peterscce092d2001-10-09 05:31:56 +0000527 f(m) # warm up the cache
528
529 # elapsed_noprofile <- time f(m) takes without profiling.
530 t0 = get_time()
531 f(m)
532 t1 = get_time()
533 elapsed_noprofile = t1 - t0
534 if verbose:
535 print "elapsed time without profiling =", elapsed_noprofile
536
537 # elapsed_profile <- time f(m) takes with profiling. The difference
538 # is profiling overhead, only some of which the profiler subtracts
539 # out on its own.
540 p = Profile()
541 t0 = get_time()
542 p.runctx('f(m)', globals(), locals())
543 t1 = get_time()
544 elapsed_profile = t1 - t0
545 if verbose:
546 print "elapsed time with profiling =", elapsed_profile
547
548 # reported_time <- "CPU seconds" the profiler charged to f and f1.
549 total_calls = 0.0
550 reported_time = 0.0
551 for (filename, line, funcname), (cc, ns, tt, ct, callers) in \
552 p.timings.items():
553 if funcname in ("f", "f1"):
554 total_calls += cc
555 reported_time += tt
556
557 if verbose:
558 print "'CPU seconds' profiler reported =", reported_time
559 print "total # calls =", total_calls
560 if total_calls != m + 1:
561 raise ValueError("internal error: total calls = %d" % total_calls)
562
563 # reported_time - elapsed_noprofile = overhead the profiler wasn't
564 # able to measure. Divide by twice the number of calls (since there
565 # are two profiler events per call in this test) to get the hidden
566 # overhead per event.
567 mean = (reported_time - elapsed_noprofile) / 2.0 / total_calls
568 if verbose:
569 print "mean stopwatch overhead per profile event =", mean
570 return mean
Guido van Rossumb6775db1994-08-01 11:34:53 +0000571
Guido van Rossumb6775db1994-08-01 11:34:53 +0000572#****************************************************************************
573def Stats(*args):
Tim Peters2344fae2001-01-15 00:50:52 +0000574 print 'Report generating functions are in the "pstats" module\a'
Guido van Rossumcc778eb1996-10-01 02:55:54 +0000575
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000576def main():
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000577 usage = "profile.py [-o output_file_path] [-s sort] scriptfile [arg] ..."
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000578 parser = OptionParser(usage=usage)
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000579 parser.allow_interspersed_args = False
Tim Peters4e0e1b62004-07-07 20:54:48 +0000580 parser.add_option('-o', '--outfile', dest="outfile",
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000581 help="Save stats to <outfile>", default=None)
582 parser.add_option('-s', '--sort', dest="sort",
583 help="Sort order when printing to stdout, based on pstats.Stats class", default=-1)
Tim Petersb497c102005-01-10 16:48:37 +0000584
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000585 if not sys.argv[1:]:
586 parser.print_usage()
587 sys.exit(2)
Tim Petersb497c102005-01-10 16:48:37 +0000588
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000589 (options, args) = parser.parse_args()
590 sys.argv[:] = args
Tim Petersb497c102005-01-10 16:48:37 +0000591
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000592 if (len(sys.argv) > 0):
593 sys.path.insert(0, os.path.dirname(sys.argv[0]))
594 run('execfile(%r)' % (sys.argv[0],), options.outfile, options.sort)
595 else:
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000596 parser.print_usage()
597 return parser
598
599# When invoked as main program, invoke the profiler on a script
600if __name__ == '__main__':
601 main()