blob: 297e32d64add7604dcad9156d0d7534df483c064 [file] [log] [blame]
Benjamin Peterson90f5ba52010-03-11 22:53:45 +00001#! /usr/bin/env python3
Guido van Rossum81762581992-04-21 15:36:23 +00002#
Guido van Rossumb6775db1994-08-01 11:34:53 +00003# Class for profiling python code. rev 1.0 6/2/94
Guido van Rossum81762581992-04-21 15:36:23 +00004#
Benjamin Peterson8d770692011-06-27 09:14:34 -05005# Written by James Roskind
Guido van Rossumb6775db1994-08-01 11:34:53 +00006# Based on prior profile module by Sjoerd Mullender...
7# which was hacked somewhat by: Guido van Rossum
Guido van Rossumb6775db1994-08-01 11:34:53 +00008
Guido van Rossum54f22ed2000-02-04 15:10:34 +00009"""Class for profiling Python code."""
Guido van Rossumb6775db1994-08-01 11:34:53 +000010
Benjamin Peterson8d770692011-06-27 09:14:34 -050011# Copyright Disney Enterprises, Inc. All Rights Reserved.
12# Licensed to PSF under a Contributor Agreement
Benjamin Peterson0f93d3d2011-06-27 09:18:46 -050013#
Benjamin Peterson8d770692011-06-27 09:14:34 -050014# Licensed under the Apache License, Version 2.0 (the "License");
15# you may not use this file except in compliance with the License.
16# You may obtain a copy of the License at
Benjamin Peterson0f93d3d2011-06-27 09:18:46 -050017#
Benjamin Peterson8d770692011-06-27 09:14:34 -050018# http://www.apache.org/licenses/LICENSE-2.0
Benjamin Peterson0f93d3d2011-06-27 09:18:46 -050019#
Benjamin Peterson8d770692011-06-27 09:14:34 -050020# Unless required by applicable law or agreed to in writing, software
21# distributed under the License is distributed on an "AS IS" BASIS,
22# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
23# either express or implied. See the License for the specific language
24# governing permissions and limitations under the License.
Guido van Rossumb6775db1994-08-01 11:34:53 +000025
Guido van Rossum81762581992-04-21 15:36:23 +000026
27import sys
Guido van Rossum4e160981992-09-02 20:43:20 +000028import os
Guido van Rossumb6775db1994-08-01 11:34:53 +000029import time
Guido van Rossum4e160981992-09-02 20:43:20 +000030import marshal
Nicholas Bastin824b1b22004-03-23 18:44:39 +000031from optparse import OptionParser
Guido van Rossum81762581992-04-21 15:36:23 +000032
Georg Brandlb6b13242009-09-04 17:15:16 +000033__all__ = ["run", "runctx", "Profile"]
Guido van Rossum81762581992-04-21 15:36:23 +000034
Tim Peters2344fae2001-01-15 00:50:52 +000035# Sample timer for use with
Guido van Rossumb6775db1994-08-01 11:34:53 +000036#i_count = 0
37#def integer_timer():
Tim Peters2344fae2001-01-15 00:50:52 +000038# global i_count
39# i_count = i_count + 1
40# return i_count
Guido van Rossumb6775db1994-08-01 11:34:53 +000041#itimes = integer_timer # replace with C coded timer returning integers
Guido van Rossum81762581992-04-21 15:36:23 +000042
Guido van Rossumb6775db1994-08-01 11:34:53 +000043#**************************************************************************
44# The following are the static member functions for the profiler class
45# Note that an instance of Profile() is *not* needed to call them.
46#**************************************************************************
Guido van Rossum81762581992-04-21 15:36:23 +000047
Nicholas Bastin824b1b22004-03-23 18:44:39 +000048def run(statement, filename=None, sort=-1):
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000049 """Run statement under profiler optionally saving results in filename
Guido van Rossum4e160981992-09-02 20:43:20 +000050
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000051 This function takes a single argument that can be passed to the
52 "exec" statement, and an optional file name. In all cases this
53 routine attempts to "exec" its first argument and gather profiling
54 statistics from the execution. If no file name is present, then this
55 function automatically prints a simple profiling report, sorted by the
56 standard name string (file/line/function-name) that is presented in
57 each line.
58 """
Tim Peters2344fae2001-01-15 00:50:52 +000059 prof = Profile()
60 try:
61 prof = prof.run(statement)
62 except SystemExit:
63 pass
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000064 if filename is not None:
65 prof.dump_stats(filename)
Tim Peters2344fae2001-01-15 00:50:52 +000066 else:
Nicholas Bastin824b1b22004-03-23 18:44:39 +000067 return prof.print_stats(sort)
Guido van Rossume61fa0a1993-10-22 13:56:35 +000068
Georg Brandl8e43fbf2010-08-02 12:20:23 +000069def runctx(statement, globals, locals, filename=None, sort=-1):
Nicholas Bastin1eb4bfc2004-03-22 20:12:56 +000070 """Run statement under profiler, supplying your own globals and locals,
71 optionally saving results in filename.
72
73 statement and filename have the same semantics as profile.run
74 """
75 prof = Profile()
76 try:
77 prof = prof.runctx(statement, globals, locals)
78 except SystemExit:
79 pass
80
81 if filename is not None:
82 prof.dump_stats(filename)
83 else:
Georg Brandl8e43fbf2010-08-02 12:20:23 +000084 return prof.print_stats(sort)
Nicholas Bastin1eb4bfc2004-03-22 20:12:56 +000085
Fred Drakeedb5ffb2001-06-08 04:25:24 +000086if hasattr(os, "times"):
87 def _get_time_times(timer=os.times):
88 t = timer()
89 return t[0] + t[1]
90
Martin v. Löwisa4dac402005-03-03 11:39:45 +000091# Using getrusage(3) is better than clock(3) if available:
92# on some systems (e.g. FreeBSD), getrusage has a higher resolution
93# Furthermore, on a POSIX system, returns microseconds, which
94# wrap around after 36min.
95_has_res = 0
96try:
97 import resource
98 resgetrusage = lambda: resource.getrusage(resource.RUSAGE_SELF)
99 def _get_time_resource(timer=resgetrusage):
100 t = timer()
101 return t[0] + t[1]
102 _has_res = 1
103except ImportError:
104 pass
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000105
Guido van Rossumb6775db1994-08-01 11:34:53 +0000106class Profile:
Tim Peters2344fae2001-01-15 00:50:52 +0000107 """Profiler class.
Guido van Rossum54f22ed2000-02-04 15:10:34 +0000108
Tim Peters2344fae2001-01-15 00:50:52 +0000109 self.cur is always a tuple. Each such tuple corresponds to a stack
110 frame that is currently active (self.cur[-2]). The following are the
111 definitions of its members. We use this external "parallel stack" to
112 avoid contaminating the program that we are profiling. (old profiler
113 used to write into the frames local dictionary!!) Derived classes
114 can change the definition of some entries, as long as they leave
Tim Petersdf5cfd82001-10-05 23:15:10 +0000115 [-2:] intact (frame and previous tuple). In case an internal error is
116 detected, the -3 element is used as the function name.
Guido van Rossum54f22ed2000-02-04 15:10:34 +0000117
Tim Petersdf5cfd82001-10-05 23:15:10 +0000118 [ 0] = Time that needs to be charged to the parent frame's function.
119 It is used so that a function call will not have to access the
120 timing data for the parent frame.
121 [ 1] = Total time spent in this frame's function, excluding time in
Tim Peters8d061ed2001-10-07 08:35:44 +0000122 subfunctions (this latter is tallied in cur[2]).
Tim Petersfb163782001-10-07 08:49:02 +0000123 [ 2] = Total time spent in subfunctions, excluding time executing the
Tim Peters8d061ed2001-10-07 08:35:44 +0000124 frame's function (this latter is tallied in cur[1]).
Tim Petersdf5cfd82001-10-05 23:15:10 +0000125 [-3] = Name of the function that corresponds to this frame.
Tim Peters8d061ed2001-10-07 08:35:44 +0000126 [-2] = Actual frame that we correspond to (used to sync exception handling).
127 [-1] = Our parent 6-tuple (corresponds to frame.f_back).
Guido van Rossum54f22ed2000-02-04 15:10:34 +0000128
Tim Peters2344fae2001-01-15 00:50:52 +0000129 Timing data for each function is stored as a 5-tuple in the dictionary
Tim Petersdf5cfd82001-10-05 23:15:10 +0000130 self.timings[]. The index is always the name stored in self.cur[-3].
Tim Peters2344fae2001-01-15 00:50:52 +0000131 The following are the definitions of the members:
Guido van Rossumb6775db1994-08-01 11:34:53 +0000132
Tim Peters2344fae2001-01-15 00:50:52 +0000133 [0] = The number of times this function was called, not counting direct
134 or indirect recursion,
135 [1] = Number of times this function appears on the stack, minus one
136 [2] = Total time spent internal to this function
137 [3] = Cumulative time that this function was present on the stack. In
138 non-recursive functions, this is the total execution time from start
139 to finish of each invocation of a function, including time spent in
140 all subfunctions.
Tim Peters6e221492001-10-07 04:02:36 +0000141 [4] = A dictionary indicating for each function name, the number of times
Tim Peters2344fae2001-01-15 00:50:52 +0000142 it was called by us.
143 """
Guido van Rossumb6775db1994-08-01 11:34:53 +0000144
Tim Peters659a6032001-10-09 20:51:19 +0000145 bias = 0 # calibration constant
146
147 def __init__(self, timer=None, bias=None):
Tim Peters2344fae2001-01-15 00:50:52 +0000148 self.timings = {}
149 self.cur = None
150 self.cmd = ""
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000151 self.c_func_name = ""
Guido van Rossumb6775db1994-08-01 11:34:53 +0000152
Tim Peters659a6032001-10-09 20:51:19 +0000153 if bias is None:
154 bias = self.bias
155 self.bias = bias # Materialize in local dict for lookup speed.
156
Martin v. Löwisa4dac402005-03-03 11:39:45 +0000157 if not timer:
158 if _has_res:
159 self.timer = resgetrusage
160 self.dispatcher = self.trace_dispatch
161 self.get_time = _get_time_resource
Tim Peters2344fae2001-01-15 00:50:52 +0000162 elif hasattr(time, 'clock'):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000163 self.timer = self.get_time = time.clock
Tim Peters2344fae2001-01-15 00:50:52 +0000164 self.dispatcher = self.trace_dispatch_i
165 elif hasattr(os, 'times'):
166 self.timer = os.times
167 self.dispatcher = self.trace_dispatch
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000168 self.get_time = _get_time_times
Tim Peters2344fae2001-01-15 00:50:52 +0000169 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000170 self.timer = self.get_time = time.time
Tim Peters2344fae2001-01-15 00:50:52 +0000171 self.dispatcher = self.trace_dispatch_i
172 else:
173 self.timer = timer
174 t = self.timer() # test out timer function
175 try:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000176 length = len(t)
177 except TypeError:
178 self.get_time = timer
179 self.dispatcher = self.trace_dispatch_i
180 else:
181 if length == 2:
Tim Peters2344fae2001-01-15 00:50:52 +0000182 self.dispatcher = self.trace_dispatch
183 else:
184 self.dispatcher = self.trace_dispatch_l
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000185 # This get_time() implementation needs to be defined
186 # here to capture the passed-in timer in the parameter
187 # list (for performance). Note that we can't assume
188 # the timer() result contains two values in all
189 # cases.
Raymond Hettinger97aa32b2003-10-22 16:49:01 +0000190 def get_time_timer(timer=timer, sum=sum):
191 return sum(timer())
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000192 self.get_time = get_time_timer
Tim Peters2344fae2001-01-15 00:50:52 +0000193 self.t = self.get_time()
194 self.simulate_call('profiler')
Guido van Rossumb6775db1994-08-01 11:34:53 +0000195
Tim Peters2344fae2001-01-15 00:50:52 +0000196 # Heavily optimized dispatch routine for os.times() timer
Guido van Rossumb6775db1994-08-01 11:34:53 +0000197
Tim Peters2344fae2001-01-15 00:50:52 +0000198 def trace_dispatch(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000199 timer = self.timer
200 t = timer()
Tim Peters659a6032001-10-09 20:51:19 +0000201 t = t[0] + t[1] - self.t - self.bias
Tim Peters2344fae2001-01-15 00:50:52 +0000202
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000203 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000204 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000205
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000206 if self.dispatch[event](self, frame,t):
207 t = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000208 self.t = t[0] + t[1]
209 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000210 r = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000211 self.t = r[0] + r[1] - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000212
Tim Peters6e221492001-10-07 04:02:36 +0000213 # Dispatch routine for best timer program (return = scalar, fastest if
214 # an integer but float works too -- and time.clock() relies on that).
Guido van Rossumb6775db1994-08-01 11:34:53 +0000215
Tim Peters2344fae2001-01-15 00:50:52 +0000216 def trace_dispatch_i(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000217 timer = self.timer
Tim Peters659a6032001-10-09 20:51:19 +0000218 t = timer() - self.t - self.bias
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000219
220 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000221 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000222
223 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000224 self.t = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000225 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000226 self.t = timer() - t # put back unrecorded delta
Guido van Rossumcbf3dd51997-10-08 15:23:02 +0000227
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000228 # Dispatch routine for macintosh (timer returns time in ticks of
229 # 1/60th second)
Tim Peters2344fae2001-01-15 00:50:52 +0000230
231 def trace_dispatch_mac(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000232 timer = self.timer
Tim Peters659a6032001-10-09 20:51:19 +0000233 t = timer()/60.0 - self.t - self.bias
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000234
235 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000236 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000237
Tim Peters659a6032001-10-09 20:51:19 +0000238 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000239 self.t = timer()/60.0
Tim Peters2344fae2001-01-15 00:50:52 +0000240 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000241 self.t = timer()/60.0 - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000242
Tim Peters2344fae2001-01-15 00:50:52 +0000243 # SLOW generic dispatch routine for timer returning lists of numbers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000244
Tim Peters2344fae2001-01-15 00:50:52 +0000245 def trace_dispatch_l(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000246 get_time = self.get_time
Tim Peters659a6032001-10-09 20:51:19 +0000247 t = get_time() - self.t - self.bias
Guido van Rossumb6775db1994-08-01 11:34:53 +0000248
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000249 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000250 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000251
Tim Peters659a6032001-10-09 20:51:19 +0000252 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000253 self.t = get_time()
Tim Peters2344fae2001-01-15 00:50:52 +0000254 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000255 self.t = get_time() - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000256
Tim Peters8d061ed2001-10-07 08:35:44 +0000257 # In the event handlers, the first 3 elements of self.cur are unpacked
258 # into vrbls w/ 3-letter names. The last two characters are meant to be
259 # mnemonic:
260 # _pt self.cur[0] "parent time" time to be charged to parent frame
261 # _it self.cur[1] "internal time" time spent directly in the function
262 # _et self.cur[2] "external time" time spent in subfunctions
Guido van Rossumb6775db1994-08-01 11:34:53 +0000263
Tim Peters2344fae2001-01-15 00:50:52 +0000264 def trace_dispatch_exception(self, frame, t):
Tim Peters8d061ed2001-10-07 08:35:44 +0000265 rpt, rit, ret, rfn, rframe, rcur = self.cur
Fred Drakea0bc9992001-10-03 21:12:32 +0000266 if (rframe is not frame) and rcur:
Tim Peters2344fae2001-01-15 00:50:52 +0000267 return self.trace_dispatch_return(rframe, t)
Tim Peters8d061ed2001-10-07 08:35:44 +0000268 self.cur = rpt, rit+t, ret, rfn, rframe, rcur
Guido van Rossumf137f752001-10-04 00:58:24 +0000269 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000270
271
Tim Peters2344fae2001-01-15 00:50:52 +0000272 def trace_dispatch_call(self, frame, t):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000273 if self.cur and frame.f_back is not self.cur[-2]:
Tim Peters8d061ed2001-10-07 08:35:44 +0000274 rpt, rit, ret, rfn, rframe, rcur = self.cur
Guido van Rossumf137f752001-10-04 00:58:24 +0000275 if not isinstance(rframe, Profile.fake_frame):
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000276 assert rframe.f_back is frame.f_back, ("Bad call", rfn,
277 rframe, rframe.f_back,
278 frame, frame.f_back)
Guido van Rossumf137f752001-10-04 00:58:24 +0000279 self.trace_dispatch_return(rframe, 0)
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000280 assert (self.cur is None or \
281 frame.f_back is self.cur[-2]), ("Bad call",
282 self.cur[-3])
Tim Peters2344fae2001-01-15 00:50:52 +0000283 fcode = frame.f_code
284 fn = (fcode.co_filename, fcode.co_firstlineno, fcode.co_name)
285 self.cur = (t, 0, 0, fn, frame, self.cur)
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000286 timings = self.timings
Raymond Hettinger54f02222002-06-01 14:18:47 +0000287 if fn in timings:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000288 cc, ns, tt, ct, callers = timings[fn]
289 timings[fn] = cc, ns + 1, tt, ct, callers
Tim Peters2344fae2001-01-15 00:50:52 +0000290 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000291 timings[fn] = 0, 0, 0, 0, {}
Tim Peters2344fae2001-01-15 00:50:52 +0000292 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000293
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000294 def trace_dispatch_c_call (self, frame, t):
295 fn = ("", 0, self.c_func_name)
296 self.cur = (t, 0, 0, fn, frame, self.cur)
297 timings = self.timings
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000298 if fn in timings:
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000299 cc, ns, tt, ct, callers = timings[fn]
300 timings[fn] = cc, ns+1, tt, ct, callers
301 else:
302 timings[fn] = 0, 0, 0, 0, {}
303 return 1
304
Tim Peters2344fae2001-01-15 00:50:52 +0000305 def trace_dispatch_return(self, frame, t):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000306 if frame is not self.cur[-2]:
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000307 assert frame is self.cur[-2].f_back, ("Bad return", self.cur[-3])
308 self.trace_dispatch_return(self.cur[-2], 0)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000309
Tim Peters8d061ed2001-10-07 08:35:44 +0000310 # Prefix "r" means part of the Returning or exiting frame.
311 # Prefix "p" means part of the Previous or Parent or older frame.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000312
Tim Peters8d061ed2001-10-07 08:35:44 +0000313 rpt, rit, ret, rfn, frame, rcur = self.cur
314 rit = rit + t
315 frame_total = rit + ret
Guido van Rossumb6775db1994-08-01 11:34:53 +0000316
Tim Peters8d061ed2001-10-07 08:35:44 +0000317 ppt, pit, pet, pfn, pframe, pcur = rcur
318 self.cur = ppt, pit + rpt, pet + frame_total, pfn, pframe, pcur
Guido van Rossumb6775db1994-08-01 11:34:53 +0000319
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000320 timings = self.timings
321 cc, ns, tt, ct, callers = timings[rfn]
Tim Peters2344fae2001-01-15 00:50:52 +0000322 if not ns:
Tim Peters8d061ed2001-10-07 08:35:44 +0000323 # This is the only occurrence of the function on the stack.
324 # Else this is a (directly or indirectly) recursive call, and
325 # its cumulative time will get updated when the topmost call to
326 # it returns.
327 ct = ct + frame_total
Tim Peters2344fae2001-01-15 00:50:52 +0000328 cc = cc + 1
Tim Peters8d061ed2001-10-07 08:35:44 +0000329
Raymond Hettinger54f02222002-06-01 14:18:47 +0000330 if pfn in callers:
Tim Peters2344fae2001-01-15 00:50:52 +0000331 callers[pfn] = callers[pfn] + 1 # hack: gather more
332 # stats such as the amount of time added to ct courtesy
333 # of this specific call, and the contribution to cc
334 # courtesy of this call.
335 else:
336 callers[pfn] = 1
Tim Peters8d061ed2001-10-07 08:35:44 +0000337
338 timings[rfn] = cc, ns - 1, tt + rit, ct, callers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000339
Tim Peters2344fae2001-01-15 00:50:52 +0000340 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000341
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000342
343 dispatch = {
344 "call": trace_dispatch_call,
345 "exception": trace_dispatch_exception,
346 "return": trace_dispatch_return,
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000347 "c_call": trace_dispatch_c_call,
Armin Rigof8790242005-09-20 18:50:13 +0000348 "c_exception": trace_dispatch_return, # the C function returned
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000349 "c_return": trace_dispatch_return,
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000350 }
351
352
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000353 # The next few functions play with self.cmd. By carefully preloading
Tim Peters2344fae2001-01-15 00:50:52 +0000354 # our parallel stack, we can force the profiled result to include
355 # an arbitrary string as the name of the calling function.
356 # We use self.cmd as that string, and the resulting stats look
357 # very nice :-).
Guido van Rossumb6775db1994-08-01 11:34:53 +0000358
Tim Peters2344fae2001-01-15 00:50:52 +0000359 def set_cmd(self, cmd):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000360 if self.cur[-1]: return # already set
Tim Peters2344fae2001-01-15 00:50:52 +0000361 self.cmd = cmd
362 self.simulate_call(cmd)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000363
Tim Peters2344fae2001-01-15 00:50:52 +0000364 class fake_code:
365 def __init__(self, filename, line, name):
366 self.co_filename = filename
367 self.co_line = line
368 self.co_name = name
369 self.co_firstlineno = 0
Guido van Rossumb6775db1994-08-01 11:34:53 +0000370
Tim Peters2344fae2001-01-15 00:50:52 +0000371 def __repr__(self):
372 return repr((self.co_filename, self.co_line, self.co_name))
Guido van Rossumb6775db1994-08-01 11:34:53 +0000373
Tim Peters2344fae2001-01-15 00:50:52 +0000374 class fake_frame:
375 def __init__(self, code, prior):
376 self.f_code = code
377 self.f_back = prior
Guido van Rossumb6775db1994-08-01 11:34:53 +0000378
Tim Peters2344fae2001-01-15 00:50:52 +0000379 def simulate_call(self, name):
380 code = self.fake_code('profile', 0, name)
381 if self.cur:
Tim Petersdf5cfd82001-10-05 23:15:10 +0000382 pframe = self.cur[-2]
Tim Peters2344fae2001-01-15 00:50:52 +0000383 else:
384 pframe = None
385 frame = self.fake_frame(code, pframe)
Fred Draked10ed8b2001-10-17 01:49:50 +0000386 self.dispatch['call'](self, frame, 0)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000387
Tim Peters2344fae2001-01-15 00:50:52 +0000388 # collect stats from pending stack, including getting final
389 # timings for self.cmd frame.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000390
Tim Peters2344fae2001-01-15 00:50:52 +0000391 def simulate_cmd_complete(self):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000392 get_time = self.get_time
393 t = get_time() - self.t
Tim Petersdf5cfd82001-10-05 23:15:10 +0000394 while self.cur[-1]:
Tim Peters2344fae2001-01-15 00:50:52 +0000395 # We *can* cause assertion errors here if
396 # dispatch_trace_return checks for a frame match!
Fred Draked10ed8b2001-10-17 01:49:50 +0000397 self.dispatch['return'](self, self.cur[-2], t)
Tim Peters2344fae2001-01-15 00:50:52 +0000398 t = 0
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000399 self.t = get_time() - t
Guido van Rossumb6775db1994-08-01 11:34:53 +0000400
401
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000402 def print_stats(self, sort=-1):
Tim Peters2344fae2001-01-15 00:50:52 +0000403 import pstats
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000404 pstats.Stats(self).strip_dirs().sort_stats(sort). \
Tim Peters2344fae2001-01-15 00:50:52 +0000405 print_stats()
Guido van Rossumb6775db1994-08-01 11:34:53 +0000406
Tim Peters2344fae2001-01-15 00:50:52 +0000407 def dump_stats(self, file):
408 f = open(file, 'wb')
409 self.create_stats()
410 marshal.dump(self.stats, f)
411 f.close()
412
413 def create_stats(self):
414 self.simulate_cmd_complete()
415 self.snapshot_stats()
416
417 def snapshot_stats(self):
418 self.stats = {}
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000419 for func, (cc, ns, tt, ct, callers) in self.timings.items():
Tim Peters2344fae2001-01-15 00:50:52 +0000420 callers = callers.copy()
421 nc = 0
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000422 for callcnt in callers.values():
Raymond Hettingere0d49722002-06-02 18:55:56 +0000423 nc += callcnt
Tim Peters2344fae2001-01-15 00:50:52 +0000424 self.stats[func] = cc, nc, tt, ct, callers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000425
426
Tim Peters2344fae2001-01-15 00:50:52 +0000427 # The following two methods can be called by clients to use
428 # a profiler to profile a statement, given as a string.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000429
Tim Peters2344fae2001-01-15 00:50:52 +0000430 def run(self, cmd):
431 import __main__
432 dict = __main__.__dict__
433 return self.runctx(cmd, dict, dict)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000434
Tim Peters2344fae2001-01-15 00:50:52 +0000435 def runctx(self, cmd, globals, locals):
436 self.set_cmd(cmd)
437 sys.setprofile(self.dispatcher)
438 try:
Georg Brandl7cae87c2006-09-06 06:51:57 +0000439 exec(cmd, globals, locals)
Tim Peters2344fae2001-01-15 00:50:52 +0000440 finally:
441 sys.setprofile(None)
442 return self
Guido van Rossumb6775db1994-08-01 11:34:53 +0000443
Tim Peters2344fae2001-01-15 00:50:52 +0000444 # This method is more useful to profile a single function call.
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000445 def runcall(self, func, *args, **kw):
Walter Dörwald70a6b492004-02-12 17:35:32 +0000446 self.set_cmd(repr(func))
Tim Peters2344fae2001-01-15 00:50:52 +0000447 sys.setprofile(self.dispatcher)
448 try:
Guido van Rossum68468eb2003-02-27 20:14:51 +0000449 return func(*args, **kw)
Tim Peters2344fae2001-01-15 00:50:52 +0000450 finally:
451 sys.setprofile(None)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000452
Tim Peters2344fae2001-01-15 00:50:52 +0000453
454 #******************************************************************
455 # The following calculates the overhead for using a profiler. The
456 # problem is that it takes a fair amount of time for the profiler
457 # to stop the stopwatch (from the time it receives an event).
458 # Similarly, there is a delay from the time that the profiler
459 # re-starts the stopwatch before the user's code really gets to
460 # continue. The following code tries to measure the difference on
Tim Peters659a6032001-10-09 20:51:19 +0000461 # a per-event basis.
462 #
463 # Note that this difference is only significant if there are a lot of
Tim Peters2344fae2001-01-15 00:50:52 +0000464 # events, and relatively little user code per event. For example,
465 # code with small functions will typically benefit from having the
466 # profiler calibrated for the current platform. This *could* be
467 # done on the fly during init() time, but it is not worth the
468 # effort. Also note that if too large a value specified, then
469 # execution time on some functions will actually appear as a
470 # negative number. It is *normal* for some functions (with very
471 # low call counts) to have such negative stats, even if the
472 # calibration figure is "correct."
473 #
474 # One alternative to profile-time calibration adjustments (i.e.,
475 # adding in the magic little delta during each event) is to track
476 # more carefully the number of events (and cumulatively, the number
477 # of events during sub functions) that are seen. If this were
478 # done, then the arithmetic could be done after the fact (i.e., at
479 # display time). Currently, we track only call/return events.
480 # These values can be deduced by examining the callees and callers
481 # vectors for each functions. Hence we *can* almost correct the
482 # internal time figure at print time (note that we currently don't
483 # track exception event processing counts). Unfortunately, there
484 # is currently no similar information for cumulative sub-function
485 # time. It would not be hard to "get all this info" at profiler
486 # time. Specifically, we would have to extend the tuples to keep
487 # counts of this in each frame, and then extend the defs of timing
488 # tuples to include the significant two figures. I'm a bit fearful
489 # that this additional feature will slow the heavily optimized
490 # event/time ratio (i.e., the profiler would run slower, fur a very
491 # low "value added" feature.)
Tim Peters2344fae2001-01-15 00:50:52 +0000492 #**************************************************************
493
Tim Peterscce092d2001-10-09 05:31:56 +0000494 def calibrate(self, m, verbose=0):
Tim Peters659a6032001-10-09 20:51:19 +0000495 if self.__class__ is not Profile:
496 raise TypeError("Subclasses must override .calibrate().")
497
498 saved_bias = self.bias
499 self.bias = 0
500 try:
Tim Peterse13cc922001-10-09 21:01:31 +0000501 return self._calibrate_inner(m, verbose)
Tim Peters659a6032001-10-09 20:51:19 +0000502 finally:
503 self.bias = saved_bias
504
Tim Peterse13cc922001-10-09 21:01:31 +0000505 def _calibrate_inner(self, m, verbose):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000506 get_time = self.get_time
Tim Peters2344fae2001-01-15 00:50:52 +0000507
Tim Peterscce092d2001-10-09 05:31:56 +0000508 # Set up a test case to be run with and without profiling. Include
509 # lots of calls, because we're trying to quantify stopwatch overhead.
510 # Do not raise any exceptions, though, because we want to know
511 # exactly how many profile events are generated (one call event, +
512 # one return event, per Python-level call).
Tim Peters2344fae2001-01-15 00:50:52 +0000513
Tim Peterscce092d2001-10-09 05:31:56 +0000514 def f1(n):
515 for i in range(n):
516 x = 1
Tim Peters2344fae2001-01-15 00:50:52 +0000517
Tim Peterscce092d2001-10-09 05:31:56 +0000518 def f(m, f1=f1):
519 for i in range(m):
520 f1(100)
Tim Peters2344fae2001-01-15 00:50:52 +0000521
Tim Peterscce092d2001-10-09 05:31:56 +0000522 f(m) # warm up the cache
523
524 # elapsed_noprofile <- time f(m) takes without profiling.
525 t0 = get_time()
526 f(m)
527 t1 = get_time()
528 elapsed_noprofile = t1 - t0
529 if verbose:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000530 print("elapsed time without profiling =", elapsed_noprofile)
Tim Peterscce092d2001-10-09 05:31:56 +0000531
532 # elapsed_profile <- time f(m) takes with profiling. The difference
533 # is profiling overhead, only some of which the profiler subtracts
534 # out on its own.
535 p = Profile()
536 t0 = get_time()
537 p.runctx('f(m)', globals(), locals())
538 t1 = get_time()
539 elapsed_profile = t1 - t0
540 if verbose:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000541 print("elapsed time with profiling =", elapsed_profile)
Tim Peterscce092d2001-10-09 05:31:56 +0000542
543 # reported_time <- "CPU seconds" the profiler charged to f and f1.
544 total_calls = 0.0
545 reported_time = 0.0
546 for (filename, line, funcname), (cc, ns, tt, ct, callers) in \
547 p.timings.items():
548 if funcname in ("f", "f1"):
549 total_calls += cc
550 reported_time += tt
551
552 if verbose:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000553 print("'CPU seconds' profiler reported =", reported_time)
554 print("total # calls =", total_calls)
Tim Peterscce092d2001-10-09 05:31:56 +0000555 if total_calls != m + 1:
556 raise ValueError("internal error: total calls = %d" % total_calls)
557
558 # reported_time - elapsed_noprofile = overhead the profiler wasn't
559 # able to measure. Divide by twice the number of calls (since there
560 # are two profiler events per call in this test) to get the hidden
561 # overhead per event.
562 mean = (reported_time - elapsed_noprofile) / 2.0 / total_calls
563 if verbose:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000564 print("mean stopwatch overhead per profile event =", mean)
Tim Peterscce092d2001-10-09 05:31:56 +0000565 return mean
Guido van Rossumb6775db1994-08-01 11:34:53 +0000566
Guido van Rossumb6775db1994-08-01 11:34:53 +0000567#****************************************************************************
Guido van Rossumcc778eb1996-10-01 02:55:54 +0000568
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000569def main():
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000570 usage = "profile.py [-o output_file_path] [-s sort] scriptfile [arg] ..."
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000571 parser = OptionParser(usage=usage)
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000572 parser.allow_interspersed_args = False
Tim Peters4e0e1b62004-07-07 20:54:48 +0000573 parser.add_option('-o', '--outfile', dest="outfile",
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000574 help="Save stats to <outfile>", default=None)
575 parser.add_option('-s', '--sort', dest="sort",
Georg Brandl8e43fbf2010-08-02 12:20:23 +0000576 help="Sort order when printing to stdout, based on pstats.Stats class",
577 default=-1)
Tim Petersb497c102005-01-10 16:48:37 +0000578
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000579 if not sys.argv[1:]:
580 parser.print_usage()
581 sys.exit(2)
Tim Petersb497c102005-01-10 16:48:37 +0000582
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000583 (options, args) = parser.parse_args()
Georg Brandl8e43fbf2010-08-02 12:20:23 +0000584 sys.argv[:] = args
Tim Petersb497c102005-01-10 16:48:37 +0000585
Georg Brandl8e43fbf2010-08-02 12:20:23 +0000586 if len(args) > 0:
587 progname = args[0]
588 sys.path.insert(0, os.path.dirname(progname))
589 with open(progname, 'rb') as fp:
590 code = compile(fp.read(), progname, 'exec')
591 globs = {
592 '__file__': progname,
593 '__name__': '__main__',
594 '__package__': None,
595 '__cached__': None,
596 }
597 runctx(code, globs, None, options.outfile, options.sort)
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000598 else:
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000599 parser.print_usage()
600 return parser
601
602# When invoked as main program, invoke the profiler on a script
603if __name__ == '__main__':
604 main()