blob: 743e77d7bf2908a0a95ddfc4a73b414fd26676be [file] [log] [blame]
Benjamin Peterson90f5ba52010-03-11 22:53:45 +00001#! /usr/bin/env python3
Guido van Rossum81762581992-04-21 15:36:23 +00002#
Guido van Rossumb6775db1994-08-01 11:34:53 +00003# Class for profiling python code. rev 1.0 6/2/94
Guido van Rossum81762581992-04-21 15:36:23 +00004#
Benjamin Peterson8d770692011-06-27 09:14:34 -05005# Written by James Roskind
Guido van Rossumb6775db1994-08-01 11:34:53 +00006# Based on prior profile module by Sjoerd Mullender...
7# which was hacked somewhat by: Guido van Rossum
Guido van Rossumb6775db1994-08-01 11:34:53 +00008
Guido van Rossum54f22ed2000-02-04 15:10:34 +00009"""Class for profiling Python code."""
Guido van Rossumb6775db1994-08-01 11:34:53 +000010
Benjamin Peterson8d770692011-06-27 09:14:34 -050011# Copyright Disney Enterprises, Inc. All Rights Reserved.
12# Licensed to PSF under a Contributor Agreement
Benjamin Peterson0f93d3d2011-06-27 09:18:46 -050013#
Benjamin Peterson8d770692011-06-27 09:14:34 -050014# Licensed under the Apache License, Version 2.0 (the "License");
15# you may not use this file except in compliance with the License.
16# You may obtain a copy of the License at
Benjamin Peterson0f93d3d2011-06-27 09:18:46 -050017#
Benjamin Peterson8d770692011-06-27 09:14:34 -050018# http://www.apache.org/licenses/LICENSE-2.0
Benjamin Peterson0f93d3d2011-06-27 09:18:46 -050019#
Benjamin Peterson8d770692011-06-27 09:14:34 -050020# Unless required by applicable law or agreed to in writing, software
21# distributed under the License is distributed on an "AS IS" BASIS,
22# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
23# either express or implied. See the License for the specific language
24# governing permissions and limitations under the License.
Guido van Rossumb6775db1994-08-01 11:34:53 +000025
Guido van Rossum81762581992-04-21 15:36:23 +000026
27import sys
Guido van Rossum4e160981992-09-02 20:43:20 +000028import os
Guido van Rossumb6775db1994-08-01 11:34:53 +000029import time
Guido van Rossum4e160981992-09-02 20:43:20 +000030import marshal
Nicholas Bastin824b1b22004-03-23 18:44:39 +000031from optparse import OptionParser
Guido van Rossum81762581992-04-21 15:36:23 +000032
Georg Brandlb6b13242009-09-04 17:15:16 +000033__all__ = ["run", "runctx", "Profile"]
Guido van Rossum81762581992-04-21 15:36:23 +000034
Tim Peters2344fae2001-01-15 00:50:52 +000035# Sample timer for use with
Guido van Rossumb6775db1994-08-01 11:34:53 +000036#i_count = 0
37#def integer_timer():
Tim Peters2344fae2001-01-15 00:50:52 +000038# global i_count
39# i_count = i_count + 1
40# return i_count
Guido van Rossumb6775db1994-08-01 11:34:53 +000041#itimes = integer_timer # replace with C coded timer returning integers
Guido van Rossum81762581992-04-21 15:36:23 +000042
Guido van Rossumb6775db1994-08-01 11:34:53 +000043#**************************************************************************
44# The following are the static member functions for the profiler class
45# Note that an instance of Profile() is *not* needed to call them.
46#**************************************************************************
Guido van Rossum81762581992-04-21 15:36:23 +000047
Nicholas Bastin824b1b22004-03-23 18:44:39 +000048def run(statement, filename=None, sort=-1):
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000049 """Run statement under profiler optionally saving results in filename
Guido van Rossum4e160981992-09-02 20:43:20 +000050
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000051 This function takes a single argument that can be passed to the
52 "exec" statement, and an optional file name. In all cases this
53 routine attempts to "exec" its first argument and gather profiling
54 statistics from the execution. If no file name is present, then this
55 function automatically prints a simple profiling report, sorted by the
56 standard name string (file/line/function-name) that is presented in
57 each line.
58 """
Tim Peters2344fae2001-01-15 00:50:52 +000059 prof = Profile()
60 try:
61 prof = prof.run(statement)
62 except SystemExit:
63 pass
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000064 if filename is not None:
65 prof.dump_stats(filename)
Tim Peters2344fae2001-01-15 00:50:52 +000066 else:
Nicholas Bastin824b1b22004-03-23 18:44:39 +000067 return prof.print_stats(sort)
Guido van Rossume61fa0a1993-10-22 13:56:35 +000068
Georg Brandl8e43fbf2010-08-02 12:20:23 +000069def runctx(statement, globals, locals, filename=None, sort=-1):
Nicholas Bastin1eb4bfc2004-03-22 20:12:56 +000070 """Run statement under profiler, supplying your own globals and locals,
71 optionally saving results in filename.
72
73 statement and filename have the same semantics as profile.run
74 """
75 prof = Profile()
76 try:
77 prof = prof.runctx(statement, globals, locals)
78 except SystemExit:
79 pass
80
81 if filename is not None:
82 prof.dump_stats(filename)
83 else:
Georg Brandl8e43fbf2010-08-02 12:20:23 +000084 return prof.print_stats(sort)
Nicholas Bastin1eb4bfc2004-03-22 20:12:56 +000085
Guido van Rossumb6775db1994-08-01 11:34:53 +000086class Profile:
Tim Peters2344fae2001-01-15 00:50:52 +000087 """Profiler class.
Guido van Rossum54f22ed2000-02-04 15:10:34 +000088
Tim Peters2344fae2001-01-15 00:50:52 +000089 self.cur is always a tuple. Each such tuple corresponds to a stack
90 frame that is currently active (self.cur[-2]). The following are the
91 definitions of its members. We use this external "parallel stack" to
92 avoid contaminating the program that we are profiling. (old profiler
93 used to write into the frames local dictionary!!) Derived classes
94 can change the definition of some entries, as long as they leave
Tim Petersdf5cfd82001-10-05 23:15:10 +000095 [-2:] intact (frame and previous tuple). In case an internal error is
96 detected, the -3 element is used as the function name.
Guido van Rossum54f22ed2000-02-04 15:10:34 +000097
Tim Petersdf5cfd82001-10-05 23:15:10 +000098 [ 0] = Time that needs to be charged to the parent frame's function.
99 It is used so that a function call will not have to access the
100 timing data for the parent frame.
101 [ 1] = Total time spent in this frame's function, excluding time in
Tim Peters8d061ed2001-10-07 08:35:44 +0000102 subfunctions (this latter is tallied in cur[2]).
Tim Petersfb163782001-10-07 08:49:02 +0000103 [ 2] = Total time spent in subfunctions, excluding time executing the
Tim Peters8d061ed2001-10-07 08:35:44 +0000104 frame's function (this latter is tallied in cur[1]).
Tim Petersdf5cfd82001-10-05 23:15:10 +0000105 [-3] = Name of the function that corresponds to this frame.
Tim Peters8d061ed2001-10-07 08:35:44 +0000106 [-2] = Actual frame that we correspond to (used to sync exception handling).
107 [-1] = Our parent 6-tuple (corresponds to frame.f_back).
Guido van Rossum54f22ed2000-02-04 15:10:34 +0000108
Tim Peters2344fae2001-01-15 00:50:52 +0000109 Timing data for each function is stored as a 5-tuple in the dictionary
Tim Petersdf5cfd82001-10-05 23:15:10 +0000110 self.timings[]. The index is always the name stored in self.cur[-3].
Tim Peters2344fae2001-01-15 00:50:52 +0000111 The following are the definitions of the members:
Guido van Rossumb6775db1994-08-01 11:34:53 +0000112
Tim Peters2344fae2001-01-15 00:50:52 +0000113 [0] = The number of times this function was called, not counting direct
114 or indirect recursion,
115 [1] = Number of times this function appears on the stack, minus one
116 [2] = Total time spent internal to this function
117 [3] = Cumulative time that this function was present on the stack. In
118 non-recursive functions, this is the total execution time from start
119 to finish of each invocation of a function, including time spent in
120 all subfunctions.
Tim Peters6e221492001-10-07 04:02:36 +0000121 [4] = A dictionary indicating for each function name, the number of times
Tim Peters2344fae2001-01-15 00:50:52 +0000122 it was called by us.
123 """
Guido van Rossumb6775db1994-08-01 11:34:53 +0000124
Tim Peters659a6032001-10-09 20:51:19 +0000125 bias = 0 # calibration constant
126
127 def __init__(self, timer=None, bias=None):
Tim Peters2344fae2001-01-15 00:50:52 +0000128 self.timings = {}
129 self.cur = None
130 self.cmd = ""
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000131 self.c_func_name = ""
Guido van Rossumb6775db1994-08-01 11:34:53 +0000132
Tim Peters659a6032001-10-09 20:51:19 +0000133 if bias is None:
134 bias = self.bias
135 self.bias = bias # Materialize in local dict for lookup speed.
136
Martin v. Löwisa4dac402005-03-03 11:39:45 +0000137 if not timer:
Victor Stinnerfe98e2f2012-04-29 03:01:20 +0200138 self.timer = self.get_time = time.process_time
139 self.dispatcher = self.trace_dispatch_i
Tim Peters2344fae2001-01-15 00:50:52 +0000140 else:
141 self.timer = timer
142 t = self.timer() # test out timer function
143 try:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000144 length = len(t)
145 except TypeError:
146 self.get_time = timer
147 self.dispatcher = self.trace_dispatch_i
148 else:
149 if length == 2:
Tim Peters2344fae2001-01-15 00:50:52 +0000150 self.dispatcher = self.trace_dispatch
151 else:
152 self.dispatcher = self.trace_dispatch_l
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000153 # This get_time() implementation needs to be defined
154 # here to capture the passed-in timer in the parameter
155 # list (for performance). Note that we can't assume
156 # the timer() result contains two values in all
157 # cases.
Raymond Hettinger97aa32b2003-10-22 16:49:01 +0000158 def get_time_timer(timer=timer, sum=sum):
159 return sum(timer())
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000160 self.get_time = get_time_timer
Tim Peters2344fae2001-01-15 00:50:52 +0000161 self.t = self.get_time()
162 self.simulate_call('profiler')
Guido van Rossumb6775db1994-08-01 11:34:53 +0000163
Tim Peters2344fae2001-01-15 00:50:52 +0000164 # Heavily optimized dispatch routine for os.times() timer
Guido van Rossumb6775db1994-08-01 11:34:53 +0000165
Tim Peters2344fae2001-01-15 00:50:52 +0000166 def trace_dispatch(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000167 timer = self.timer
168 t = timer()
Tim Peters659a6032001-10-09 20:51:19 +0000169 t = t[0] + t[1] - self.t - self.bias
Tim Peters2344fae2001-01-15 00:50:52 +0000170
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000171 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000172 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000173
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000174 if self.dispatch[event](self, frame,t):
175 t = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000176 self.t = t[0] + t[1]
177 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000178 r = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000179 self.t = r[0] + r[1] - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000180
Tim Peters6e221492001-10-07 04:02:36 +0000181 # Dispatch routine for best timer program (return = scalar, fastest if
182 # an integer but float works too -- and time.clock() relies on that).
Guido van Rossumb6775db1994-08-01 11:34:53 +0000183
Tim Peters2344fae2001-01-15 00:50:52 +0000184 def trace_dispatch_i(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000185 timer = self.timer
Tim Peters659a6032001-10-09 20:51:19 +0000186 t = timer() - self.t - self.bias
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000187
188 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000189 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000190
191 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000192 self.t = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000193 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000194 self.t = timer() - t # put back unrecorded delta
Guido van Rossumcbf3dd51997-10-08 15:23:02 +0000195
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000196 # Dispatch routine for macintosh (timer returns time in ticks of
197 # 1/60th second)
Tim Peters2344fae2001-01-15 00:50:52 +0000198
199 def trace_dispatch_mac(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000200 timer = self.timer
Tim Peters659a6032001-10-09 20:51:19 +0000201 t = timer()/60.0 - self.t - self.bias
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000202
203 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000204 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000205
Tim Peters659a6032001-10-09 20:51:19 +0000206 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000207 self.t = timer()/60.0
Tim Peters2344fae2001-01-15 00:50:52 +0000208 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000209 self.t = timer()/60.0 - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000210
Tim Peters2344fae2001-01-15 00:50:52 +0000211 # SLOW generic dispatch routine for timer returning lists of numbers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000212
Tim Peters2344fae2001-01-15 00:50:52 +0000213 def trace_dispatch_l(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000214 get_time = self.get_time
Tim Peters659a6032001-10-09 20:51:19 +0000215 t = get_time() - self.t - self.bias
Guido van Rossumb6775db1994-08-01 11:34:53 +0000216
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000217 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000218 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000219
Tim Peters659a6032001-10-09 20:51:19 +0000220 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000221 self.t = get_time()
Tim Peters2344fae2001-01-15 00:50:52 +0000222 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000223 self.t = get_time() - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000224
Tim Peters8d061ed2001-10-07 08:35:44 +0000225 # In the event handlers, the first 3 elements of self.cur are unpacked
226 # into vrbls w/ 3-letter names. The last two characters are meant to be
227 # mnemonic:
228 # _pt self.cur[0] "parent time" time to be charged to parent frame
229 # _it self.cur[1] "internal time" time spent directly in the function
230 # _et self.cur[2] "external time" time spent in subfunctions
Guido van Rossumb6775db1994-08-01 11:34:53 +0000231
Tim Peters2344fae2001-01-15 00:50:52 +0000232 def trace_dispatch_exception(self, frame, t):
Tim Peters8d061ed2001-10-07 08:35:44 +0000233 rpt, rit, ret, rfn, rframe, rcur = self.cur
Fred Drakea0bc9992001-10-03 21:12:32 +0000234 if (rframe is not frame) and rcur:
Tim Peters2344fae2001-01-15 00:50:52 +0000235 return self.trace_dispatch_return(rframe, t)
Tim Peters8d061ed2001-10-07 08:35:44 +0000236 self.cur = rpt, rit+t, ret, rfn, rframe, rcur
Guido van Rossumf137f752001-10-04 00:58:24 +0000237 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000238
239
Tim Peters2344fae2001-01-15 00:50:52 +0000240 def trace_dispatch_call(self, frame, t):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000241 if self.cur and frame.f_back is not self.cur[-2]:
Tim Peters8d061ed2001-10-07 08:35:44 +0000242 rpt, rit, ret, rfn, rframe, rcur = self.cur
Guido van Rossumf137f752001-10-04 00:58:24 +0000243 if not isinstance(rframe, Profile.fake_frame):
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000244 assert rframe.f_back is frame.f_back, ("Bad call", rfn,
245 rframe, rframe.f_back,
246 frame, frame.f_back)
Guido van Rossumf137f752001-10-04 00:58:24 +0000247 self.trace_dispatch_return(rframe, 0)
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000248 assert (self.cur is None or \
249 frame.f_back is self.cur[-2]), ("Bad call",
250 self.cur[-3])
Tim Peters2344fae2001-01-15 00:50:52 +0000251 fcode = frame.f_code
252 fn = (fcode.co_filename, fcode.co_firstlineno, fcode.co_name)
253 self.cur = (t, 0, 0, fn, frame, self.cur)
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000254 timings = self.timings
Raymond Hettinger54f02222002-06-01 14:18:47 +0000255 if fn in timings:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000256 cc, ns, tt, ct, callers = timings[fn]
257 timings[fn] = cc, ns + 1, tt, ct, callers
Tim Peters2344fae2001-01-15 00:50:52 +0000258 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000259 timings[fn] = 0, 0, 0, 0, {}
Tim Peters2344fae2001-01-15 00:50:52 +0000260 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000261
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000262 def trace_dispatch_c_call (self, frame, t):
263 fn = ("", 0, self.c_func_name)
264 self.cur = (t, 0, 0, fn, frame, self.cur)
265 timings = self.timings
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000266 if fn in timings:
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000267 cc, ns, tt, ct, callers = timings[fn]
268 timings[fn] = cc, ns+1, tt, ct, callers
269 else:
270 timings[fn] = 0, 0, 0, 0, {}
271 return 1
272
Tim Peters2344fae2001-01-15 00:50:52 +0000273 def trace_dispatch_return(self, frame, t):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000274 if frame is not self.cur[-2]:
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000275 assert frame is self.cur[-2].f_back, ("Bad return", self.cur[-3])
276 self.trace_dispatch_return(self.cur[-2], 0)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000277
Tim Peters8d061ed2001-10-07 08:35:44 +0000278 # Prefix "r" means part of the Returning or exiting frame.
279 # Prefix "p" means part of the Previous or Parent or older frame.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000280
Tim Peters8d061ed2001-10-07 08:35:44 +0000281 rpt, rit, ret, rfn, frame, rcur = self.cur
282 rit = rit + t
283 frame_total = rit + ret
Guido van Rossumb6775db1994-08-01 11:34:53 +0000284
Tim Peters8d061ed2001-10-07 08:35:44 +0000285 ppt, pit, pet, pfn, pframe, pcur = rcur
286 self.cur = ppt, pit + rpt, pet + frame_total, pfn, pframe, pcur
Guido van Rossumb6775db1994-08-01 11:34:53 +0000287
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000288 timings = self.timings
289 cc, ns, tt, ct, callers = timings[rfn]
Tim Peters2344fae2001-01-15 00:50:52 +0000290 if not ns:
Tim Peters8d061ed2001-10-07 08:35:44 +0000291 # This is the only occurrence of the function on the stack.
292 # Else this is a (directly or indirectly) recursive call, and
293 # its cumulative time will get updated when the topmost call to
294 # it returns.
295 ct = ct + frame_total
Tim Peters2344fae2001-01-15 00:50:52 +0000296 cc = cc + 1
Tim Peters8d061ed2001-10-07 08:35:44 +0000297
Raymond Hettinger54f02222002-06-01 14:18:47 +0000298 if pfn in callers:
Tim Peters2344fae2001-01-15 00:50:52 +0000299 callers[pfn] = callers[pfn] + 1 # hack: gather more
300 # stats such as the amount of time added to ct courtesy
301 # of this specific call, and the contribution to cc
302 # courtesy of this call.
303 else:
304 callers[pfn] = 1
Tim Peters8d061ed2001-10-07 08:35:44 +0000305
306 timings[rfn] = cc, ns - 1, tt + rit, ct, callers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000307
Tim Peters2344fae2001-01-15 00:50:52 +0000308 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000309
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000310
311 dispatch = {
312 "call": trace_dispatch_call,
313 "exception": trace_dispatch_exception,
314 "return": trace_dispatch_return,
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000315 "c_call": trace_dispatch_c_call,
Armin Rigof8790242005-09-20 18:50:13 +0000316 "c_exception": trace_dispatch_return, # the C function returned
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000317 "c_return": trace_dispatch_return,
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000318 }
319
320
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000321 # The next few functions play with self.cmd. By carefully preloading
Tim Peters2344fae2001-01-15 00:50:52 +0000322 # our parallel stack, we can force the profiled result to include
323 # an arbitrary string as the name of the calling function.
324 # We use self.cmd as that string, and the resulting stats look
325 # very nice :-).
Guido van Rossumb6775db1994-08-01 11:34:53 +0000326
Tim Peters2344fae2001-01-15 00:50:52 +0000327 def set_cmd(self, cmd):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000328 if self.cur[-1]: return # already set
Tim Peters2344fae2001-01-15 00:50:52 +0000329 self.cmd = cmd
330 self.simulate_call(cmd)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000331
Tim Peters2344fae2001-01-15 00:50:52 +0000332 class fake_code:
333 def __init__(self, filename, line, name):
334 self.co_filename = filename
335 self.co_line = line
336 self.co_name = name
337 self.co_firstlineno = 0
Guido van Rossumb6775db1994-08-01 11:34:53 +0000338
Tim Peters2344fae2001-01-15 00:50:52 +0000339 def __repr__(self):
340 return repr((self.co_filename, self.co_line, self.co_name))
Guido van Rossumb6775db1994-08-01 11:34:53 +0000341
Tim Peters2344fae2001-01-15 00:50:52 +0000342 class fake_frame:
343 def __init__(self, code, prior):
344 self.f_code = code
345 self.f_back = prior
Guido van Rossumb6775db1994-08-01 11:34:53 +0000346
Tim Peters2344fae2001-01-15 00:50:52 +0000347 def simulate_call(self, name):
348 code = self.fake_code('profile', 0, name)
349 if self.cur:
Tim Petersdf5cfd82001-10-05 23:15:10 +0000350 pframe = self.cur[-2]
Tim Peters2344fae2001-01-15 00:50:52 +0000351 else:
352 pframe = None
353 frame = self.fake_frame(code, pframe)
Fred Draked10ed8b2001-10-17 01:49:50 +0000354 self.dispatch['call'](self, frame, 0)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000355
Tim Peters2344fae2001-01-15 00:50:52 +0000356 # collect stats from pending stack, including getting final
357 # timings for self.cmd frame.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000358
Tim Peters2344fae2001-01-15 00:50:52 +0000359 def simulate_cmd_complete(self):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000360 get_time = self.get_time
361 t = get_time() - self.t
Tim Petersdf5cfd82001-10-05 23:15:10 +0000362 while self.cur[-1]:
Tim Peters2344fae2001-01-15 00:50:52 +0000363 # We *can* cause assertion errors here if
364 # dispatch_trace_return checks for a frame match!
Fred Draked10ed8b2001-10-17 01:49:50 +0000365 self.dispatch['return'](self, self.cur[-2], t)
Tim Peters2344fae2001-01-15 00:50:52 +0000366 t = 0
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000367 self.t = get_time() - t
Guido van Rossumb6775db1994-08-01 11:34:53 +0000368
369
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000370 def print_stats(self, sort=-1):
Tim Peters2344fae2001-01-15 00:50:52 +0000371 import pstats
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000372 pstats.Stats(self).strip_dirs().sort_stats(sort). \
Tim Peters2344fae2001-01-15 00:50:52 +0000373 print_stats()
Guido van Rossumb6775db1994-08-01 11:34:53 +0000374
Tim Peters2344fae2001-01-15 00:50:52 +0000375 def dump_stats(self, file):
376 f = open(file, 'wb')
377 self.create_stats()
378 marshal.dump(self.stats, f)
379 f.close()
380
381 def create_stats(self):
382 self.simulate_cmd_complete()
383 self.snapshot_stats()
384
385 def snapshot_stats(self):
386 self.stats = {}
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000387 for func, (cc, ns, tt, ct, callers) in self.timings.items():
Tim Peters2344fae2001-01-15 00:50:52 +0000388 callers = callers.copy()
389 nc = 0
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000390 for callcnt in callers.values():
Raymond Hettingere0d49722002-06-02 18:55:56 +0000391 nc += callcnt
Tim Peters2344fae2001-01-15 00:50:52 +0000392 self.stats[func] = cc, nc, tt, ct, callers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000393
394
Tim Peters2344fae2001-01-15 00:50:52 +0000395 # The following two methods can be called by clients to use
396 # a profiler to profile a statement, given as a string.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000397
Tim Peters2344fae2001-01-15 00:50:52 +0000398 def run(self, cmd):
399 import __main__
400 dict = __main__.__dict__
401 return self.runctx(cmd, dict, dict)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000402
Tim Peters2344fae2001-01-15 00:50:52 +0000403 def runctx(self, cmd, globals, locals):
404 self.set_cmd(cmd)
405 sys.setprofile(self.dispatcher)
406 try:
Georg Brandl7cae87c2006-09-06 06:51:57 +0000407 exec(cmd, globals, locals)
Tim Peters2344fae2001-01-15 00:50:52 +0000408 finally:
409 sys.setprofile(None)
410 return self
Guido van Rossumb6775db1994-08-01 11:34:53 +0000411
Tim Peters2344fae2001-01-15 00:50:52 +0000412 # This method is more useful to profile a single function call.
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000413 def runcall(self, func, *args, **kw):
Walter Dörwald70a6b492004-02-12 17:35:32 +0000414 self.set_cmd(repr(func))
Tim Peters2344fae2001-01-15 00:50:52 +0000415 sys.setprofile(self.dispatcher)
416 try:
Guido van Rossum68468eb2003-02-27 20:14:51 +0000417 return func(*args, **kw)
Tim Peters2344fae2001-01-15 00:50:52 +0000418 finally:
419 sys.setprofile(None)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000420
Tim Peters2344fae2001-01-15 00:50:52 +0000421
422 #******************************************************************
423 # The following calculates the overhead for using a profiler. The
424 # problem is that it takes a fair amount of time for the profiler
425 # to stop the stopwatch (from the time it receives an event).
426 # Similarly, there is a delay from the time that the profiler
427 # re-starts the stopwatch before the user's code really gets to
428 # continue. The following code tries to measure the difference on
Tim Peters659a6032001-10-09 20:51:19 +0000429 # a per-event basis.
430 #
431 # Note that this difference is only significant if there are a lot of
Tim Peters2344fae2001-01-15 00:50:52 +0000432 # events, and relatively little user code per event. For example,
433 # code with small functions will typically benefit from having the
434 # profiler calibrated for the current platform. This *could* be
435 # done on the fly during init() time, but it is not worth the
436 # effort. Also note that if too large a value specified, then
437 # execution time on some functions will actually appear as a
438 # negative number. It is *normal* for some functions (with very
439 # low call counts) to have such negative stats, even if the
440 # calibration figure is "correct."
441 #
442 # One alternative to profile-time calibration adjustments (i.e.,
443 # adding in the magic little delta during each event) is to track
444 # more carefully the number of events (and cumulatively, the number
445 # of events during sub functions) that are seen. If this were
446 # done, then the arithmetic could be done after the fact (i.e., at
447 # display time). Currently, we track only call/return events.
448 # These values can be deduced by examining the callees and callers
449 # vectors for each functions. Hence we *can* almost correct the
450 # internal time figure at print time (note that we currently don't
451 # track exception event processing counts). Unfortunately, there
452 # is currently no similar information for cumulative sub-function
453 # time. It would not be hard to "get all this info" at profiler
454 # time. Specifically, we would have to extend the tuples to keep
455 # counts of this in each frame, and then extend the defs of timing
456 # tuples to include the significant two figures. I'm a bit fearful
457 # that this additional feature will slow the heavily optimized
458 # event/time ratio (i.e., the profiler would run slower, fur a very
459 # low "value added" feature.)
Tim Peters2344fae2001-01-15 00:50:52 +0000460 #**************************************************************
461
Tim Peterscce092d2001-10-09 05:31:56 +0000462 def calibrate(self, m, verbose=0):
Tim Peters659a6032001-10-09 20:51:19 +0000463 if self.__class__ is not Profile:
464 raise TypeError("Subclasses must override .calibrate().")
465
466 saved_bias = self.bias
467 self.bias = 0
468 try:
Tim Peterse13cc922001-10-09 21:01:31 +0000469 return self._calibrate_inner(m, verbose)
Tim Peters659a6032001-10-09 20:51:19 +0000470 finally:
471 self.bias = saved_bias
472
Tim Peterse13cc922001-10-09 21:01:31 +0000473 def _calibrate_inner(self, m, verbose):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000474 get_time = self.get_time
Tim Peters2344fae2001-01-15 00:50:52 +0000475
Tim Peterscce092d2001-10-09 05:31:56 +0000476 # Set up a test case to be run with and without profiling. Include
477 # lots of calls, because we're trying to quantify stopwatch overhead.
478 # Do not raise any exceptions, though, because we want to know
479 # exactly how many profile events are generated (one call event, +
480 # one return event, per Python-level call).
Tim Peters2344fae2001-01-15 00:50:52 +0000481
Tim Peterscce092d2001-10-09 05:31:56 +0000482 def f1(n):
483 for i in range(n):
484 x = 1
Tim Peters2344fae2001-01-15 00:50:52 +0000485
Tim Peterscce092d2001-10-09 05:31:56 +0000486 def f(m, f1=f1):
487 for i in range(m):
488 f1(100)
Tim Peters2344fae2001-01-15 00:50:52 +0000489
Tim Peterscce092d2001-10-09 05:31:56 +0000490 f(m) # warm up the cache
491
492 # elapsed_noprofile <- time f(m) takes without profiling.
493 t0 = get_time()
494 f(m)
495 t1 = get_time()
496 elapsed_noprofile = t1 - t0
497 if verbose:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000498 print("elapsed time without profiling =", elapsed_noprofile)
Tim Peterscce092d2001-10-09 05:31:56 +0000499
500 # elapsed_profile <- time f(m) takes with profiling. The difference
501 # is profiling overhead, only some of which the profiler subtracts
502 # out on its own.
503 p = Profile()
504 t0 = get_time()
505 p.runctx('f(m)', globals(), locals())
506 t1 = get_time()
507 elapsed_profile = t1 - t0
508 if verbose:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000509 print("elapsed time with profiling =", elapsed_profile)
Tim Peterscce092d2001-10-09 05:31:56 +0000510
511 # reported_time <- "CPU seconds" the profiler charged to f and f1.
512 total_calls = 0.0
513 reported_time = 0.0
514 for (filename, line, funcname), (cc, ns, tt, ct, callers) in \
515 p.timings.items():
516 if funcname in ("f", "f1"):
517 total_calls += cc
518 reported_time += tt
519
520 if verbose:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000521 print("'CPU seconds' profiler reported =", reported_time)
522 print("total # calls =", total_calls)
Tim Peterscce092d2001-10-09 05:31:56 +0000523 if total_calls != m + 1:
524 raise ValueError("internal error: total calls = %d" % total_calls)
525
526 # reported_time - elapsed_noprofile = overhead the profiler wasn't
527 # able to measure. Divide by twice the number of calls (since there
528 # are two profiler events per call in this test) to get the hidden
529 # overhead per event.
530 mean = (reported_time - elapsed_noprofile) / 2.0 / total_calls
531 if verbose:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000532 print("mean stopwatch overhead per profile event =", mean)
Tim Peterscce092d2001-10-09 05:31:56 +0000533 return mean
Guido van Rossumb6775db1994-08-01 11:34:53 +0000534
Guido van Rossumb6775db1994-08-01 11:34:53 +0000535#****************************************************************************
Guido van Rossumcc778eb1996-10-01 02:55:54 +0000536
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000537def main():
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000538 usage = "profile.py [-o output_file_path] [-s sort] scriptfile [arg] ..."
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000539 parser = OptionParser(usage=usage)
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000540 parser.allow_interspersed_args = False
Tim Peters4e0e1b62004-07-07 20:54:48 +0000541 parser.add_option('-o', '--outfile', dest="outfile",
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000542 help="Save stats to <outfile>", default=None)
543 parser.add_option('-s', '--sort', dest="sort",
Georg Brandl8e43fbf2010-08-02 12:20:23 +0000544 help="Sort order when printing to stdout, based on pstats.Stats class",
545 default=-1)
Tim Petersb497c102005-01-10 16:48:37 +0000546
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000547 if not sys.argv[1:]:
548 parser.print_usage()
549 sys.exit(2)
Tim Petersb497c102005-01-10 16:48:37 +0000550
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000551 (options, args) = parser.parse_args()
Georg Brandl8e43fbf2010-08-02 12:20:23 +0000552 sys.argv[:] = args
Tim Petersb497c102005-01-10 16:48:37 +0000553
Georg Brandl8e43fbf2010-08-02 12:20:23 +0000554 if len(args) > 0:
555 progname = args[0]
556 sys.path.insert(0, os.path.dirname(progname))
557 with open(progname, 'rb') as fp:
558 code = compile(fp.read(), progname, 'exec')
559 globs = {
560 '__file__': progname,
561 '__name__': '__main__',
562 '__package__': None,
563 '__cached__': None,
564 }
565 runctx(code, globs, None, options.outfile, options.sort)
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000566 else:
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000567 parser.print_usage()
568 return parser
569
570# When invoked as main program, invoke the profiler on a script
571if __name__ == '__main__':
572 main()