blob: 297aa04cf7cf3f624b8aa7c6d0077c7ee8c8e9e2 [file] [log] [blame]
Guido van Rossumf06ee5f1996-11-27 19:52:01 +00001#! /usr/bin/env python
Guido van Rossum81762581992-04-21 15:36:23 +00002#
Guido van Rossumb6775db1994-08-01 11:34:53 +00003# Class for profiling python code. rev 1.0 6/2/94
Guido van Rossum81762581992-04-21 15:36:23 +00004#
Benjamin Peterson7e6b3aa2011-06-27 09:14:34 -05005# Written by James Roskind
Guido van Rossumb6775db1994-08-01 11:34:53 +00006# Based on prior profile module by Sjoerd Mullender...
7# which was hacked somewhat by: Guido van Rossum
Guido van Rossumb6775db1994-08-01 11:34:53 +00008
Guido van Rossum54f22ed2000-02-04 15:10:34 +00009"""Class for profiling Python code."""
Guido van Rossumb6775db1994-08-01 11:34:53 +000010
Benjamin Peterson7e6b3aa2011-06-27 09:14:34 -050011# Copyright Disney Enterprises, Inc. All Rights Reserved.
12# Licensed to PSF under a Contributor Agreement
Benjamin Petersoncfb77312011-06-27 09:18:46 -050013#
Benjamin Peterson7e6b3aa2011-06-27 09:14:34 -050014# Licensed under the Apache License, Version 2.0 (the "License");
15# you may not use this file except in compliance with the License.
16# You may obtain a copy of the License at
Benjamin Petersoncfb77312011-06-27 09:18:46 -050017#
Benjamin Peterson7e6b3aa2011-06-27 09:14:34 -050018# http://www.apache.org/licenses/LICENSE-2.0
Benjamin Petersoncfb77312011-06-27 09:18:46 -050019#
Benjamin Peterson7e6b3aa2011-06-27 09:14:34 -050020# Unless required by applicable law or agreed to in writing, software
21# distributed under the License is distributed on an "AS IS" BASIS,
22# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
23# either express or implied. See the License for the specific language
24# governing permissions and limitations under the License.
Guido van Rossumb6775db1994-08-01 11:34:53 +000025
Guido van Rossum81762581992-04-21 15:36:23 +000026
27import sys
Guido van Rossum4e160981992-09-02 20:43:20 +000028import os
Guido van Rossumb6775db1994-08-01 11:34:53 +000029import time
Guido van Rossum4e160981992-09-02 20:43:20 +000030import marshal
Nicholas Bastin824b1b22004-03-23 18:44:39 +000031from optparse import OptionParser
Guido van Rossum81762581992-04-21 15:36:23 +000032
Guido van Rossum48713e82004-03-23 19:19:21 +000033__all__ = ["run", "runctx", "help", "Profile"]
Guido van Rossum81762581992-04-21 15:36:23 +000034
Tim Peters2344fae2001-01-15 00:50:52 +000035# Sample timer for use with
Guido van Rossumb6775db1994-08-01 11:34:53 +000036#i_count = 0
37#def integer_timer():
Tim Peters2344fae2001-01-15 00:50:52 +000038# global i_count
39# i_count = i_count + 1
40# return i_count
Guido van Rossumb6775db1994-08-01 11:34:53 +000041#itimes = integer_timer # replace with C coded timer returning integers
Guido van Rossum81762581992-04-21 15:36:23 +000042
Guido van Rossumb6775db1994-08-01 11:34:53 +000043#**************************************************************************
44# The following are the static member functions for the profiler class
45# Note that an instance of Profile() is *not* needed to call them.
46#**************************************************************************
Guido van Rossum81762581992-04-21 15:36:23 +000047
Nicholas Bastin824b1b22004-03-23 18:44:39 +000048def run(statement, filename=None, sort=-1):
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000049 """Run statement under profiler optionally saving results in filename
Guido van Rossum4e160981992-09-02 20:43:20 +000050
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000051 This function takes a single argument that can be passed to the
52 "exec" statement, and an optional file name. In all cases this
53 routine attempts to "exec" its first argument and gather profiling
54 statistics from the execution. If no file name is present, then this
55 function automatically prints a simple profiling report, sorted by the
56 standard name string (file/line/function-name) that is presented in
57 each line.
58 """
Tim Peters2344fae2001-01-15 00:50:52 +000059 prof = Profile()
60 try:
61 prof = prof.run(statement)
62 except SystemExit:
63 pass
Jeremy Hyltonadcf8a02001-03-14 20:01:19 +000064 if filename is not None:
65 prof.dump_stats(filename)
Tim Peters2344fae2001-01-15 00:50:52 +000066 else:
Nicholas Bastin824b1b22004-03-23 18:44:39 +000067 return prof.print_stats(sort)
Guido van Rossume61fa0a1993-10-22 13:56:35 +000068
Florent Xicluna92847452010-09-13 17:36:36 +000069def runctx(statement, globals, locals, filename=None, sort=-1):
Nicholas Bastin1eb4bfc2004-03-22 20:12:56 +000070 """Run statement under profiler, supplying your own globals and locals,
71 optionally saving results in filename.
72
73 statement and filename have the same semantics as profile.run
74 """
75 prof = Profile()
76 try:
77 prof = prof.runctx(statement, globals, locals)
78 except SystemExit:
79 pass
80
81 if filename is not None:
82 prof.dump_stats(filename)
83 else:
Florent Xicluna92847452010-09-13 17:36:36 +000084 return prof.print_stats(sort)
Nicholas Bastin1eb4bfc2004-03-22 20:12:56 +000085
Johannes Gijsbersc0b194a2005-01-10 09:07:22 +000086# Backwards compatibility.
Guido van Rossume61fa0a1993-10-22 13:56:35 +000087def help():
Johannes Gijsbersc0b194a2005-01-10 09:07:22 +000088 print "Documentation for the profile module can be found "
89 print "in the Python Library Reference, section 'The Python Profiler'."
Guido van Rossumb6775db1994-08-01 11:34:53 +000090
Fred Drakeedb5ffb2001-06-08 04:25:24 +000091if hasattr(os, "times"):
92 def _get_time_times(timer=os.times):
93 t = timer()
94 return t[0] + t[1]
95
Martin v. Löwisa4dac402005-03-03 11:39:45 +000096# Using getrusage(3) is better than clock(3) if available:
97# on some systems (e.g. FreeBSD), getrusage has a higher resolution
98# Furthermore, on a POSIX system, returns microseconds, which
99# wrap around after 36min.
100_has_res = 0
101try:
102 import resource
103 resgetrusage = lambda: resource.getrusage(resource.RUSAGE_SELF)
104 def _get_time_resource(timer=resgetrusage):
105 t = timer()
106 return t[0] + t[1]
107 _has_res = 1
108except ImportError:
109 pass
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000110
Guido van Rossumb6775db1994-08-01 11:34:53 +0000111class Profile:
Tim Peters2344fae2001-01-15 00:50:52 +0000112 """Profiler class.
Guido van Rossum54f22ed2000-02-04 15:10:34 +0000113
Tim Peters2344fae2001-01-15 00:50:52 +0000114 self.cur is always a tuple. Each such tuple corresponds to a stack
115 frame that is currently active (self.cur[-2]). The following are the
116 definitions of its members. We use this external "parallel stack" to
117 avoid contaminating the program that we are profiling. (old profiler
118 used to write into the frames local dictionary!!) Derived classes
119 can change the definition of some entries, as long as they leave
Tim Petersdf5cfd82001-10-05 23:15:10 +0000120 [-2:] intact (frame and previous tuple). In case an internal error is
121 detected, the -3 element is used as the function name.
Guido van Rossum54f22ed2000-02-04 15:10:34 +0000122
Tim Petersdf5cfd82001-10-05 23:15:10 +0000123 [ 0] = Time that needs to be charged to the parent frame's function.
124 It is used so that a function call will not have to access the
125 timing data for the parent frame.
126 [ 1] = Total time spent in this frame's function, excluding time in
Tim Peters8d061ed2001-10-07 08:35:44 +0000127 subfunctions (this latter is tallied in cur[2]).
Tim Petersfb163782001-10-07 08:49:02 +0000128 [ 2] = Total time spent in subfunctions, excluding time executing the
Tim Peters8d061ed2001-10-07 08:35:44 +0000129 frame's function (this latter is tallied in cur[1]).
Tim Petersdf5cfd82001-10-05 23:15:10 +0000130 [-3] = Name of the function that corresponds to this frame.
Tim Peters8d061ed2001-10-07 08:35:44 +0000131 [-2] = Actual frame that we correspond to (used to sync exception handling).
132 [-1] = Our parent 6-tuple (corresponds to frame.f_back).
Guido van Rossum54f22ed2000-02-04 15:10:34 +0000133
Tim Peters2344fae2001-01-15 00:50:52 +0000134 Timing data for each function is stored as a 5-tuple in the dictionary
Tim Petersdf5cfd82001-10-05 23:15:10 +0000135 self.timings[]. The index is always the name stored in self.cur[-3].
Tim Peters2344fae2001-01-15 00:50:52 +0000136 The following are the definitions of the members:
Guido van Rossumb6775db1994-08-01 11:34:53 +0000137
Tim Peters2344fae2001-01-15 00:50:52 +0000138 [0] = The number of times this function was called, not counting direct
139 or indirect recursion,
140 [1] = Number of times this function appears on the stack, minus one
141 [2] = Total time spent internal to this function
142 [3] = Cumulative time that this function was present on the stack. In
143 non-recursive functions, this is the total execution time from start
144 to finish of each invocation of a function, including time spent in
145 all subfunctions.
Tim Peters6e221492001-10-07 04:02:36 +0000146 [4] = A dictionary indicating for each function name, the number of times
Tim Peters2344fae2001-01-15 00:50:52 +0000147 it was called by us.
148 """
Guido van Rossumb6775db1994-08-01 11:34:53 +0000149
Tim Peters659a6032001-10-09 20:51:19 +0000150 bias = 0 # calibration constant
151
152 def __init__(self, timer=None, bias=None):
Tim Peters2344fae2001-01-15 00:50:52 +0000153 self.timings = {}
154 self.cur = None
155 self.cmd = ""
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000156 self.c_func_name = ""
Guido van Rossumb6775db1994-08-01 11:34:53 +0000157
Tim Peters659a6032001-10-09 20:51:19 +0000158 if bias is None:
159 bias = self.bias
160 self.bias = bias # Materialize in local dict for lookup speed.
161
Martin v. Löwisa4dac402005-03-03 11:39:45 +0000162 if not timer:
163 if _has_res:
164 self.timer = resgetrusage
165 self.dispatcher = self.trace_dispatch
166 self.get_time = _get_time_resource
Tim Peters2344fae2001-01-15 00:50:52 +0000167 elif hasattr(time, 'clock'):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000168 self.timer = self.get_time = time.clock
Tim Peters2344fae2001-01-15 00:50:52 +0000169 self.dispatcher = self.trace_dispatch_i
170 elif hasattr(os, 'times'):
171 self.timer = os.times
172 self.dispatcher = self.trace_dispatch
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000173 self.get_time = _get_time_times
Tim Peters2344fae2001-01-15 00:50:52 +0000174 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000175 self.timer = self.get_time = time.time
Tim Peters2344fae2001-01-15 00:50:52 +0000176 self.dispatcher = self.trace_dispatch_i
177 else:
178 self.timer = timer
179 t = self.timer() # test out timer function
180 try:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000181 length = len(t)
182 except TypeError:
183 self.get_time = timer
184 self.dispatcher = self.trace_dispatch_i
185 else:
186 if length == 2:
Tim Peters2344fae2001-01-15 00:50:52 +0000187 self.dispatcher = self.trace_dispatch
188 else:
189 self.dispatcher = self.trace_dispatch_l
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000190 # This get_time() implementation needs to be defined
191 # here to capture the passed-in timer in the parameter
192 # list (for performance). Note that we can't assume
193 # the timer() result contains two values in all
194 # cases.
Raymond Hettinger97aa32b2003-10-22 16:49:01 +0000195 def get_time_timer(timer=timer, sum=sum):
196 return sum(timer())
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000197 self.get_time = get_time_timer
Tim Peters2344fae2001-01-15 00:50:52 +0000198 self.t = self.get_time()
199 self.simulate_call('profiler')
Guido van Rossumb6775db1994-08-01 11:34:53 +0000200
Tim Peters2344fae2001-01-15 00:50:52 +0000201 # Heavily optimized dispatch routine for os.times() timer
Guido van Rossumb6775db1994-08-01 11:34:53 +0000202
Tim Peters2344fae2001-01-15 00:50:52 +0000203 def trace_dispatch(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000204 timer = self.timer
205 t = timer()
Tim Peters659a6032001-10-09 20:51:19 +0000206 t = t[0] + t[1] - self.t - self.bias
Tim Peters2344fae2001-01-15 00:50:52 +0000207
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000208 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000209 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000210
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000211 if self.dispatch[event](self, frame,t):
212 t = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000213 self.t = t[0] + t[1]
214 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000215 r = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000216 self.t = r[0] + r[1] - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000217
Tim Peters6e221492001-10-07 04:02:36 +0000218 # Dispatch routine for best timer program (return = scalar, fastest if
219 # an integer but float works too -- and time.clock() relies on that).
Guido van Rossumb6775db1994-08-01 11:34:53 +0000220
Tim Peters2344fae2001-01-15 00:50:52 +0000221 def trace_dispatch_i(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000222 timer = self.timer
Tim Peters659a6032001-10-09 20:51:19 +0000223 t = timer() - self.t - self.bias
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000224
225 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000226 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000227
228 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000229 self.t = timer()
Tim Peters2344fae2001-01-15 00:50:52 +0000230 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000231 self.t = timer() - t # put back unrecorded delta
Guido van Rossumcbf3dd51997-10-08 15:23:02 +0000232
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000233 # Dispatch routine for macintosh (timer returns time in ticks of
234 # 1/60th second)
Tim Peters2344fae2001-01-15 00:50:52 +0000235
236 def trace_dispatch_mac(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000237 timer = self.timer
Tim Peters659a6032001-10-09 20:51:19 +0000238 t = timer()/60.0 - self.t - self.bias
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000239
240 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000241 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000242
Tim Peters659a6032001-10-09 20:51:19 +0000243 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000244 self.t = timer()/60.0
Tim Peters2344fae2001-01-15 00:50:52 +0000245 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000246 self.t = timer()/60.0 - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000247
Tim Peters2344fae2001-01-15 00:50:52 +0000248 # SLOW generic dispatch routine for timer returning lists of numbers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000249
Tim Peters2344fae2001-01-15 00:50:52 +0000250 def trace_dispatch_l(self, frame, event, arg):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000251 get_time = self.get_time
Tim Peters659a6032001-10-09 20:51:19 +0000252 t = get_time() - self.t - self.bias
Guido van Rossumb6775db1994-08-01 11:34:53 +0000253
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000254 if event == "c_call":
Nicholas Bastin12ac3e12004-07-12 23:38:02 +0000255 self.c_func_name = arg.__name__
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000256
Tim Peters659a6032001-10-09 20:51:19 +0000257 if self.dispatch[event](self, frame, t):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000258 self.t = get_time()
Tim Peters2344fae2001-01-15 00:50:52 +0000259 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000260 self.t = get_time() - t # put back unrecorded delta
Guido van Rossumb6775db1994-08-01 11:34:53 +0000261
Tim Peters8d061ed2001-10-07 08:35:44 +0000262 # In the event handlers, the first 3 elements of self.cur are unpacked
263 # into vrbls w/ 3-letter names. The last two characters are meant to be
264 # mnemonic:
265 # _pt self.cur[0] "parent time" time to be charged to parent frame
266 # _it self.cur[1] "internal time" time spent directly in the function
267 # _et self.cur[2] "external time" time spent in subfunctions
Guido van Rossumb6775db1994-08-01 11:34:53 +0000268
Tim Peters2344fae2001-01-15 00:50:52 +0000269 def trace_dispatch_exception(self, frame, t):
Tim Peters8d061ed2001-10-07 08:35:44 +0000270 rpt, rit, ret, rfn, rframe, rcur = self.cur
Fred Drakea0bc9992001-10-03 21:12:32 +0000271 if (rframe is not frame) and rcur:
Tim Peters2344fae2001-01-15 00:50:52 +0000272 return self.trace_dispatch_return(rframe, t)
Tim Peters8d061ed2001-10-07 08:35:44 +0000273 self.cur = rpt, rit+t, ret, rfn, rframe, rcur
Guido van Rossumf137f752001-10-04 00:58:24 +0000274 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000275
276
Tim Peters2344fae2001-01-15 00:50:52 +0000277 def trace_dispatch_call(self, frame, t):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000278 if self.cur and frame.f_back is not self.cur[-2]:
Tim Peters8d061ed2001-10-07 08:35:44 +0000279 rpt, rit, ret, rfn, rframe, rcur = self.cur
Guido van Rossumf137f752001-10-04 00:58:24 +0000280 if not isinstance(rframe, Profile.fake_frame):
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000281 assert rframe.f_back is frame.f_back, ("Bad call", rfn,
282 rframe, rframe.f_back,
283 frame, frame.f_back)
Guido van Rossumf137f752001-10-04 00:58:24 +0000284 self.trace_dispatch_return(rframe, 0)
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000285 assert (self.cur is None or \
286 frame.f_back is self.cur[-2]), ("Bad call",
287 self.cur[-3])
Tim Peters2344fae2001-01-15 00:50:52 +0000288 fcode = frame.f_code
289 fn = (fcode.co_filename, fcode.co_firstlineno, fcode.co_name)
290 self.cur = (t, 0, 0, fn, frame, self.cur)
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000291 timings = self.timings
Raymond Hettinger54f02222002-06-01 14:18:47 +0000292 if fn in timings:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000293 cc, ns, tt, ct, callers = timings[fn]
294 timings[fn] = cc, ns + 1, tt, ct, callers
Tim Peters2344fae2001-01-15 00:50:52 +0000295 else:
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000296 timings[fn] = 0, 0, 0, 0, {}
Tim Peters2344fae2001-01-15 00:50:52 +0000297 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000298
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000299 def trace_dispatch_c_call (self, frame, t):
300 fn = ("", 0, self.c_func_name)
301 self.cur = (t, 0, 0, fn, frame, self.cur)
302 timings = self.timings
Brett Cannoncc2f7b42008-08-03 22:38:19 +0000303 if fn in timings:
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000304 cc, ns, tt, ct, callers = timings[fn]
305 timings[fn] = cc, ns+1, tt, ct, callers
306 else:
307 timings[fn] = 0, 0, 0, 0, {}
308 return 1
309
Tim Peters2344fae2001-01-15 00:50:52 +0000310 def trace_dispatch_return(self, frame, t):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000311 if frame is not self.cur[-2]:
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000312 assert frame is self.cur[-2].f_back, ("Bad return", self.cur[-3])
313 self.trace_dispatch_return(self.cur[-2], 0)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000314
Tim Peters8d061ed2001-10-07 08:35:44 +0000315 # Prefix "r" means part of the Returning or exiting frame.
316 # Prefix "p" means part of the Previous or Parent or older frame.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000317
Tim Peters8d061ed2001-10-07 08:35:44 +0000318 rpt, rit, ret, rfn, frame, rcur = self.cur
319 rit = rit + t
320 frame_total = rit + ret
Guido van Rossumb6775db1994-08-01 11:34:53 +0000321
Tim Peters8d061ed2001-10-07 08:35:44 +0000322 ppt, pit, pet, pfn, pframe, pcur = rcur
323 self.cur = ppt, pit + rpt, pet + frame_total, pfn, pframe, pcur
Guido van Rossumb6775db1994-08-01 11:34:53 +0000324
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000325 timings = self.timings
326 cc, ns, tt, ct, callers = timings[rfn]
Tim Peters2344fae2001-01-15 00:50:52 +0000327 if not ns:
Tim Peters8d061ed2001-10-07 08:35:44 +0000328 # This is the only occurrence of the function on the stack.
329 # Else this is a (directly or indirectly) recursive call, and
330 # its cumulative time will get updated when the topmost call to
331 # it returns.
332 ct = ct + frame_total
Tim Peters2344fae2001-01-15 00:50:52 +0000333 cc = cc + 1
Tim Peters8d061ed2001-10-07 08:35:44 +0000334
Raymond Hettinger54f02222002-06-01 14:18:47 +0000335 if pfn in callers:
Tim Peters2344fae2001-01-15 00:50:52 +0000336 callers[pfn] = callers[pfn] + 1 # hack: gather more
337 # stats such as the amount of time added to ct courtesy
338 # of this specific call, and the contribution to cc
339 # courtesy of this call.
340 else:
341 callers[pfn] = 1
Tim Peters8d061ed2001-10-07 08:35:44 +0000342
343 timings[rfn] = cc, ns - 1, tt + rit, ct, callers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000344
Tim Peters2344fae2001-01-15 00:50:52 +0000345 return 1
Guido van Rossumb6775db1994-08-01 11:34:53 +0000346
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000347
348 dispatch = {
349 "call": trace_dispatch_call,
350 "exception": trace_dispatch_exception,
351 "return": trace_dispatch_return,
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000352 "c_call": trace_dispatch_c_call,
Armin Rigof8790242005-09-20 18:50:13 +0000353 "c_exception": trace_dispatch_return, # the C function returned
Nicholas Bastinc69ebe82004-03-24 21:57:10 +0000354 "c_return": trace_dispatch_return,
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000355 }
356
357
Tim Petersdb1ed2a2001-10-07 04:30:53 +0000358 # The next few functions play with self.cmd. By carefully preloading
Tim Peters2344fae2001-01-15 00:50:52 +0000359 # our parallel stack, we can force the profiled result to include
360 # an arbitrary string as the name of the calling function.
361 # We use self.cmd as that string, and the resulting stats look
362 # very nice :-).
Guido van Rossumb6775db1994-08-01 11:34:53 +0000363
Tim Peters2344fae2001-01-15 00:50:52 +0000364 def set_cmd(self, cmd):
Tim Petersdf5cfd82001-10-05 23:15:10 +0000365 if self.cur[-1]: return # already set
Tim Peters2344fae2001-01-15 00:50:52 +0000366 self.cmd = cmd
367 self.simulate_call(cmd)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000368
Tim Peters2344fae2001-01-15 00:50:52 +0000369 class fake_code:
370 def __init__(self, filename, line, name):
371 self.co_filename = filename
372 self.co_line = line
373 self.co_name = name
374 self.co_firstlineno = 0
Guido van Rossumb6775db1994-08-01 11:34:53 +0000375
Tim Peters2344fae2001-01-15 00:50:52 +0000376 def __repr__(self):
377 return repr((self.co_filename, self.co_line, self.co_name))
Guido van Rossumb6775db1994-08-01 11:34:53 +0000378
Tim Peters2344fae2001-01-15 00:50:52 +0000379 class fake_frame:
380 def __init__(self, code, prior):
381 self.f_code = code
382 self.f_back = prior
Guido van Rossumb6775db1994-08-01 11:34:53 +0000383
Tim Peters2344fae2001-01-15 00:50:52 +0000384 def simulate_call(self, name):
385 code = self.fake_code('profile', 0, name)
386 if self.cur:
Tim Petersdf5cfd82001-10-05 23:15:10 +0000387 pframe = self.cur[-2]
Tim Peters2344fae2001-01-15 00:50:52 +0000388 else:
389 pframe = None
390 frame = self.fake_frame(code, pframe)
Fred Draked10ed8b2001-10-17 01:49:50 +0000391 self.dispatch['call'](self, frame, 0)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000392
Tim Peters2344fae2001-01-15 00:50:52 +0000393 # collect stats from pending stack, including getting final
394 # timings for self.cmd frame.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000395
Tim Peters2344fae2001-01-15 00:50:52 +0000396 def simulate_cmd_complete(self):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000397 get_time = self.get_time
398 t = get_time() - self.t
Tim Petersdf5cfd82001-10-05 23:15:10 +0000399 while self.cur[-1]:
Tim Peters2344fae2001-01-15 00:50:52 +0000400 # We *can* cause assertion errors here if
401 # dispatch_trace_return checks for a frame match!
Fred Draked10ed8b2001-10-17 01:49:50 +0000402 self.dispatch['return'](self, self.cur[-2], t)
Tim Peters2344fae2001-01-15 00:50:52 +0000403 t = 0
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000404 self.t = get_time() - t
Guido van Rossumb6775db1994-08-01 11:34:53 +0000405
406
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000407 def print_stats(self, sort=-1):
Tim Peters2344fae2001-01-15 00:50:52 +0000408 import pstats
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000409 pstats.Stats(self).strip_dirs().sort_stats(sort). \
Tim Peters2344fae2001-01-15 00:50:52 +0000410 print_stats()
Guido van Rossumb6775db1994-08-01 11:34:53 +0000411
Tim Peters2344fae2001-01-15 00:50:52 +0000412 def dump_stats(self, file):
413 f = open(file, 'wb')
414 self.create_stats()
415 marshal.dump(self.stats, f)
416 f.close()
417
418 def create_stats(self):
419 self.simulate_cmd_complete()
420 self.snapshot_stats()
421
422 def snapshot_stats(self):
423 self.stats = {}
Raymond Hettingere0d49722002-06-02 18:55:56 +0000424 for func, (cc, ns, tt, ct, callers) in self.timings.iteritems():
Tim Peters2344fae2001-01-15 00:50:52 +0000425 callers = callers.copy()
426 nc = 0
Raymond Hettingere0d49722002-06-02 18:55:56 +0000427 for callcnt in callers.itervalues():
428 nc += callcnt
Tim Peters2344fae2001-01-15 00:50:52 +0000429 self.stats[func] = cc, nc, tt, ct, callers
Guido van Rossumb6775db1994-08-01 11:34:53 +0000430
431
Tim Peters2344fae2001-01-15 00:50:52 +0000432 # The following two methods can be called by clients to use
433 # a profiler to profile a statement, given as a string.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000434
Tim Peters2344fae2001-01-15 00:50:52 +0000435 def run(self, cmd):
436 import __main__
437 dict = __main__.__dict__
438 return self.runctx(cmd, dict, dict)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000439
Tim Peters2344fae2001-01-15 00:50:52 +0000440 def runctx(self, cmd, globals, locals):
441 self.set_cmd(cmd)
442 sys.setprofile(self.dispatcher)
443 try:
444 exec cmd in globals, locals
445 finally:
446 sys.setprofile(None)
447 return self
Guido van Rossumb6775db1994-08-01 11:34:53 +0000448
Tim Peters2344fae2001-01-15 00:50:52 +0000449 # This method is more useful to profile a single function call.
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000450 def runcall(self, func, *args, **kw):
Walter Dörwald70a6b492004-02-12 17:35:32 +0000451 self.set_cmd(repr(func))
Tim Peters2344fae2001-01-15 00:50:52 +0000452 sys.setprofile(self.dispatcher)
453 try:
Guido van Rossum68468eb2003-02-27 20:14:51 +0000454 return func(*args, **kw)
Tim Peters2344fae2001-01-15 00:50:52 +0000455 finally:
456 sys.setprofile(None)
Guido van Rossumb6775db1994-08-01 11:34:53 +0000457
Tim Peters2344fae2001-01-15 00:50:52 +0000458
459 #******************************************************************
460 # The following calculates the overhead for using a profiler. The
461 # problem is that it takes a fair amount of time for the profiler
462 # to stop the stopwatch (from the time it receives an event).
463 # Similarly, there is a delay from the time that the profiler
464 # re-starts the stopwatch before the user's code really gets to
465 # continue. The following code tries to measure the difference on
Tim Peters659a6032001-10-09 20:51:19 +0000466 # a per-event basis.
467 #
468 # Note that this difference is only significant if there are a lot of
Tim Peters2344fae2001-01-15 00:50:52 +0000469 # events, and relatively little user code per event. For example,
470 # code with small functions will typically benefit from having the
471 # profiler calibrated for the current platform. This *could* be
472 # done on the fly during init() time, but it is not worth the
473 # effort. Also note that if too large a value specified, then
474 # execution time on some functions will actually appear as a
475 # negative number. It is *normal* for some functions (with very
476 # low call counts) to have such negative stats, even if the
477 # calibration figure is "correct."
478 #
479 # One alternative to profile-time calibration adjustments (i.e.,
480 # adding in the magic little delta during each event) is to track
481 # more carefully the number of events (and cumulatively, the number
482 # of events during sub functions) that are seen. If this were
483 # done, then the arithmetic could be done after the fact (i.e., at
484 # display time). Currently, we track only call/return events.
485 # These values can be deduced by examining the callees and callers
486 # vectors for each functions. Hence we *can* almost correct the
487 # internal time figure at print time (note that we currently don't
488 # track exception event processing counts). Unfortunately, there
489 # is currently no similar information for cumulative sub-function
490 # time. It would not be hard to "get all this info" at profiler
491 # time. Specifically, we would have to extend the tuples to keep
492 # counts of this in each frame, and then extend the defs of timing
493 # tuples to include the significant two figures. I'm a bit fearful
494 # that this additional feature will slow the heavily optimized
495 # event/time ratio (i.e., the profiler would run slower, fur a very
496 # low "value added" feature.)
Tim Peters2344fae2001-01-15 00:50:52 +0000497 #**************************************************************
498
Tim Peterscce092d2001-10-09 05:31:56 +0000499 def calibrate(self, m, verbose=0):
Tim Peters659a6032001-10-09 20:51:19 +0000500 if self.__class__ is not Profile:
501 raise TypeError("Subclasses must override .calibrate().")
502
503 saved_bias = self.bias
504 self.bias = 0
505 try:
Tim Peterse13cc922001-10-09 21:01:31 +0000506 return self._calibrate_inner(m, verbose)
Tim Peters659a6032001-10-09 20:51:19 +0000507 finally:
508 self.bias = saved_bias
509
Tim Peterse13cc922001-10-09 21:01:31 +0000510 def _calibrate_inner(self, m, verbose):
Fred Drakeedb5ffb2001-06-08 04:25:24 +0000511 get_time = self.get_time
Tim Peters2344fae2001-01-15 00:50:52 +0000512
Tim Peterscce092d2001-10-09 05:31:56 +0000513 # Set up a test case to be run with and without profiling. Include
514 # lots of calls, because we're trying to quantify stopwatch overhead.
515 # Do not raise any exceptions, though, because we want to know
516 # exactly how many profile events are generated (one call event, +
517 # one return event, per Python-level call).
Tim Peters2344fae2001-01-15 00:50:52 +0000518
Tim Peterscce092d2001-10-09 05:31:56 +0000519 def f1(n):
520 for i in range(n):
521 x = 1
Tim Peters2344fae2001-01-15 00:50:52 +0000522
Tim Peterscce092d2001-10-09 05:31:56 +0000523 def f(m, f1=f1):
524 for i in range(m):
525 f1(100)
Tim Peters2344fae2001-01-15 00:50:52 +0000526
Tim Peterscce092d2001-10-09 05:31:56 +0000527 f(m) # warm up the cache
528
529 # elapsed_noprofile <- time f(m) takes without profiling.
530 t0 = get_time()
531 f(m)
532 t1 = get_time()
533 elapsed_noprofile = t1 - t0
534 if verbose:
535 print "elapsed time without profiling =", elapsed_noprofile
536
537 # elapsed_profile <- time f(m) takes with profiling. The difference
538 # is profiling overhead, only some of which the profiler subtracts
539 # out on its own.
540 p = Profile()
541 t0 = get_time()
542 p.runctx('f(m)', globals(), locals())
543 t1 = get_time()
544 elapsed_profile = t1 - t0
545 if verbose:
546 print "elapsed time with profiling =", elapsed_profile
547
548 # reported_time <- "CPU seconds" the profiler charged to f and f1.
549 total_calls = 0.0
550 reported_time = 0.0
551 for (filename, line, funcname), (cc, ns, tt, ct, callers) in \
552 p.timings.items():
553 if funcname in ("f", "f1"):
554 total_calls += cc
555 reported_time += tt
556
557 if verbose:
558 print "'CPU seconds' profiler reported =", reported_time
559 print "total # calls =", total_calls
560 if total_calls != m + 1:
561 raise ValueError("internal error: total calls = %d" % total_calls)
562
563 # reported_time - elapsed_noprofile = overhead the profiler wasn't
564 # able to measure. Divide by twice the number of calls (since there
565 # are two profiler events per call in this test) to get the hidden
566 # overhead per event.
567 mean = (reported_time - elapsed_noprofile) / 2.0 / total_calls
568 if verbose:
569 print "mean stopwatch overhead per profile event =", mean
570 return mean
Guido van Rossumb6775db1994-08-01 11:34:53 +0000571
Guido van Rossumb6775db1994-08-01 11:34:53 +0000572#****************************************************************************
573def Stats(*args):
Tim Peters2344fae2001-01-15 00:50:52 +0000574 print 'Report generating functions are in the "pstats" module\a'
Guido van Rossumcc778eb1996-10-01 02:55:54 +0000575
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000576def main():
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000577 usage = "profile.py [-o output_file_path] [-s sort] scriptfile [arg] ..."
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000578 parser = OptionParser(usage=usage)
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000579 parser.allow_interspersed_args = False
Tim Peters4e0e1b62004-07-07 20:54:48 +0000580 parser.add_option('-o', '--outfile', dest="outfile",
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000581 help="Save stats to <outfile>", default=None)
582 parser.add_option('-s', '--sort', dest="sort",
Florent Xicluna92847452010-09-13 17:36:36 +0000583 help="Sort order when printing to stdout, based on pstats.Stats class",
584 default=-1)
Tim Petersb497c102005-01-10 16:48:37 +0000585
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000586 if not sys.argv[1:]:
587 parser.print_usage()
588 sys.exit(2)
Tim Petersb497c102005-01-10 16:48:37 +0000589
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000590 (options, args) = parser.parse_args()
Florent Xicluna92847452010-09-13 17:36:36 +0000591 sys.argv[:] = args
Tim Petersb497c102005-01-10 16:48:37 +0000592
Florent Xicluna92847452010-09-13 17:36:36 +0000593 if len(args) > 0:
594 progname = args[0]
595 sys.path.insert(0, os.path.dirname(progname))
596 with open(progname, 'rb') as fp:
597 code = compile(fp.read(), progname, 'exec')
598 globs = {
599 '__file__': progname,
600 '__name__': '__main__',
601 '__package__': None,
602 }
603 runctx(code, globs, None, options.outfile, options.sort)
Nicholas Bastin824b1b22004-03-23 18:44:39 +0000604 else:
Johannes Gijsbers2abe7852005-01-09 01:58:02 +0000605 parser.print_usage()
606 return parser
607
608# When invoked as main program, invoke the profiler on a script
609if __name__ == '__main__':
610 main()