blob: 8ae50fc246203619bc4ef5a70d95c00e15d735e7 [file] [log] [blame]
Martin v. Löwis09776b72002-08-04 17:22:59 +00001# -*- coding: iso-8859-1 -*-
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +00002"""Get useful information from live Python objects.
3
4This module encapsulates the interface provided by the internal special
5attributes (func_*, co_*, im_*, tb_*, etc.) in a friendlier fashion.
6It also provides some help for examining source code and class layout.
7
8Here are some of the useful functions provided by this module:
9
10 ismodule(), isclass(), ismethod(), isfunction(), istraceback(),
11 isframe(), iscode(), isbuiltin(), isroutine() - check object types
12 getmembers() - get members of an object that satisfy a given condition
13
14 getfile(), getsourcefile(), getsource() - find an object's source code
15 getdoc(), getcomments() - get documentation on an object
16 getmodule() - determine the module that an object came from
17 getclasstree() - arrange classes so as to represent their hierarchy
18
19 getargspec(), getargvalues() - get info about function arguments
20 formatargspec(), formatargvalues() - format an argument spec
21 getouterframes(), getinnerframes() - get info about frames
22 currentframe() - get the current stack frame
23 stack(), trace() - get info about frames on the stack or in a traceback
24"""
25
26# This module is in the public domain. No warranties.
27
Ka-Ping Yee8b58b842001-03-01 13:56:16 +000028__author__ = 'Ka-Ping Yee <ping@lfw.org>'
29__date__ = '1 Jan 2001'
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +000030
Neil Schemenauerf06f8532002-03-23 23:51:04 +000031import sys, os, types, string, re, dis, imp, tokenize, linecache
Raymond Hettingera1a992c2005-03-11 06:46:45 +000032from operator import attrgetter
Raymond Hettingere896acc2008-01-11 03:04:50 +000033from collections import namedtuple
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +000034
35# ----------------------------------------------------------- type-checking
def ismodule(object):
    """Tell whether the object is a module.

    A module object carries, among others:
        __doc__         documentation string
        __file__        filename (missing for built-in modules)"""
    module_type = types.ModuleType
    return isinstance(object, module_type)
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +000043
def isclass(object):
    """Return true if the object is a class.

    Class objects provide these attributes:
        __doc__         documentation string
        __module__      name of module in which this class was defined

    The check is an isinstance() test against the class types, so an
    instance that merely exposes (or fakes, e.g. through a catch-all
    __getattr__) a __bases__ attribute is not reported as a class."""
    # types.ClassType is the type of classic classes; where the types
    # module does not provide it, new-style ``type`` is the only class type.
    classic = getattr(types, 'ClassType', type)
    return isinstance(object, (type, classic))
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +000051
def ismethod(object):
    """Tell whether the object is an instance method.

    An instance method object carries:
        __doc__         documentation string
        __name__        name with which this method was defined
        im_class        class object in which this method belongs
        im_func         function object containing implementation of method
        im_self         instance to which this method is bound, or None"""
    method_type = types.MethodType
    return isinstance(object, method_type)
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +000062
def ismethoddescriptor(object):
    """Tell whether the object is a method descriptor.

    The answer is false whenever ismethod(), isclass() or isfunction()
    is true for the object.

    Method descriptors are new in Python 2.2; int.__add__ is an example.
    A qualifying object has a __get__ attribute and no __set__ attribute;
    beyond that the set of attributes varies.  __name__ is usually
    sensible, and __doc__ often is.

    Objects that are implemented via descriptors but also satisfy one of
    the other tests are rejected here because those tests promise more --
    e.g. an object passing ismethod() is known to have im_func (etc)."""
    if not hasattr(object, "__get__"):
        return False
    if hasattr(object, "__set__"):
        # __get__ together with __set__ makes it a data descriptor
        return False
    # mutual exclusion with the more specific predicates
    if ismethod(object) or isfunction(object) or isclass(object):
        return False
    return True
82
def isdatadescriptor(object):
    """Tell whether the object is a data descriptor.

    A data descriptor has both a __set__ and a __get__ attribute.
    Properties (defined in Python) and getsets and members (defined in C)
    are examples.  Such objects typically also have __name__ and __doc__
    attributes (properties, getsets, and members do), but that is not
    guaranteed."""
    if not hasattr(object, "__set__"):
        return False
    return hasattr(object, "__get__")
92
if not hasattr(types, 'MemberDescriptorType'):
    # Implementations whose types module lacks MemberDescriptorType
    def ismemberdescriptor(object):
        """Tell whether the object is a member descriptor.

        Member descriptors are specialized descriptors defined in
        extension modules; this variant always answers False."""
        return False
else:
    # CPython and equivalent
    def ismemberdescriptor(object):
        """Tell whether the object is a member descriptor.

        Member descriptors are specialized descriptors defined in
        extension modules."""
        return isinstance(object, types.MemberDescriptorType)
109
if not hasattr(types, 'GetSetDescriptorType'):
    # Implementations whose types module lacks GetSetDescriptorType
    def isgetsetdescriptor(object):
        """Tell whether the object is a getset descriptor.

        getset descriptors are specialized descriptors defined in
        extension modules; this variant always answers False."""
        return False
else:
    # CPython and equivalent
    def isgetsetdescriptor(object):
        """Tell whether the object is a getset descriptor.

        getset descriptors are specialized descriptors defined in
        extension modules."""
        return isinstance(object, types.GetSetDescriptorType)
Tim Petersce70a3b2006-07-27 23:45:48 +0000126
def isfunction(object):
    """Tell whether the object is a user-defined function.

    A function object carries:
        __doc__         documentation string
        __name__        name with which this function was defined
        func_code       code object containing compiled function bytecode
        func_defaults   tuple of any default values for arguments
        func_doc        (same as __doc__)
        func_globals    global namespace in which this function was defined
        func_name       (same as __name__)"""
    function_type = types.FunctionType
    return isinstance(object, function_type)
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000139
def istraceback(object):
    """Tell whether the object is a traceback.

    A traceback object carries:
        tb_frame        frame object at this level
        tb_lasti        index of last attempted instruction in bytecode
        tb_lineno       current line number in Python source code
        tb_next         next inner traceback object (called by this level)"""
    traceback_type = types.TracebackType
    return isinstance(object, traceback_type)
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000149
def isframe(object):
    """Tell whether the object is a frame object.

    A frame object carries:
        f_back          next outer frame object (this frame's caller)
        f_builtins      built-in namespace seen by this frame
        f_code          code object being executed in this frame
        f_exc_traceback traceback if raised in this frame, or None
        f_exc_type      exception type if raised in this frame, or None
        f_exc_value     exception value if raised in this frame, or None
        f_globals       global namespace seen by this frame
        f_lasti         index of last attempted instruction in bytecode
        f_lineno        current line number in Python source code
        f_locals        local namespace seen by this frame
        f_restricted    0 or 1 if frame is in restricted execution mode
        f_trace         tracing function for this frame, or None"""
    frame_type = types.FrameType
    return isinstance(object, frame_type)
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000167
def iscode(object):
    """Tell whether the object is a code object.

    A code object carries:
        co_argcount     number of arguments (not including * or ** args)
        co_code         string of raw compiled bytecode
        co_consts       tuple of constants used in the bytecode
        co_filename     name of file in which this code object was created
        co_firstlineno  number of first line in Python source code
        co_flags        bitmap: 1=optimized | 2=newlocals | 4=*arg | 8=**arg
        co_lnotab       encoded mapping of line numbers to bytecode indices
        co_name         name with which this code object was defined
        co_names        tuple of names of local variables
        co_nlocals      number of local variables
        co_stacksize    virtual machine stack space required
        co_varnames     tuple of names of arguments and local variables"""
    code_type = types.CodeType
    return isinstance(object, code_type)
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000185
def isbuiltin(object):
    """Tell whether the object is a built-in function or method.

    A built-in function or method carries:
        __doc__         documentation string
        __name__        original name of this function or method
        __self__        instance to which a method is bound, or None"""
    builtin_type = types.BuiltinFunctionType
    return isinstance(object, builtin_type)
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000194
def isroutine(object):
    """Tell whether the object is any kind of function or method.

    True as soon as one of isbuiltin(), isfunction(), ismethod() or
    ismethoddescriptor() accepts the object; they are tried in that order."""
    for check in (isbuiltin, isfunction, ismethod, ismethoddescriptor):
        if check(object):
            return True
    return False
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000201
def getmembers(object, predicate=None):
    """Return all members of an object as (name, value) pairs sorted by name.

    Optionally, only return members that satisfy a given predicate.

    A name reported by dir() whose lookup raises AttributeError is left
    out of the result instead of aborting the whole call."""
    results = []
    for key in dir(object):
        try:
            value = getattr(object, key)
        except AttributeError:
            # dir() can list names that cannot actually be fetched
            continue
        if not predicate or predicate(value):
            results.append((key, value))
    # Order on the name alone, so member values never get compared.
    results.sort(key=lambda pair: pair[0])
    return results
212
# Record type for one classified class attribute: its name, its kind, the
# class that defines it, and the attribute object itself.  Instances are
# built by classify_class_attrs().
Attribute = namedtuple('Attribute', 'name kind defining_class object')
214
def classify_class_attrs(cls):
    """Describe every attribute named by dir(cls).

    The result is a list with one 4-tuple (an Attribute) per name:

        0. The name (a string).

        1. The kind of attribute this is, one of these strings:
               'class method'    created via classmethod()
               'static method'   created via staticmethod()
               'property'        created via property()
               'method'          any other flavor of method
               'data'            not a method

        2. The class which defined this attribute (a class).

        3. The object as found in the defining class's __dict__ rather
           than through getattr.  That matters most for data attributes:
           C.data is just a data object, whereas C.__dict__['data'] may
           be a data descriptor carrying extra information such as a
           __doc__ string.
    """

    lookup_order = getmro(cls)
    attr_names = dir(cls)
    classified = []
    for name in attr_names:
        # The raw __dict__ entry sometimes reveals more than getattr does;
        # static and class methods are dramatic examples.
        raw = cls.__dict__[name] if name in cls.__dict__ else getattr(cls, name)

        # Work out which class defines the attribute.
        owner = getattr(raw, "__objclass__", None)
        if owner is None:
            # fall back to scanning the class dicts along the MRO
            for klass in lookup_order:
                if name in klass.__dict__:
                    owner = klass
                    break

        # Re-fetch from the defining class's __dict__ when possible.
        if owner is not None and name in owner.__dict__:
            raw = owner.__dict__[name]

        # The getattr view is what decides 'method' versus 'data'.
        bound = getattr(cls, name)

        for wrapper, label in ((staticmethod, "static method"),
                               (classmethod, "class method"),
                               (property, "property")):
            if isinstance(raw, wrapper):
                kind = label
                break
        else:
            if ismethod(bound) or ismethoddescriptor(bound):
                kind = "method"
            else:
                kind = "data"

        classified.append(Attribute(name, kind, owner, raw))

    return classified
284
Tim Peterse0b2d7a2001-09-22 06:10:55 +0000285# ----------------------------------------------------------- class helpers
286def _searchbases(cls, accum):
287 # Simulate the "classic class" search order.
288 if cls in accum:
289 return
290 accum.append(cls)
291 for base in cls.__bases__:
292 _searchbases(base, accum)
293
def getmro(cls):
    "Return tuple of base classes (including cls) in method resolution order."
    if not hasattr(cls, "__mro__"):
        # No __mro__ attribute: rebuild the order with the classic search.
        chain = []
        _searchbases(cls, chain)
        return tuple(chain)
    return cls.__mro__
302
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000303# -------------------------------------------------- source code extraction
def indentsize(line):
    """Return the width, in spaces, of the leading whitespace of a line.

    Tabs are expanded before measuring."""
    expanded = line.expandtabs()
    stripped = expanded.lstrip()
    return len(expanded) - len(stripped)
308
309def getdoc(object):
310 """Get the documentation string for an object.
311
312 All tabs are expanded to spaces. To clean up docstrings that are
313 indented to line up with blocks of code, any whitespace than can be
314 uniformly removed from the second line onwards is removed."""
Tim Peters24008312002-03-17 18:56:20 +0000315 try:
316 doc = object.__doc__
317 except AttributeError:
318 return None
Michael W. Hudson755f75e2002-05-20 17:29:46 +0000319 if not isinstance(doc, types.StringTypes):
Tim Peters24008312002-03-17 18:56:20 +0000320 return None
321 try:
322 lines = string.split(string.expandtabs(doc), '\n')
323 except UnicodeError:
324 return None
325 else:
Ka-Ping Yeea59ef7b2002-11-30 03:53:15 +0000326 # Find minimum indentation of any non-blank lines after first line.
327 margin = sys.maxint
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000328 for line in lines[1:]:
329 content = len(string.lstrip(line))
Ka-Ping Yeea59ef7b2002-11-30 03:53:15 +0000330 if content:
331 indent = len(line) - content
332 margin = min(margin, indent)
333 # Remove indentation.
334 if lines:
335 lines[0] = lines[0].lstrip()
336 if margin < sys.maxint:
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000337 for i in range(1, len(lines)): lines[i] = lines[i][margin:]
Ka-Ping Yeea59ef7b2002-11-30 03:53:15 +0000338 # Remove any trailing or leading blank lines.
339 while lines and not lines[-1]:
340 lines.pop()
341 while lines and not lines[0]:
342 lines.pop(0)
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000343 return string.join(lines, '\n')
344
def getfile(object):
    """Work out which source or compiled file an object was defined in.

    Modules answer with their own __file__; classes with the __file__ of
    the module named by their __module__.  Methods, functions, tracebacks
    and frames are reduced step by step to a code object, whose
    co_filename is returned.  TypeError is raised for built-in modules
    and classes and for any other kind of object."""
    if ismodule(object):
        if not hasattr(object, '__file__'):
            raise TypeError('arg is a built-in module')
        return object.__file__
    if isclass(object):
        object = sys.modules.get(object.__module__)
        if not hasattr(object, '__file__'):
            raise TypeError('arg is a built-in class')
        return object.__file__
    # Peel one wrapper at a time until a code object is left.
    if ismethod(object):
        object = object.im_func
    if isfunction(object):
        object = object.func_code
    if istraceback(object):
        object = object.tb_frame
    if isframe(object):
        object = object.f_code
    if not iscode(object):
        raise TypeError('arg is not a module, class, method, '
                        'function, traceback, frame, or code object')
    return object.co_filename
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000368
# Record type returned by getmoduleinfo(): the module name, the matched file
# suffix, and the mode and module type taken from imp.get_suffixes().
ModuleInfo = namedtuple('ModuleInfo', 'name suffix mode module_type')
370
def getmoduleinfo(path):
    """Get the module name, suffix, mode, and module type for a given file.

    The base name of path is compared against every suffix reported by
    imp.get_suffixes().  On a match a ModuleInfo is returned whose name
    is the base name with the suffix removed; otherwise None is returned."""
    filename = os.path.basename(path)
    # Lead each entry with the negated suffix length: sorting then puts the
    # longest suffixes first (in case they overlap), and the same number
    # doubles as the slice index that cuts the suffix off the file name.
    suffixes = [(-len(suffix), suffix, mode, mtype)
                for suffix, mode, mtype in imp.get_suffixes()]
    suffixes.sort()
    for neglen, suffix, mode, mtype in suffixes:
        if filename[neglen:] == suffix:
            return ModuleInfo(filename[:neglen], suffix, mode, mtype)
    return None
Ka-Ping Yee4d6fc7f2001-04-10 11:43:00 +0000380
def getmodulename(path):
    """Return the module name for a given file, or None.

    The name is the first field of the getmoduleinfo() result."""
    info = getmoduleinfo(path)
    if not info:
        return None
    return info[0]
385
def getsourcefile(object):
    """Return the Python source file an object was defined in, if it exists.

    A '.pyc' or '.pyo' name is mapped to the matching '.py' name.  None
    is returned when the name carries a binary-mode suffix from
    imp.get_suffixes(), or when the file does not exist and the object's
    module has no __loader__ attribute."""
    path = getfile(object)
    if path[-4:].lower() in ('.pyc', '.pyo'):
        path = path[:-4] + '.py'
    for suffix, mode, _kind in imp.get_suffixes():
        is_binary = 'b' in mode
        if is_binary and path[-len(suffix):].lower() == suffix:
            # Looks like a binary file.  We want to only return a text file.
            return None
    # A non-existent filename is only returned if the module has a
    # PEP 302 loader.
    if os.path.exists(path) or hasattr(getmodule(object, path), '__loader__'):
        return path
    return None
400
def getabsfile(object, _filename=None):
    """Return an absolute path to the source or compiled file for an object.

    Each object should end up with a unique origin, so the path is made
    absolute and case-normalized.  When _filename is given it is used
    directly instead of being looked up from the object."""
    path = _filename
    if path is None:
        path = getsourcefile(object) or getfile(object)
    absolute = os.path.abspath(path)
    return os.path.normcase(absolute)
Ka-Ping Yeec113c242001-03-02 02:08:53 +0000409
# Caches filled in by getmodule():
#   modulesbyfile    maps a file path to the __name__ of the module found there
#   _filesbymodname  maps a sys.modules key to the __file__ value last seen for
#                    it, so modules that were already mapped can be skipped
modulesbyfile = {}
_filesbymodname = {}
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000412
def getmodule(object, _filename=None):
    """Return the module an object was defined in, or None if not found.

    A module is returned unchanged, and an object with a __module__
    attribute is resolved through sys.modules.  Otherwise the object's
    file is looked up in the modulesbyfile cache (refreshing the cache
    from sys.modules if needed), and as a last resort the object is
    searched for by name in the __main__ and __builtin__ modules.

    _filename, when given, is tried as a cache key first and is also
    passed on to getabsfile()."""
    if ismodule(object):
        return object
    if hasattr(object, '__module__'):
        return sys.modules.get(object.__module__)
    # Try the filename to modulename cache
    if _filename is not None and _filename in modulesbyfile:
        return sys.modules.get(modulesbyfile[_filename])
    # Try the cache again with the absolute file name
    try:
        file = getabsfile(object, _filename)
    except TypeError:
        # no file can be determined for this object
        return None
    if file in modulesbyfile:
        return sys.modules.get(modulesbyfile[file])
    # Update the filename to module name cache and check yet again
    # Copy sys.modules in order to cope with changes while iterating
    for modname, module in sys.modules.items():
        if ismodule(module) and hasattr(module, '__file__'):
            f = module.__file__
            if f == _filesbymodname.get(modname, None):
                # Have already mapped this module, so skip it
                continue
            _filesbymodname[modname] = f
            f = getabsfile(module)
            # Always map to the name the module knows itself by
            # (both the normalized path and its realpath are registered)
            modulesbyfile[f] = modulesbyfile[
                os.path.realpath(f)] = module.__name__
    if file in modulesbyfile:
        return sys.modules.get(modulesbyfile[file])
    # Check the main module
    main = sys.modules['__main__']
    if not hasattr(object, '__name__'):
        return None
    if hasattr(main, object.__name__):
        mainobject = getattr(main, object.__name__)
        # only accept the match if the name is bound to this very object
        if mainobject is object:
            return main
    # Check builtins
    builtin = sys.modules['__builtin__']
    if hasattr(builtin, object.__name__):
        builtinobject = getattr(builtin, object.__name__)
        if builtinobject is object:
            return builtin
    # falling off the end returns None: no module was found
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000458
def findsource(object):
    """Return the entire source file and starting line number for an object.

    The argument may be a module, class, method, function, traceback, frame,
    or code object.  The source code is returned as a list of all the lines
    in the file and the line number indexes a line in that list.  An IOError
    is raised if the source code cannot be retrieved."""
    file = getsourcefile(object) or getfile(object)
    module = getmodule(object, file)
    if module:
        # hand the module's globals to linecache along with the file name
        lines = linecache.getlines(file, module.__dict__)
    else:
        lines = linecache.getlines(file)
    if not lines:
        raise IOError('could not get source code')

    if ismodule(object):
        # a module starts at the top of its file
        return lines, 0

    if isclass(object):
        name = object.__name__
        # group 1 captures the indentation in front of the "class" keyword
        pat = re.compile(r'^(\s*)class\s*' + name + r'\b')
        # make some effort to find the best matching class definition:
        # use the one with the least indentation, which is the one
        # that's most probably not inside a function definition.
        candidates = []
        for i in range(len(lines)):
            match = pat.match(lines[i])
            if match:
                # if it's at toplevel, it's already the best one
                if lines[i][0] == 'c':
                    return lines, i
                # else add whitespace to candidate list
                candidates.append((match.group(1), i))
        if candidates:
            # this will sort by whitespace, and by line number,
            # less whitespace first
            candidates.sort()
            return lines, candidates[0][1]
        else:
            raise IOError('could not find class definition')

    # Reduce methods, functions, tracebacks and frames to a code object.
    if ismethod(object):
        object = object.im_func
    if isfunction(object):
        object = object.func_code
    if istraceback(object):
        object = object.tb_frame
    if isframe(object):
        object = object.f_code
    if iscode(object):
        if not hasattr(object, 'co_firstlineno'):
            raise IOError('could not find function definition')
        # co_firstlineno is 1-based; lines is indexed from 0
        lnum = object.co_firstlineno - 1
        # a line that starts a "def", contains a "lambda", or starts with "@"
        pat = re.compile(r'^(\s*def\s)|(.*(?<!\w)lambda(:|\s))|^(\s*@)')
        # walk backwards until such a line is found (or line 0 is reached)
        while lnum > 0:
            if pat.match(lines[lnum]): break
            lnum = lnum - 1
        return lines, lnum
    raise IOError('could not find code object')
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000519
def getcomments(object):
    """Get lines of comments immediately preceding an object's source code.

    For a module, this is the first comment block at the top of the file
    (after an optional '#!' line and any blank or bare '#' lines).  For
    other objects it is the run of comment lines directly above the
    object's first line that share its indentation.

    Returns None when source can't be found, and also when no such
    comment block exists.
    """
    try:
        lines, lnum = findsource(object)
    except (IOError, TypeError):
        return None

    if ismodule(object):
        # Look for a comment block at the top of the file.
        start = 0
        # skip a leading '#!' line
        if lines and lines[0][:2] == '#!': start = 1
        # skip blank lines and lines holding only '#'
        while start < len(lines) and string.strip(lines[start]) in ('', '#'):
            start = start + 1
        if start < len(lines) and lines[start][:1] == '#':
            comments = []
            end = start
            # collect consecutive lines that begin with '#' in column 0
            while end < len(lines) and lines[end][:1] == '#':
                comments.append(string.expandtabs(lines[end]))
                end = end + 1
            return string.join(comments, '')

    # Look for a preceding block of comments at the same indentation.
    elif lnum > 0:
        indent = indentsize(lines[lnum])
        end = lnum - 1
        if end >= 0 and string.lstrip(lines[end])[:1] == '#' and \
            indentsize(lines[end]) == indent:
            comments = [string.lstrip(string.expandtabs(lines[end]))]
            if end > 0:
                end = end - 1
                comment = string.lstrip(string.expandtabs(lines[end]))
                # walk upwards, prepending each further comment line
                while comment[:1] == '#' and indentsize(lines[end]) == indent:
                    comments[:0] = [comment]
                    end = end - 1
                    if end < 0: break
                    comment = string.lstrip(string.expandtabs(lines[end]))
            # trim bare '#' lines from both ends of the block
            while comments and string.strip(comments[0]) == '#':
                comments[:1] = []
            while comments and string.strip(comments[-1]) == '#':
                comments[-1:] = []
            return string.join(comments, '')
564
class EndOfBlock(Exception):
    """Raised by BlockFinder.tokeneater() when the block has ended."""


class BlockFinder:
    """Provide a tokeneater() method to detect the end of a code block.

    State:
        indent      current nesting depth, counted in INDENT/DEDENT tokens
        islambda    true once the block turned out to start with "lambda"
        started     true once the first "def", "class" or "lambda" was seen
        passline    true while the rest of the current line is being skipped
        last        row of the most recent NEWLINE token seen after the
                    block started (initially 1)
    """
    def __init__(self):
        self.indent = 0
        self.islambda = False
        self.started = False
        self.passline = False
        self.last = 1

    def tokeneater(self, type, token, srow_scol, erow_ecol, line):
        """Consume one token; raise EndOfBlock when the block is over.

        The arguments are the five fields of a tokenize token: token type,
        token string, (start row, start column), (end row, end column) and
        the physical line."""
        # The positions arrive as 2-tuples; unpack them explicitly rather
        # than in the signature.
        srow, scol = srow_scol
        erow, ecol = erow_ecol
        if not self.started:
            # look for the first "def", "class" or "lambda"
            if token in ("def", "class", "lambda"):
                if token == "lambda":
                    self.islambda = True
                self.started = True
            self.passline = True    # skip to the end of the line
        elif type == tokenize.NEWLINE:
            self.passline = False   # stop skipping when a NEWLINE is seen
            self.last = srow
            if self.islambda:       # lambdas always end at the first NEWLINE
                raise EndOfBlock
        elif self.passline:
            pass
        elif type == tokenize.INDENT:
            self.indent = self.indent + 1
            self.passline = True
        elif type == tokenize.DEDENT:
            self.indent = self.indent - 1
            # the end of matching indent/dedent pairs end a block
            # (note that this only works for "def"/"class" blocks,
            #  not e.g. for "if: else:" or "try: finally:" blocks)
            if self.indent <= 0:
                raise EndOfBlock
        elif self.indent == 0 and type not in (tokenize.COMMENT, tokenize.NL):
            # any other token on the same indentation level end the previous
            # block as well, except the pseudo-tokens COMMENT and NL.
            raise EndOfBlock
Tim Peters4efb6e92001-06-29 23:51:08 +0000605
def getblock(lines):
    """Extract the block of code at the top of the given list of lines.

    The lines are tokenized through a BlockFinder; everything up to the
    last line it recorded is returned."""
    finder = BlockFinder()
    readline = iter(lines).next
    try:
        tokenize.tokenize(readline, finder.tokeneater)
    except (EndOfBlock, IndentationError):
        # either signals that there is nothing more to scan
        pass
    end = finder.last
    return lines[:end]
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000614
def getsourcelines(object):
    """Return a list of source lines and starting line number for an object.

    The argument may be a module, class, method, function, traceback, frame,
    or code object.  The list holds the lines that make up the object, and
    the number tells where in the original source file the first of them
    was found.  For a module the whole file is returned with line number 0.
    An IOError is raised if the source code cannot be retrieved."""
    source, index = findsource(object)

    if ismodule(object):
        return source, 0
    return getblock(source[index:]), index + 1
627
def getsource(object):
    """Return the text of the source code for an object.

    The argument may be a module, class, method, function, traceback, frame,
    or code object.  The lines found by getsourcelines() are joined into
    one string.  An IOError is raised if the source code cannot be
    retrieved."""
    pieces = getsourcelines(object)[0]
    return ''.join(pieces)
636
637# --------------------------------------------------- class tree extraction
def walktree(classes, children, parent):
    """Recursive helper function for getclasstree().

    classes is sorted in place by (__module__, __name__).  Each class
    contributes a (class, bases) entry, followed by a nested list for its
    own children when it has any in the children mapping."""
    results = []
    classes.sort(key=attrgetter('__module__', '__name__'))
    for c in classes:
        results.append((c, c.__bases__))
        if c in children:
            results.append(walktree(children[c], children, c))
    return results

def getclasstree(classes, unique=0):
    """Arrange the given list of classes into a hierarchy of nested lists.

    Where a nested list appears, it contains classes derived from the class
    whose entry immediately precedes the list.  Each entry is a 2-tuple
    containing a class and a tuple of its base classes.  If the 'unique'
    argument is true, exactly one entry appears in the returned structure
    for each class in the given list.  Otherwise, classes using multiple
    inheritance and their descendants will appear multiple times.

    A class that occurs more than once in the given list is recorded only
    once under each of its parents."""
    children = {}
    roots = []
    for c in classes:
        if c.__bases__:
            for parent in c.__bases__:
                derived = children.setdefault(parent, [])
                # a repeated input class must not produce repeated entries
                if c not in derived:
                    derived.append(c)
                # with 'unique', stop at the first parent that is itself listed
                if unique and parent in classes: break
        elif c not in roots:
            roots.append(c)
    # parents that were not given explicitly become additional roots
    for parent in children:
        if parent not in classes:
            roots.append(parent)
    return walktree(roots, children, None)
672
673# ------------------------------------------------ argument list extraction
# These constants are from Python's compile.h.
# getargs() tests CO_VARARGS and CO_VARKEYWORDS against a code object's
# co_flags to find out whether it takes * and ** arguments.
CO_OPTIMIZED, CO_NEWLOCALS, CO_VARARGS, CO_VARKEYWORDS = 1, 2, 4, 8

# Named tuple type with the fields (args, varargs, keywords).
Arguments = namedtuple('Arguments', 'args varargs keywords')
678
def getargs(co):
    """Get information about the arguments accepted by a code object.

    Three things are returned: (args, varargs, varkw), where 'args' is
    a list of argument names (possibly containing nested lists), and
    'varargs' and 'varkw' are the names of the * and ** arguments or None.

    The result is an Arguments named tuple.  A TypeError is raised if
    'co' is not a code object."""

    if not iscode(co):
        raise TypeError('arg is not a code object')

    nargs = co.co_argcount
    names = co.co_varnames
    args = list(names[:nargs])
    # Offset of the next bytecode to decode.  It is not reset between
    # arguments, so each anonymous argument resumes the scan where the
    # previous one stopped.
    step = 0

    # The following acrobatics are for anonymous (tuple) arguments.
    for i in range(nargs):
        # An argument whose name is empty or starts with '.' is anonymous.
        if args[i][:1] in ('', '.'):
            # stack:  names (and nested lists of names) collected so far
            # remain: for each unpack still open, elements left to store
            # count:  for each unpack still open, its total element count
            stack, remain, count = [], [], []
            while step < len(co.co_code):
                op = ord(co.co_code[step])
                step = step + 1
                if op >= dis.HAVE_ARGUMENT:
                    opname = dis.opname[op]
                    # The operand is two bytes, low byte first.
                    value = ord(co.co_code[step]) + ord(co.co_code[step+1])*256
                    step = step + 2
                    if opname in ('UNPACK_TUPLE', 'UNPACK_SEQUENCE'):
                        # A new (possibly nested) sublist of 'value' items.
                        remain.append(value)
                        count.append(value)
                    elif opname == 'STORE_FAST':
                        stack.append(names[value])

                        # Special case for sublists of length 1: def foo((bar))
                        # doesn't generate the UNPACK_TUPLE bytecode, so if
                        # `remain` is empty here, we have such a sublist.
                        if not remain:
                            stack[0] = [stack[0]]
                            break
                        else:
                            remain[-1] = remain[-1] - 1
                            # Close every sublist that is now complete,
                            # folding its names into a single nested list
                            # that counts as one element of its parent.
                            while remain[-1] == 0:
                                remain.pop()
                                size = count.pop()
                                stack[-size:] = [stack[-size:]]
                                if not remain: break
                                remain[-1] = remain[-1] - 1
                            # The outermost sublist is complete.
                            if not remain: break
            args[i] = stack[0]

    # The * name, if any, follows the positional names in co_varnames,
    # and the ** name follows that.
    varargs = None
    if co.co_flags & CO_VARARGS:
        varargs = co.co_varnames[nargs]
        nargs = nargs + 1
    varkw = None
    if co.co_flags & CO_VARKEYWORDS:
        varkw = co.co_varnames[nargs]
    return Arguments(args, varargs, varkw)
736
ArgSpec = namedtuple('ArgSpec', 'args varargs keywords defaults')

def getargspec(func):
    """Get the names and default values of a function's arguments.

    The result is an ArgSpec named tuple of four things:
    (args, varargs, varkw, defaults).
    'args' is a list of the argument names (it may contain nested lists).
    'varargs' and 'varkw' are the names of the * and ** arguments or None.
    'defaults' is the function's func_defaults, i.e. the default values
    of the last n arguments.

    A method is inspected through its underlying function.  A TypeError
    is raised if the argument is not a Python function or method.
    """
    target = func.im_func if ismethod(func) else func
    if not isfunction(target):
        raise TypeError('arg is not a Python function')
    positional, star, doublestar = getargs(target.func_code)
    return ArgSpec(positional, star, doublestar, target.func_defaults)
754
ArgInfo = namedtuple('ArgInfo', 'args varargs keywords locals')

def getargvalues(frame):
    """Get information about arguments passed into a particular frame.

    An ArgInfo named tuple of four things is returned:
    (args, varargs, varkw, locals).
    'args' is a list of the argument names (it may contain nested lists).
    'varargs' and 'varkw' are the names of the * and ** arguments or None.
    'locals' is the locals dictionary of the given frame."""
    args, varargs, varkw = getargs(frame.f_code)
    # Return the named tuple declared for this purpose; it is still a
    # plain 4-tuple for callers that unpack or index the result.
    return ArgInfo(args, varargs, varkw, frame.f_locals)
766
def joinseq(seq):
    """Join a sequence of strings into a parenthesized, tuple-like string.

    A single element is written with a trailing comma, e.g. '(a,)';
    any other length is written comma-separated, e.g. '(a, b)' or '()'."""
    if len(seq) == 1:
        return '(' + seq[0] + ',)'
    return '(' + ', '.join(seq) + ')'
772
def strseq(object, convert, join=joinseq):
    """Recursively walk a sequence, stringifying each element.

    If 'object' is a list or tuple, each element is processed recursively
    and the resulting list of strings is passed to 'join'.  Anything else
    is passed to 'convert' and its result is returned."""
    # The exact type test is deliberate: instances of list or tuple
    # subclasses are handed to 'convert' rather than walked.
    if type(object) in (list, tuple):
        # Build a real list so that 'join' may call len() on it.
        return join([strseq(item, convert, join) for item in object])
    return convert(object)
779
def formatargspec(args, varargs=None, varkw=None, defaults=None,
                  formatarg=str,
                  formatvarargs=lambda name: '*' + name,
                  formatvarkw=lambda name: '**' + name,
                  formatvalue=lambda value: '=' + repr(value),
                  join=joinseq):
    """Format an argument spec from the 4 values returned by getargspec.

    The first four arguments are (args, varargs, varkw, defaults).  The
    other four arguments are the corresponding optional formatting functions
    that are called to turn names and values into strings.  The ninth
    argument is an optional function to format the sequence of arguments.

    The result is a single string: the formatted arguments separated by
    ', ' and enclosed in parentheses."""
    specs = []
    if defaults:
        # Defaults belong to the last len(defaults) entries of 'args'.
        firstdefault = len(args) - len(defaults)
    for i, arg in enumerate(args):
        spec = strseq(arg, formatarg, join)
        if defaults and i >= firstdefault:
            spec = spec + formatvalue(defaults[i - firstdefault])
        specs.append(spec)
    if varargs is not None:
        specs.append(formatvarargs(varargs))
    if varkw is not None:
        specs.append(formatvarkw(varkw))
    return '(' + ', '.join(specs) + ')'
805
def formatargvalues(args, varargs, varkw, locals,
                    formatarg=str,
                    formatvarargs=lambda name: '*' + name,
                    formatvarkw=lambda name: '**' + name,
                    formatvalue=lambda value: '=' + repr(value),
                    join=joinseq):
    """Format an argument spec from the 4 values returned by getargvalues.

    The first four arguments are (args, varargs, varkw, locals).  The
    next four arguments are the corresponding optional formatting functions
    that are called to turn names and values into strings.  The ninth
    argument is an optional function to format the sequence of arguments.

    Every name is followed by its formatted value looked up in 'locals'.
    The result is a single string: the formatted arguments separated by
    ', ' and enclosed in parentheses."""
    def convert(name):
        # Format one argument name together with its current value.
        return formatarg(name) + formatvalue(locals[name])

    specs = [strseq(arg, convert, join) for arg in args]
    if varargs:
        specs.append(formatvarargs(varargs) + formatvalue(locals[varargs]))
    if varkw:
        specs.append(formatvarkw(varkw) + formatvalue(locals[varkw]))
    return '(' + ', '.join(specs) + ')'
829
830# -------------------------------------------------- stack frame extraction
Raymond Hettingere896acc2008-01-11 03:04:50 +0000831
Traceback = namedtuple('Traceback', 'filename lineno function code_context index')

def getframeinfo(frame, context=1):
    """Get information about a frame or traceback object.

    A Traceback named tuple of five things is returned: the filename, the
    line number of the current line, the function name, a list of lines of
    context from the source code, and the index of the current line within
    that list.  The optional second argument specifies the number of lines
    of context to return, which are centered around the current line.

    The list of lines and the index are both None when 'context' is not
    positive or when the source cannot be found.  A TypeError is raised
    if the argument turns out not to be a frame or traceback object."""
    if istraceback(frame):
        lineno = frame.tb_lineno
        frame = frame.tb_frame
    else:
        lineno = frame.f_lineno
    if not isframe(frame):
        raise TypeError('arg is not a frame or traceback object')

    filename = getsourcefile(frame) or getfile(frame)
    if context > 0:
        # Index (0-based) of the first context line, before clamping.
        start = lineno - 1 - context//2
        try:
            lines, lnum = findsource(frame)
        except IOError:
            lines = index = None
        else:
            # Keep the window inside the file.  The lower bound must be 0,
            # not 1, or the first line of the file can never be part of
            # the context and 'index' becomes -1 for a frame on line 1.
            start = max(0, min(start, len(lines) - context))
            lines = lines[start:start+context]
            index = lineno - 1 - start
    else:
        lines = index = None

    return Traceback(filename, lineno, frame.f_code.co_name, lines, index)
Ka-Ping Yee59ade082001-03-01 03:55:35 +0000866
def getlineno(frame):
    """Return the current line number of a frame object.

    The value is read straight from the frame's f_lineno attribute."""
    # FrameType.f_lineno is now a descriptor that grovels co_lnotab
    lineno = frame.f_lineno
    return lineno
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000871
def getouterframes(frame, context=1):
    """Get a list of records for a frame and all higher (calling) frames.

    Each record is a tuple holding a frame object followed by the fields
    reported by getframeinfo(): filename, line number, function name,
    a list of lines of context, and index within the context.  The list
    starts with the given frame and follows f_back links from there."""
    records = []
    current = frame
    while current:
        info = getframeinfo(current, context)
        records.append((current,) + info)
        current = current.f_back
    return records
882
def getinnerframes(tb, context=1):
    """Get a list of records for a traceback's frame and all lower frames.

    Each record is a tuple holding a frame object followed by the fields
    reported by getframeinfo(): filename, line number, function name,
    a list of lines of context, and index within the context.  The list
    starts with the given traceback and follows tb_next links from there."""
    records = []
    current = tb
    while current:
        info = getframeinfo(current, context)
        records.append((current.tb_frame,) + info)
        current = current.tb_next
    return records
893
# currentframe is the same callable as sys._getframe.
currentframe = sys._getframe
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000895
def stack(context=1):
    """Return a list of records for the stack above the caller's frame.

    The records are built by getouterframes(), starting at the frame of
    whoever called stack(); 'context' is passed through to it."""
    # Depth 1 is the frame that called stack(), not stack() itself.
    caller = sys._getframe(1)
    return getouterframes(caller, context)
Ka-Ping Yee6397c7c2001-02-27 14:43:21 +0000899
def trace(context=1):
    """Return a list of records for the stack below the current exception.

    The records are built by getinnerframes() from the traceback that
    sys.exc_info() reports; 'context' is passed through to it."""
    tb = sys.exc_info()[2]
    return getinnerframes(tb, context)