Martin v. Löwis | 09776b7 | 2002-08-04 17:22:59 +0000 | [diff] [blame] | 1 | # -*- coding: iso-8859-1 -*- |
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 2 | """Get useful information from live Python objects. |
| 3 | |
| 4 | This module encapsulates the interface provided by the internal special |
| 5 | attributes (func_*, co_*, im_*, tb_*, etc.) in a friendlier fashion. |
| 6 | It also provides some help for examining source code and class layout. |
| 7 | |
| 8 | Here are some of the useful functions provided by this module: |
| 9 | |
| 10 | ismodule(), isclass(), ismethod(), isfunction(), istraceback(), |
| 11 | isframe(), iscode(), isbuiltin(), isroutine() - check object types |
| 12 | getmembers() - get members of an object that satisfy a given condition |
| 13 | |
| 14 | getfile(), getsourcefile(), getsource() - find an object's source code |
| 15 | getdoc(), getcomments() - get documentation on an object |
| 16 | getmodule() - determine the module that an object came from |
| 17 | getclasstree() - arrange classes so as to represent their hierarchy |
| 18 | |
| 19 | getargspec(), getargvalues() - get info about function arguments |
| 20 | formatargspec(), formatargvalues() - format an argument spec |
| 21 | getouterframes(), getinnerframes() - get info about frames |
| 22 | currentframe() - get the current stack frame |
| 23 | stack(), trace() - get info about frames on the stack or in a traceback |
| 24 | """ |
| 25 | |
| 26 | # This module is in the public domain. No warranties. |
| 27 | |
Ka-Ping Yee | 8b58b84 | 2001-03-01 13:56:16 +0000 | [diff] [blame] | 28 | __author__ = 'Ka-Ping Yee <ping@lfw.org>' |
| 29 | __date__ = '1 Jan 2001' |
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 30 | |
Neil Schemenauer | f06f853 | 2002-03-23 23:51:04 +0000 | [diff] [blame] | 31 | import sys, os, types, string, re, dis, imp, tokenize, linecache |
Raymond Hettinger | a1a992c | 2005-03-11 06:46:45 +0000 | [diff] [blame] | 32 | from operator import attrgetter |
Raymond Hettinger | e896acc | 2008-01-11 03:04:50 +0000 | [diff] [blame] | 33 | from collections import namedtuple |
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 34 | |
| 35 | # ----------------------------------------------------------- type-checking |
def ismodule(object):
    """Tell whether the object is a module.

    Modules carry these attributes:
        __doc__         documentation string
        __file__        filename (missing for built-in modules)"""
    module_type = types.ModuleType
    return isinstance(object, module_type)
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 43 | |
def isclass(object):
    """Return true if the object is a class.

    Both new-style classes (instances of type) and, where the interpreter
    has them, classic classes (instances of types.ClassType) qualify.
    The test is purely type-based: an instance that merely exposes a
    __bases__ attribute -- for example a proxy whose __getattr__ answers
    for every name -- is not reported as a class.

    Class objects provide these attributes:
        __doc__         documentation string
        __module__      name of module in which this class was defined"""
    # types.ClassType only exists where classic classes do; falling back to
    # type makes the check cover new-style classes alone in that case.
    return isinstance(object, (type, getattr(types, 'ClassType', type)))
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 51 | |
def ismethod(object):
    """Tell whether the object is an instance method.

    Instance methods carry these attributes:
        __doc__         documentation string
        __name__        name with which this method was defined
        im_class        class object in which this method belongs
        im_func         function object containing implementation of method
        im_self         instance to which this method is bound, or None"""
    method_type = types.MethodType
    return isinstance(object, method_type)
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 62 | |
def ismethoddescriptor(object):
    """Tell whether the object is a method descriptor.

    The answer is false whenever ismethod(), isclass() or isfunction()
    is true for the object.

    This is new in Python 2.2, and, for example, is true of int.__add__.
    A qualifying object has a __get__ attribute and no __set__ attribute;
    beyond that the set of attributes varies.  __name__ is usually
    sensible, and __doc__ often is.

    Methods implemented via descriptors that also satisfy one of the other
    tests are rejected here simply because those tests promise more --
    you can, e.g., count on having the im_func attribute (etc) when an
    object passes ismethod()."""
    if not hasattr(object, "__get__"):
        return False
    if hasattr(object, "__set__"):
        # A __set__ attribute makes it a data descriptor instead.
        return False
    # Mutual exclusion with the more specific predicates.
    if ismethod(object):
        return False
    if isfunction(object):
        return False
    return not isclass(object)
| 82 | |
def isdatadescriptor(object):
    """Tell whether the object is a data descriptor.

    A data descriptor has both a __set__ and a __get__ attribute.
    Properties (defined in Python) and getsets and members (defined in C)
    are examples.  Such objects typically also have __name__ and __doc__
    attributes (properties, getsets, and members have both), but this is
    not guaranteed."""
    if not hasattr(object, "__set__"):
        return False
    return hasattr(object, "__get__")
| 92 | |
if not hasattr(types, 'MemberDescriptorType'):
    # Implementations whose types module has no MemberDescriptorType
    def ismemberdescriptor(object):
        """Tell whether the object is a member descriptor.

        Member descriptors are specialized descriptors defined in
        extension modules."""
        return False
else:
    # CPython and equivalent
    def ismemberdescriptor(object):
        """Tell whether the object is a member descriptor.

        Member descriptors are specialized descriptors defined in
        extension modules."""
        return isinstance(object, types.MemberDescriptorType)
| 109 | |
if not hasattr(types, 'GetSetDescriptorType'):
    # Implementations whose types module has no GetSetDescriptorType
    def isgetsetdescriptor(object):
        """Tell whether the object is a getset descriptor.

        getset descriptors are specialized descriptors defined in
        extension modules."""
        return False
else:
    # CPython and equivalent
    def isgetsetdescriptor(object):
        """Tell whether the object is a getset descriptor.

        getset descriptors are specialized descriptors defined in
        extension modules."""
        return isinstance(object, types.GetSetDescriptorType)
Tim Peters | ce70a3b | 2006-07-27 23:45:48 +0000 | [diff] [blame] | 126 | |
def isfunction(object):
    """Tell whether the object is a user-defined function.

    Functions carry these attributes:
        __doc__         documentation string
        __name__        name with which this function was defined
        func_code       code object containing compiled function bytecode
        func_defaults   tuple of any default values for arguments
        func_doc        (same as __doc__)
        func_globals    global namespace in which this function was defined
        func_name       (same as __name__)"""
    function_type = types.FunctionType
    return isinstance(object, function_type)
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 139 | |
def istraceback(object):
    """Tell whether the object is a traceback.

    Tracebacks carry these attributes:
        tb_frame        frame object at this level
        tb_lasti        index of last attempted instruction in bytecode
        tb_lineno       current line number in Python source code
        tb_next         next inner traceback object (called by this level)"""
    traceback_type = types.TracebackType
    return isinstance(object, traceback_type)
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 149 | |
def isframe(object):
    """Tell whether the object is a frame object.

    Frames carry these attributes:
        f_back          next outer frame object (this frame's caller)
        f_builtins      built-in namespace seen by this frame
        f_code          code object being executed in this frame
        f_exc_traceback traceback if raised in this frame, or None
        f_exc_type      exception type if raised in this frame, or None
        f_exc_value     exception value if raised in this frame, or None
        f_globals       global namespace seen by this frame
        f_lasti         index of last attempted instruction in bytecode
        f_lineno        current line number in Python source code
        f_locals        local namespace seen by this frame
        f_restricted    0 or 1 if frame is in restricted execution mode
        f_trace         tracing function for this frame, or None"""
    frame_type = types.FrameType
    return isinstance(object, frame_type)
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 167 | |
def iscode(object):
    """Tell whether the object is a code object.

    Code objects carry these attributes:
        co_argcount     number of arguments (not including * or ** args)
        co_code         string of raw compiled bytecode
        co_consts       tuple of constants used in the bytecode
        co_filename     name of file in which this code object was created
        co_firstlineno  number of first line in Python source code
        co_flags        bitmap: 1=optimized | 2=newlocals | 4=*arg | 8=**arg
        co_lnotab       encoded mapping of line numbers to bytecode indices
        co_name         name with which this code object was defined
        co_names        tuple of names used by the bytecode
        co_nlocals      number of local variables
        co_stacksize    virtual machine stack space required
        co_varnames     tuple of names of arguments and local variables"""
    code_type = types.CodeType
    return isinstance(object, code_type)
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 185 | |
def isbuiltin(object):
    """Tell whether the object is a built-in function or method.

    Built-in functions and methods carry these attributes:
        __doc__         documentation string
        __name__        original name of this function or method
        __self__        instance to which a method is bound, or None"""
    builtin_type = types.BuiltinFunctionType
    return isinstance(object, builtin_type)
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 194 | |
def isroutine(object):
    """Tell whether the object is any kind of function or method."""
    # Checks run in this order and stop at the first one that succeeds.
    for check in (isbuiltin, isfunction, ismethod, ismethoddescriptor):
        if check(object):
            return True
    return False
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 201 | |
def getmembers(object, predicate=None):
    """Return all members of an object as (name, value) pairs sorted by name.

    Optionally, only return members that satisfy a given predicate: when
    predicate is given, a member is kept only if predicate(value) is true.

    Names listed by dir() whose lookup raises AttributeError are left out
    of the result instead of aborting the whole listing."""
    results = []
    for key in dir(object):
        try:
            value = getattr(object, key)
        except AttributeError:
            # dir() may advertise names that cannot actually be fetched.
            continue
        if not predicate or predicate(value):
            results.append((key, value))
    results.sort()
    return results
| 212 | |
# Record type for one classified class attribute: its name, kind,
# defining class and the object itself.
Attribute = namedtuple('Attribute',
                       ['name', 'kind', 'defining_class', 'object'])
| 214 | |
def classify_class_attrs(cls):
    """Return a list of Attribute tuples, one per name in dir(cls).

    Each entry has these four elements:

        0. The name (a string).

        1. The kind of attribute this is, one of these strings:
               'class method'    created via classmethod()
               'static method'   created via staticmethod()
               'property'        created via property()
               'method'          any other flavor of method
               'data'            not a method

        2. The class which defined this attribute (a class), or None if
           no defining class could be determined.

        3. The object as obtained directly from the defining class's
           __dict__, not via getattr.  This is especially important for
           data attributes:  C.data is just a data object, but
           C.__dict__['data'] may be a data descriptor with additional
           info, like a __doc__ string.
    """
    # Wrapper types that settle the kind as soon as the raw object matches.
    wrapper_kinds = ((staticmethod, "static method"),
                     (classmethod, "class method"),
                     (property, "property"))

    bases = getmro(cls)
    classified = []
    for name in dir(cls):
        # Prefer the raw __dict__ entry: it sometimes reveals more than
        # getattr does (static and class methods are dramatic examples).
        if name in cls.__dict__:
            raw = cls.__dict__[name]
        else:
            raw = getattr(cls, name)

        # Work out which class defined the attribute.
        owner = getattr(raw, "__objclass__", None)
        if owner is None:
            # No hint on the object itself; search the dicts along the MRO.
            for candidate in bases:
                if name in candidate.__dict__:
                    owner = candidate
                    break

        # Re-fetch from the defining class's __dict__ when possible.
        if owner is not None and name in owner.__dict__:
            raw = owner.__dict__[name]

        # The getattr view decides between plain methods and data.
        bound = getattr(cls, name)

        for wrapper, label in wrapper_kinds:
            if isinstance(raw, wrapper):
                kind = label
                break
        else:
            if ismethod(bound) or ismethoddescriptor(bound):
                kind = "method"
            else:
                kind = "data"

        classified.append(Attribute(name, kind, owner, raw))

    return classified
| 284 | |
Tim Peters | e0b2d7a | 2001-09-22 06:10:55 +0000 | [diff] [blame] | 285 | # ----------------------------------------------------------- class helpers |
def _searchbases(cls, accum):
    # Simulate the "classic class" search order: depth first, left to
    # right, recording each class only the first time it is reached.
    pending = [cls]
    while pending:
        current = pending.pop()
        if current in accum:
            continue
        accum.append(current)
        # Push the bases reversed so the leftmost base is visited next.
        bases = list(current.__bases__)
        bases.reverse()
        pending.extend(bases)

def getmro(cls):
    "Return tuple of base classes (including cls) in method resolution order."
    if not hasattr(cls, "__mro__"):
        # No precomputed order available; derive one from __bases__.
        found = []
        _searchbases(cls, found)
        return tuple(found)
    return cls.__mro__
| 302 | |
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 303 | # -------------------------------------------------- source code extraction |
def indentsize(line):
    """Return the width, in spaces, of the indentation at the start of a
    line of text, measured after tabs have been expanded."""
    expanded = line.expandtabs()
    stripped = expanded.lstrip()
    return len(expanded) - len(stripped)
| 308 | |
def getdoc(object):
    """Get the documentation string for an object.

    All tabs are expanded to spaces.  To clean up docstrings that are
    indented to line up with blocks of code, any whitespace that can be
    uniformly removed from the second line onwards is removed.

    Returns None when the object has no __doc__ attribute, when __doc__
    is not a string, or when processing it raises UnicodeError."""
    try:
        text = object.__doc__
    except AttributeError:
        return None
    # types.StringTypes names the accepted string types; str is the
    # fallback where the types module does not provide it.
    if not isinstance(text, getattr(types, 'StringTypes', str)):
        return None
    try:
        rows = text.expandtabs().split('\n')
    except UnicodeError:
        return None

    # Indentation of every non-blank line after the first one.
    indents = [len(row) - len(row.lstrip())
               for row in rows[1:] if row.lstrip()]
    # The first line is stripped on its own; the rest share one margin.
    rows[0] = rows[0].lstrip()
    if indents:
        margin = min(indents)
        rows[1:] = [row[margin:] for row in rows[1:]]
    # Drop blank lines from the end, then from the start.
    while rows and not rows[-1]:
        rows.pop()
    while rows and not rows[0]:
        rows.pop(0)
    return '\n'.join(rows)
| 344 | |
def getfile(object):
    """Work out which source or compiled file an object was defined in.

    Accepts a module, class, method, function, traceback, frame, or code
    object.  TypeError is raised for any other kind of argument, and for
    modules and classes that have no __file__ to report."""
    if ismodule(object):
        if not hasattr(object, '__file__'):
            raise TypeError('arg is a built-in module')
        return object.__file__
    if isclass(object):
        # A class reports the file of the module recorded in __module__.
        object = sys.modules.get(object.__module__)
        if not hasattr(object, '__file__'):
            raise TypeError('arg is a built-in class')
        return object.__file__
    # Peel wrappers one layer at a time until a code object is reached.
    if ismethod(object):
        object = object.im_func
    if isfunction(object):
        object = object.func_code
    if istraceback(object):
        object = object.tb_frame
    if isframe(object):
        object = object.f_code
    if not iscode(object):
        raise TypeError('arg is not a module, class, method, '
                        'function, traceback, frame, or code object')
    return object.co_filename
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 368 | |
# Record type describing a module file: module name, matched suffix,
# file mode and module type.
ModuleInfo = namedtuple('ModuleInfo',
                        ['name', 'suffix', 'mode', 'module_type'])
| 370 | |
def getmoduleinfo(path):
    """Get the module name, suffix, mode, and module type for a given file.

    Returns a ModuleInfo tuple, or None when the file name ends with none
    of the suffixes reported by imp.get_suffixes()."""
    filename = os.path.basename(path)
    # Negated lengths sort the longest suffixes first, so overlapping
    # suffixes resolve to the longest match.
    ranked = sorted([(-len(suffix), suffix, mode, mtype)
                     for suffix, mode, mtype in imp.get_suffixes()])
    for neglen, suffix, mode, mtype in ranked:
        if filename[neglen:] == suffix:
            return ModuleInfo(filename[:neglen], suffix, mode, mtype)
    return None
Ka-Ping Yee | 4d6fc7f | 2001-04-10 11:43:00 +0000 | [diff] [blame] | 380 | |
def getmodulename(path):
    """Return the module name for a given file, or None."""
    info = getmoduleinfo(path)
    if not info:
        return None
    # The module name is the first field of the info tuple.
    return info[0]
| 385 | |
def getsourcefile(object):
    """Return the Python source file an object was defined in, if it exists.

    Returns None when the file looks like a binary module, or when the
    source file is missing and the owning module has no __loader__."""
    filename = getfile(object)
    if filename[-4:].lower() in ('.pyc', '.pyo'):
        # Point at the .py file next to the compiled file.
        filename = filename[:-4] + '.py'
    for suffix, mode, kind in imp.get_suffixes():
        binary = 'b' in mode
        if binary and filename[-len(suffix):].lower() == suffix:
            # Looks like a binary file.  We want to only return a text file.
            return None
    if os.path.exists(filename):
        return filename
    # only return a non-existent filename if the module has a PEP 302 loader
    if hasattr(getmodule(object, filename), '__loader__'):
        return filename
    return None
| 400 | |
def getabsfile(object, _filename=None):
    """Return an absolute path to the source or compiled file for an object.

    The idea is for each object to have a unique origin, so the result is
    normalized as much as possible.  When _filename is given it is used
    as the file name instead of being looked up from the object."""
    if _filename is None:
        _filename = getsourcefile(object) or getfile(object)
    absolute = os.path.abspath(_filename)
    return os.path.normcase(absolute)
Ka-Ping Yee | c113c24 | 2001-03-02 02:08:53 +0000 | [diff] [blame] | 409 | |
# Cache used by getmodule(): normalized file path -> name of the module
# loaded from that file.
modulesbyfile = dict()
# Cache used by getmodule(): module name -> the __file__ value last
# recorded for that module.
_filesbymodname = dict()
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 412 | |
def getmodule(object, _filename=None):
    """Return the module an object was defined in, or None if not found.

    The lookup tries, in order: the object itself (if it is a module),
    its __module__ attribute, the file-name caches, a rescan of
    sys.modules, and finally identity checks against same-named
    attributes of __main__ and __builtin__."""
    if ismodule(object):
        return object
    if hasattr(object, '__module__'):
        return sys.modules.get(object.__module__)

    # Try the filename to modulename cache
    if _filename is not None and _filename in modulesbyfile:
        return sys.modules.get(modulesbyfile[_filename])

    # Try the cache again with the absolute file name
    try:
        abspath = getabsfile(object, _filename)
    except TypeError:
        return None
    if abspath in modulesbyfile:
        return sys.modules.get(modulesbyfile[abspath])

    # Update the filename to module name cache and check yet again
    # Copy sys.modules in order to cope with changes while iterating
    for modname, module in sys.modules.items():
        if not (ismodule(module) and hasattr(module, '__file__')):
            continue
        recorded = module.__file__
        if recorded == _filesbymodname.get(modname, None):
            # Have already mapped this module, so skip it
            continue
        _filesbymodname[modname] = recorded
        location = getabsfile(module)
        # Always map to the name the module knows itself by
        known_name = module.__name__
        modulesbyfile[location] = known_name
        modulesbyfile[os.path.realpath(location)] = known_name
    if abspath in modulesbyfile:
        return sys.modules.get(modulesbyfile[abspath])

    # Check the main module
    main = sys.modules['__main__']
    if not hasattr(object, '__name__'):
        return None
    if (hasattr(main, object.__name__)
            and getattr(main, object.__name__) is object):
        return main

    # Check builtins
    builtin = sys.modules['__builtin__']
    if (hasattr(builtin, object.__name__)
            and getattr(builtin, object.__name__) is object):
        return builtin
    return None
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 458 | |
def findsource(object):
    """Return the entire source file and starting line number for an object.

    The argument may be a module, class, method, function, traceback, frame,
    or code object.  The source code is returned as a list of all the lines
    in the file and the line number indexes a line in that list.  An IOError
    is raised if the source code cannot be retrieved, including when the
    object's recorded first line lies beyond the end of the source that was
    found."""
    file = getsourcefile(object) or getfile(object)
    module = getmodule(object, file)
    if module:
        # Passing the module globals to linecache.getlines().
        lines = linecache.getlines(file, module.__dict__)
    else:
        lines = linecache.getlines(file)
    if not lines:
        raise IOError('could not get source code')

    if ismodule(object):
        return lines, 0

    if isclass(object):
        name = object.__name__
        pat = re.compile(r'^(\s*)class\s*' + name + r'\b')
        # make some effort to find the best matching class definition:
        # use the one with the least indentation, which is the one
        # that's most probably not inside a function definition.
        candidates = []
        for i, line in enumerate(lines):
            match = pat.match(line)
            if match:
                # if it's at toplevel, it's already the best one
                if line[0] == 'c':
                    return lines, i
                # else add whitespace to candidate list
                candidates.append((match.group(1), i))
        if candidates:
            # this will sort by whitespace, and by line number,
            # less whitespace first
            candidates.sort()
            return lines, candidates[0][1]
        else:
            raise IOError('could not find class definition')

    if ismethod(object):
        object = object.im_func
    if isfunction(object):
        object = object.func_code
    if istraceback(object):
        object = object.tb_frame
    if isframe(object):
        object = object.f_code
    if iscode(object):
        if not hasattr(object, 'co_firstlineno'):
            raise IOError('could not find function definition')
        lnum = object.co_firstlineno - 1
        if lnum >= len(lines):
            # The recorded line is past the end of the source we found;
            # report it as IOError instead of failing with IndexError below.
            raise IOError('lineno is out of bounds')
        pat = re.compile(r'^(\s*def\s)|(.*(?<!\w)lambda(:|\s))|^(\s*@)')
        # Walk backwards to the nearest line that starts a def, contains
        # a lambda, or starts a decorator.
        while lnum > 0:
            if pat.match(lines[lnum]):
                break
            lnum = lnum - 1
        return lines, lnum
    raise IOError('could not find code object')
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 519 | |
def getcomments(object):
    """Return the comment block that sits directly above an object's source.

    For a module this is the first run of '#' lines at the top of the file
    (after an optional '#!' line and any blank or bare-'#' lines).  For any
    other object it is the run of comment lines immediately preceding the
    object's first line at the same indentation.

    Returns None when the source can't be found or no such comment exists.
    """
    try:
        lines, lnum = findsource(object)
    except (IOError, TypeError):
        return None

    if ismodule(object):
        # Look for a comment block at the top of the file.
        total = len(lines)
        first = 0
        if lines and lines[0].startswith('#!'):
            first = 1
        while first < total and lines[first].strip() in ('', '#'):
            first += 1
        if first < total and lines[first].startswith('#'):
            block = []
            for text in lines[first:]:
                if not text.startswith('#'):
                    break
                block.append(text.expandtabs())
            return ''.join(block)
        return None

    if lnum <= 0:
        return None

    # Walk upwards from the line just above the object, collecting comment
    # lines for as long as they share the object's indentation.
    indent = indentsize(lines[lnum])
    collected = []
    pos = lnum - 1
    while pos >= 0:
        stripped = lines[pos].expandtabs().lstrip()
        if stripped[:1] != '#' or indentsize(lines[pos]) != indent:
            break
        collected.insert(0, stripped)
        pos -= 1
    if not collected:
        return None

    # Drop bare '#' lines from both ends of the block.
    while collected and collected[0].strip() == '#':
        del collected[0]
    while collected and collected[-1].strip() == '#':
        del collected[-1]
    return ''.join(collected)
| 564 | |
class EndOfBlock(Exception):
    """Raised by BlockFinder.tokeneater() once the end of a block is seen."""
| 566 | |
class BlockFinder:
    """Provide a tokeneater() method to detect the end of a code block.

    State kept between tokens:
      indent   -- current INDENT/DEDENT nesting depth
      islambda -- true once the block turned out to start with "lambda"
      started  -- true once the first "def", "class" or "lambda" was seen
      passline -- true while the rest of the current line is being skipped
      last     -- row of the most recent NEWLINE seen after the block started
    """
    def __init__(self):
        self.indent = 0
        self.islambda = False
        self.started = False
        self.passline = False
        self.last = 1

    def tokeneater(self, type, token, start, end, line):
        """Consume one token; raise EndOfBlock when the block is finished.

        The arguments are the five fields of a tokenize token: the token
        type, the token string, the (row, col) start and end positions and
        the physical line.  Only the start row is actually used.

        'start' and 'end' are plain parameters rather than unpacked tuple
        parameters, because tuple-parameter unpacking was removed by
        PEP 3113; positional callers are unaffected.
        """
        srow = start[0]
        if not self.started:
            # look for the first "def", "class" or "lambda"
            if token in ("def", "class", "lambda"):
                if token == "lambda":
                    self.islambda = True
                self.started = True
            self.passline = True    # skip to the end of the line
        elif type == tokenize.NEWLINE:
            self.passline = False   # stop skipping when a NEWLINE is seen
            self.last = srow
            if self.islambda:       # lambdas always end at the first NEWLINE
                raise EndOfBlock
        elif self.passline:
            pass
        elif type == tokenize.INDENT:
            self.indent = self.indent + 1
            self.passline = True
        elif type == tokenize.DEDENT:
            self.indent = self.indent - 1
            # the end of matching indent/dedent pairs end a block
            # (note that this only works for "def"/"class" blocks,
            #  not e.g. for "if: else:" or "try: finally:" blocks)
            if self.indent <= 0:
                raise EndOfBlock
        elif self.indent == 0 and type not in (tokenize.COMMENT, tokenize.NL):
            # any other token on the same indentation level end the previous
            # block as well, except the pseudo-tokens COMMENT and NL.
            raise EndOfBlock
Tim Peters | 4efb6e9 | 2001-06-29 23:51:08 +0000 | [diff] [blame] | 605 | |
def getblock(lines):
    """Return the leading lines that make up the first code block in 'lines'.

    The lines are fed through the tokenizer into a BlockFinder; tokenizing
    stops when it signals EndOfBlock (or an IndentationError occurs) and
    everything up to the last row it recorded is returned."""
    finder = BlockFinder()
    readline = iter(lines).next
    try:
        tokenize.tokenize(readline, finder.tokeneater)
    except (EndOfBlock, IndentationError):
        pass
    return lines[:finder.last]
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 614 | |
def getsourcelines(object):
    """Return (list of source lines, starting line number) for an object.

    The argument may be a module, class, method, function, traceback, frame,
    or code object.  For a module the whole file is returned with a line
    number of 0; otherwise only the lines of the object's block are returned
    together with the 1-based number of its first line in the source file.
    An IOError is raised if the source code cannot be retrieved."""
    lines, lnum = findsource(object)
    if ismodule(object):
        return lines, 0
    block = getblock(lines[lnum:])
    return block, lnum + 1
| 627 | |
def getsource(object):
    """Return the source code of an object as one string.

    The argument may be a module, class, method, function, traceback, frame,
    or code object.  The lines found by getsourcelines() are concatenated
    unchanged.  An IOError is raised if the source code cannot be
    retrieved."""
    source_lines = getsourcelines(object)[0]
    return ''.join(source_lines)
| 636 | |
| 637 | # --------------------------------------------------- class tree extraction |
def walktree(classes, children, parent):
    """Recursive helper function for getclasstree().

    Sorts 'classes' in place by (module, name) and returns a list holding a
    (class, bases) tuple for each class, each followed by a nested list for
    its entry in 'children' when it has one.  'parent' is accepted but not
    consulted."""
    classes.sort(key=attrgetter('__module__', '__name__'))
    tree = []
    for klass in classes:
        tree.append((klass, klass.__bases__))
        if klass in children:
            subtree = walktree(children[klass], children, klass)
            tree.append(subtree)
    return tree
| 647 | |
def getclasstree(classes, unique=0):
    """Arrange the given list of classes into a hierarchy of nested lists.

    Where a nested list appears, it contains classes derived from the class
    whose entry immediately precedes the list.  Each entry is a 2-tuple
    containing a class and a tuple of its base classes.  If the 'unique'
    argument is true, exactly one entry appears in the returned structure
    for each class in the given list.  Otherwise, classes using multiple
    inheritance and their descendants will appear multiple times.

    A class that occurs more than once in 'classes' is only recorded once
    under each of its parents."""
    children = {}
    roots = []
    for c in classes:
        if c.__bases__:
            for parent in c.__bases__:
                derived = children.setdefault(parent, [])
                # Guard against duplicates in the input list; without this
                # a repeated class would show up repeatedly in the tree.
                if c not in derived:
                    derived.append(c)
                if unique and parent in classes: break
        elif c not in roots:
            roots.append(c)
    # Parents that were not themselves passed in become additional roots.
    for parent in children:
        if parent not in classes:
            roots.append(parent)
    return walktree(roots, children, None)
| 672 | |
| 673 | # ------------------------------------------------ argument list extraction |
| 674 | # These constants are from Python's compile.h. |
# Bit masks for code-object flags; getargs() tests CO_VARARGS and
# CO_VARKEYWORDS against co_flags.
CO_OPTIMIZED = 1
CO_NEWLOCALS = 2
CO_VARARGS = 4
CO_VARKEYWORDS = 8
| 676 | |
# Result type of getargs(); note the third field is called 'keywords'.
Arguments = namedtuple('Arguments', 'args varargs keywords')

def getargs(co):
    """Get information about the arguments accepted by a code object.

    Three things are returned: (args, varargs, varkw), where 'args' is
    a list of argument names (possibly containing nested lists), and
    'varargs' and 'varkw' are the names of the * and ** arguments or None.

    The result is an Arguments named tuple whose fields are named
    args, varargs and keywords.  A TypeError is raised if 'co' is not a
    code object."""

    if not iscode(co):
        raise TypeError('arg is not a code object')

    nargs = co.co_argcount
    names = co.co_varnames
    args = list(names[:nargs])
    # Offset into co.co_code.  It is deliberately not reset between
    # arguments: each tuple argument resumes scanning where the previous
    # one stopped.
    step = 0

    # The following acrobatics are for anonymous (tuple) arguments.
    for i in range(nargs):
        # Placeholder names are empty or start with '.'; the real names are
        # recovered from the bytecode that unpacks the tuple.
        if args[i][:1] in ('', '.'):
            # stack:  names (and nested lists of names) collected so far
            # remain: for each open tuple, how many items are still expected
            # count:  for each open tuple, its total size
            stack, remain, count = [], [], []
            while step < len(co.co_code):
                op = ord(co.co_code[step])
                step = step + 1
                if op >= dis.HAVE_ARGUMENT:
                    opname = dis.opname[op]
                    # Two-byte operand, low byte first.
                    value = ord(co.co_code[step]) + ord(co.co_code[step+1])*256
                    step = step + 2
                    if opname in ('UNPACK_TUPLE', 'UNPACK_SEQUENCE'):
                        remain.append(value)
                        count.append(value)
                    elif opname == 'STORE_FAST':
                        stack.append(names[value])

                        # Special case for sublists of length 1: def foo((bar))
                        # doesn't generate the UNPACK_TUPLE bytecode, so if
                        # `remain` is empty here, we have such a sublist.
                        if not remain:
                            stack[0] = [stack[0]]
                            break
                        else:
                            remain[-1] = remain[-1] - 1
                            # Close every tuple that just received its last
                            # item, folding its names into one nested list.
                            while remain[-1] == 0:
                                remain.pop()
                                size = count.pop()
                                stack[-size:] = [stack[-size:]]
                                if not remain: break
                                remain[-1] = remain[-1] - 1
                            if not remain: break
            args[i] = stack[0]

    # The * and ** names, when present, follow the positional arguments in
    # co_varnames, in that order.
    varargs = None
    if co.co_flags & CO_VARARGS:
        varargs = co.co_varnames[nargs]
        nargs = nargs + 1
    varkw = None
    if co.co_flags & CO_VARKEYWORDS:
        varkw = co.co_varnames[nargs]
    return Arguments(args, varargs, varkw)
| 736 | |
ArgSpec = namedtuple('ArgSpec', 'args varargs keywords defaults')

def getargspec(func):
    """Describe the arguments of a Python function or method.

    Returns an ArgSpec named tuple (args, varargs, keywords, defaults).
    'args' is a list of the argument names (it may contain nested lists).
    'varargs' and 'keywords' are the names of the * and ** arguments or None.
    'defaults' is the function's func_defaults: an n-tuple of the default
    values of the last n arguments.

    A bound or unbound method is unwrapped to its underlying function first;
    a TypeError is raised if the result is not a Python function.
    """
    target = func.im_func if ismethod(func) else func
    if not isfunction(target):
        raise TypeError('arg is not a Python function')
    args, varargs, varkw = getargs(target.func_code)
    return ArgSpec(args=args, varargs=varargs, keywords=varkw,
                   defaults=target.func_defaults)
| 754 | |
ArgInfo = namedtuple('ArgInfo', 'args varargs keywords locals')

def getargvalues(frame):
    """Get information about arguments passed into a particular frame.

    An ArgInfo named tuple of four things is returned:
    (args, varargs, keywords, locals).
    'args' is a list of the argument names (it may contain nested lists).
    'varargs' and 'keywords' are the names of the * and ** arguments or None.
    'locals' is the locals dictionary of the given frame.

    ArgInfo is a tuple subclass, so callers that unpack or index the
    result as a plain 4-tuple keep working."""
    args, varargs, varkw = getargs(frame.f_code)
    return ArgInfo(args, varargs, varkw, frame.f_locals)
| 766 | |
def joinseq(seq):
    """Format a sequence of strings like a tuple display.

    A single item gets a trailing comma, as in '(a,)'; any other length is
    joined with ', ' inside parentheses."""
    if len(seq) != 1:
        return '(' + ', '.join(seq) + ')'
    return '(' + seq[0] + ',)'
| 772 | |
def strseq(object, convert, join=joinseq):
    """Recursively stringify a possibly nested list/tuple structure.

    Anything whose type is exactly list or tuple is walked element by
    element and the pieces are combined with 'join'; every other value is
    passed to 'convert'."""
    if type(object) not in (list, tuple):
        return convert(object)
    pieces = [strseq(element, convert, join) for element in object]
    return join(pieces)
| 779 | |
def formatargspec(args, varargs=None, varkw=None, defaults=None,
                  formatarg=str,
                  formatvarargs=lambda name: '*' + name,
                  formatvarkw=lambda name: '**' + name,
                  formatvalue=lambda value: '=' + repr(value),
                  join=joinseq):
    """Build a parenthesized argument list from getargspec()'s 4 values.

    The first four arguments are (args, varargs, varkw, defaults).  The
    next four are optional formatting functions that turn argument names,
    the * name, the ** name and default values into strings.  The ninth
    argument is an optional function to format a nested sequence of
    arguments."""
    if defaults:
        # Defaults belong to the trailing arguments.
        firstdefault = len(args) - len(defaults)
    pieces = []
    for position, arg in enumerate(args):
        text = strseq(arg, formatarg, join)
        if defaults and position >= firstdefault:
            text = text + formatvalue(defaults[position - firstdefault])
        pieces.append(text)
    if varargs is not None:
        pieces.append(formatvarargs(varargs))
    if varkw is not None:
        pieces.append(formatvarkw(varkw))
    return '(' + ', '.join(pieces) + ')'
| 805 | |
def formatargvalues(args, varargs, varkw, locals,
                    formatarg=str,
                    formatvarargs=lambda name: '*' + name,
                    formatvarkw=lambda name: '**' + name,
                    formatvalue=lambda value: '=' + repr(value),
                    join=joinseq):
    """Build a parenthesized name=value list from getargvalues()'s 4 values.

    The first four arguments are (args, varargs, varkw, locals).  The
    next four are optional formatting functions that turn argument names,
    the * name, the ** name and values into strings.  The ninth argument
    is an optional function to format a nested sequence of arguments.
    Each value is looked up by name in 'locals'."""
    def render(name):
        # Format one plain argument name together with its current value.
        return formatarg(name) + formatvalue(locals[name])

    pieces = [strseq(arg, render, join) for arg in args]
    if varargs:
        pieces.append(formatvarargs(varargs) + formatvalue(locals[varargs]))
    if varkw:
        pieces.append(formatvarkw(varkw) + formatvalue(locals[varkw]))
    return '(' + ', '.join(pieces) + ')'
| 829 | |
| 830 | # -------------------------------------------------- stack frame extraction |
Raymond Hettinger | e896acc | 2008-01-11 03:04:50 +0000 | [diff] [blame] | 831 | |
Traceback = namedtuple('Traceback', 'filename lineno function code_context index')

def getframeinfo(frame, context=1):
    """Get information about a frame or traceback object.

    A Traceback named tuple of five things is returned: the filename, the
    line number of the current line, the function name, a list of lines of
    context from the source code, and the index of the current line within
    that list.  The optional second argument specifies the number of lines
    of context to return, which are centered around the current line.

    The context list and index are both None when 'context' is not
    positive or the source cannot be found.  A TypeError is raised if
    'frame' is neither a frame nor a traceback object."""
    tb = None
    if istraceback(frame):
        tb, frame = frame, frame.tb_frame
    # Validate before touching f_lineno so that a wrong argument raises the
    # documented TypeError rather than an AttributeError.
    if not isframe(frame):
        raise TypeError('arg is not a frame or traceback object')
    if tb is not None:
        lineno = tb.tb_lineno
    else:
        lineno = frame.f_lineno

    filename = getsourcefile(frame) or getfile(frame)
    if context > 0:
        start = lineno - 1 - context//2
        try:
            lines, lnum = findsource(frame)
        except IOError:
            lines = index = None
        else:
            # Clamp the window to the file.  The lower bound is 0, not 1:
            # forcing start >= 1 made the window skip the first source line
            # and produced index == -1 for a frame executing on line 1.
            start = max(0, min(start, len(lines) - context))
            lines = lines[start:start+context]
            index = lineno - 1 - start
    else:
        lines = index = None

    return Traceback(filename, lineno, frame.f_code.co_name, lines, index)
Ka-Ping Yee | 59ade08 | 2001-03-01 03:55:35 +0000 | [diff] [blame] | 866 | |
def getlineno(frame):
    """Return the current line number of a frame object."""
    # FrameType.f_lineno is now a descriptor that grovels co_lnotab, so
    # reading the attribute is all that is needed.
    current = frame.f_lineno
    return current
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 871 | |
def getouterframes(frame, context=1):
    """List records for a frame and each of its callers, innermost first.

    The chain is followed through f_back.  Each record contains a frame
    object, filename, line number, function name, a list of lines of
    context, and index within the context."""
    records = []
    current = frame
    while current:
        info = getframeinfo(current, context)
        records.append((current,) + info)
        current = current.f_back
    return records
| 882 | |
def getinnerframes(tb, context=1):
    """List records for a traceback's frame and every frame below it.

    The chain is followed through tb_next.  Each record contains a frame
    object, filename, line number, function name, a list of lines of
    context, and index within the context."""
    records = []
    entry = tb
    while entry:
        owner = entry.tb_frame
        info = getframeinfo(entry, context)
        records.append((owner,) + info)
        entry = entry.tb_next
    return records
| 893 | |
# currentframe is a direct alias, so calling it adds no extra frame.
currentframe = sys._getframe

def stack(context=1):
    """Return a list of records for the stack above the caller's frame."""
    # Depth 1 skips this function's own frame and starts at the caller.
    caller = sys._getframe(1)
    return getouterframes(caller, context)
Ka-Ping Yee | 6397c7c | 2001-02-27 14:43:21 +0000 | [diff] [blame] | 899 | |
def trace(context=1):
    """Return a list of records for the stack below the current exception."""
    # The third item of sys.exc_info() is the traceback object.
    tb = sys.exc_info()[2]
    return getinnerframes(tb, context)