Guido van Rossum | 421c224 | 1997-11-18 15:47:55 +0000 | [diff] [blame] | 1 | """Disassembler of Python byte code into mnemonics.""" |
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 2 | |
| 3 | import sys |
Guido van Rossum | 18aef3c | 1997-03-14 04:15:43 +0000 | [diff] [blame] | 4 | import types |
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 5 | |
Skip Montanaro | 19c6ba3 | 2003-02-27 21:29:27 +0000 | [diff] [blame] | 6 | from opcode import * |
| 7 | from opcode import __all__ as _opcodes_all |
| 8 | |
| 9 | __all__ = ["dis","disassemble","distb","disco"] + _opcodes_all |
| 10 | del _opcodes_all |
Skip Montanaro | e99d5ea | 2001-01-20 19:54:20 +0000 | [diff] [blame] | 11 | |
def dis(x=None):
    """Disassemble classes, methods, functions, or code.

    With no argument, disassemble the last traceback.

    Dispatch, in order:
      * bound methods are unwrapped to their function, and functions to
        their code object;
      * anything that still has a ``__dict__`` (e.g. a class or module) has
        each method, function, code object or class found in it
        disassembled in turn, sorted by name;
      * objects with a ``co_code`` attribute go to disassemble();
      * raw bytecode (bytes, bytearray or str) goes to disassemble_string().

    Raises TypeError for any other kind of object.

    """
    if x is None:
        distb()
        return
    # Unwrap a bound method.  '__func__' is the Python 3 spelling; the old
    # 'im_func' name is still honoured for objects that provide it.
    for attr in ('__func__', 'im_func'):
        if hasattr(x, attr):
            x = getattr(x, attr)
            break
    if hasattr(x, '__code__'):
        x = x.__code__
    if hasattr(x, '__dict__'):
        # dict.items() is a view in Python 3 and has no sort() method.
        for name, x1 in sorted(x.__dict__.items()):
            if isinstance(x1, (types.MethodType,
                               types.FunctionType,
                               types.CodeType,
                               type)):
                print("Disassembly of %s:" % name)
                try:
                    dis(x1)
                except TypeError as msg:
                    # Best effort: report and carry on with the next member.
                    print("Sorry:", msg)
                print()
    elif hasattr(x, 'co_code'):
        disassemble(x)
    elif isinstance(x, (bytes, bytearray, str)):
        disassemble_string(x)
    else:
        raise TypeError("don't know how to disassemble %s objects" %
                        type(x).__name__)
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 47 | |
def distb(tb=None):
    """Disassemble a traceback (default: last traceback).

    When *tb* is omitted, sys.last_traceback is used and followed through
    its tb_next links to the last entry.  An explicitly supplied traceback
    entry is disassembled as given.  The instruction at tb_lasti is passed
    to disassemble() as the "current" one.

    Raises RuntimeError if *tb* is omitted and sys.last_traceback is not set.

    """
    if tb is None:
        try:
            tb = sys.last_traceback
        except AttributeError:
            # The AttributeError is an implementation detail; hide it.
            raise RuntimeError("no last traceback to disassemble") from None
        while tb.tb_next:
            tb = tb.tb_next
    disassemble(tb.tb_frame.f_code, tb.tb_lasti)
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 57 | |
# XXX This duplicates information from code.h, also duplicated in inspect.py.
# XXX Maybe this ought to be put in a central location, like opcode.py?
# Maps each single-bit code-object flag value to its display name.
flag2name = {
     1: "OPTIMIZED",
     2: "NEWLOCALS",
     4: "VARARGS",
     8: "VARKEYWORDS",
    16: "NESTED",
    32: "GENERATOR",
    64: "NOFREE",
}

def pretty_flags(flags):
    """Return pretty representation of code flags.

    Each set bit among the low 32 is rendered by its name from flag2name,
    or as a hex literal when the bit has no name; the pieces are joined
    with ", ".  Whatever is left after those 32 bits have been examined
    (including a value of 0, which never triggers the early exit) is
    appended as a single hex literal.

    """
    names = []
    for i in range(32):
        flag = 1 << i
        if flags & flag:
            names.append(flag2name.get(flag, hex(flag)))
            flags ^= flag
            if not flags:
                # Every set bit has been reported; stop early.
                break
    else:
        # Loop ran to completion: report the unconsumed remainder.
        names.append(hex(flags))
    return ", ".join(names)
| 83 | |
def show_code(co):
    """Show details about a code object.

    Prints a summary (name, filename, argument counts, number of locals,
    stack size and decoded flags) with the values aligned in one column,
    followed by an indexed listing of each non-empty table: constants,
    names, variable names, free variables and cell variables.

    """
    summary = (
        ("Name:", co.co_name),
        ("Filename:", co.co_filename),
        ("Argument count:", co.co_argcount),
        ("Kw-only arguments:", co.co_kwonlyargcount),
        ("Number of locals:", co.co_nlocals),
        ("Stack size:", co.co_stacksize),
        ("Flags:", pretty_flags(co.co_flags)),
    )
    # Pad every label to the longest one so the values line up.
    width = max(len(label) for label, _ in summary)
    for label, value in summary:
        print(label.ljust(width), value)

    # Constants are shown with repr(); the name tables hold plain strings.
    tables = (
        ("Constants:", co.co_consts, "%4d: %r"),
        ("Names:", co.co_names, "%4d: %s"),
        ("Variable names:", co.co_varnames, "%4d: %s"),
        ("Free variables:", co.co_freevars, "%4d: %s"),
        ("Cell variables:", co.co_cellvars, "%4d: %s"),
    )
    for title, entries, fmt in tables:
        if entries:
            print(title)
            for numbered in enumerate(entries):
                print(fmt % numbered)
| 113 | |
def disassemble(co, lasti=-1):
    """Disassemble a code object.

    Prints one line per instruction with these columns: the source line
    number (only on the first instruction of a line, preceded by a blank
    line except at offset 0), a '-->' marker on the instruction at offset
    *lasti*, a '>>' marker on jump targets, the byte offset, the opcode
    name, and -- for opcodes that take one -- the numeric argument
    followed by its meaning in parentheses.

    The bytecode is read as a one-byte opcode followed, when the opcode is
    >= HAVE_ARGUMENT, by a two-byte little-endian argument.

    """
    code = co.co_code
    if isinstance(code, str):
        # Indexing bytes yields ints directly; map a str one char per byte.
        code = code.encode('latin-1')
    labels = set(findlabels(code))
    linestarts = dict(findlinestarts(co))
    n = len(code)
    i = 0
    extended_arg = 0
    free = None         # cell + free variable names, built on first use
    while i < n:
        op = code[i]
        if i in linestarts:
            if i > 0:
                print()
            print("%3d" % linestarts[i], end=' ')
        else:
            # Filler as wide as the "%3d" line-number column.
            print('   ', end=' ')

        print('-->' if i == lasti else '   ', end=' ')
        print('>>' if i in labels else '  ', end=' ')
        print(repr(i).rjust(4), end=' ')
        print(opname[op].ljust(20), end=' ')
        i = i+1
        if op >= HAVE_ARGUMENT:
            oparg = code[i] + code[i+1]*256 + extended_arg
            extended_arg = 0
            i = i+2
            if op == EXTENDED_ARG:
                # Supplies the high bits of the next instruction's argument.
                extended_arg = oparg*65536
            print(repr(oparg).rjust(5), end=' ')
            if op in hasconst:
                print('(' + repr(co.co_consts[oparg]) + ')', end=' ')
            elif op in hasname:
                print('(' + co.co_names[oparg] + ')', end=' ')
            elif op in hasjrel:
                # Relative jumps are measured from the next instruction.
                print('(to ' + repr(i + oparg) + ')', end=' ')
            elif op in haslocal:
                print('(' + co.co_varnames[oparg] + ')', end=' ')
            elif op in hascompare:
                print('(' + cmp_op[oparg] + ')', end=' ')
            elif op in hasfree:
                if free is None:
                    free = co.co_cellvars + co.co_freevars
                print('(' + free[oparg] + ')', end=' ')
        print()
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 162 | |
def disassemble_string(code, lasti=-1, varnames=None, names=None,
                       constants=None):
    """Disassemble a raw bytecode string that has no code object.

    *code* is the bytecode itself (bytes, bytearray, or a str holding one
    character per byte).  The optional *varnames*, *names* and *constants*
    sequences are used to show what an argument refers to; when one is not
    supplied the bare index is shown in parentheses instead.  The
    instruction at offset *lasti* is marked with '-->' and jump targets
    with '>>'.

    The bytecode is read as a one-byte opcode followed, when the opcode is
    >= HAVE_ARGUMENT, by a two-byte little-endian argument.

    """
    if isinstance(code, str):
        # Indexing bytes yields ints directly; map a str one char per byte.
        code = code.encode('latin-1')
    labels = set(findlabels(code))
    n = len(code)
    i = 0
    while i < n:
        op = code[i]
        print('-->' if i == lasti else '   ', end=' ')
        print('>>' if i in labels else '  ', end=' ')
        print(repr(i).rjust(4), end=' ')
        print(opname[op].ljust(15), end=' ')
        i = i+1
        if op >= HAVE_ARGUMENT:
            oparg = code[i] + code[i+1]*256
            i = i+2
            print(repr(oparg).rjust(5), end=' ')
            if op in hasconst:
                if constants:
                    print('(' + repr(constants[oparg]) + ')', end=' ')
                else:
                    print('(%d)'%oparg, end=' ')
            elif op in hasname:
                if names is not None:
                    print('(' + names[oparg] + ')', end=' ')
                else:
                    print('(%d)'%oparg, end=' ')
            elif op in hasjrel:
                # Relative jumps are measured from the next instruction.
                print('(to ' + repr(i + oparg) + ')', end=' ')
            elif op in haslocal:
                if varnames:
                    print('(' + varnames[oparg] + ')', end=' ')
                else:
                    print('(%d)' % oparg, end=' ')
            elif op in hascompare:
                print('(' + cmp_op[oparg] + ')', end=' ')
        print()
Skip Montanaro | 19c6ba3 | 2003-02-27 21:29:27 +0000 | [diff] [blame] | 202 | |
disco = disassemble                     # XXX For backwards compatibility
Guido van Rossum | bd30795 | 1997-01-17 20:05:04 +0000 | [diff] [blame] | 204 | |
def findlabels(code):
    """Detect all offsets in a byte code which are jump targets.

    *code* is raw bytecode (bytes, bytearray, or a str holding one
    character per byte), read as a one-byte opcode followed, when the
    opcode is >= HAVE_ARGUMENT, by a two-byte little-endian argument.

    Return the list of offsets, each listed once, in the order the jumps
    that reference them appear in the bytecode.

    """
    if isinstance(code, str):
        # Indexing bytes yields ints directly; map a str one char per byte.
        code = code.encode('latin-1')
    labels = []
    seen = set()        # constant-time duplicate check; the list keeps order
    n = len(code)
    i = 0
    while i < n:
        op = code[i]
        i = i+1
        if op >= HAVE_ARGUMENT:
            oparg = code[i] + code[i+1]*256
            i = i+2
            if op in hasjrel:
                # Relative jumps are measured from the next instruction.
                label = i+oparg
            elif op in hasjabs:
                label = oparg
            else:
                continue
            if label not in seen:
                seen.add(label)
                labels.append(label)
    return labels
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 230 | |
def findlinestarts(code):
    """Find the offsets in a byte code which are start of lines in the source.

    Generate pairs (offset, lineno) as described in Python/compile.c.

    *code* must provide co_lnotab -- alternating (bytecode increment, line
    increment) byte values -- and co_firstlineno.  A pair is produced only
    when the bytecode offset has advanced and the line number differs from
    the last one reported, so entries with a zero bytecode increment just
    accumulate their line increment.

    """
    lnotab = code.co_lnotab
    if isinstance(lnotab, str):
        # Indexing bytes yields ints directly; map a str one char per byte.
        lnotab = lnotab.encode('latin-1')
    byte_increments = lnotab[0::2]
    line_increments = lnotab[1::2]

    lastlineno = None
    lineno = code.co_firstlineno
    addr = 0
    for byte_incr, line_incr in zip(byte_increments, line_increments):
        if byte_incr:
            if lineno != lastlineno:
                yield (addr, lineno)
                lastlineno = lineno
            addr += byte_incr
        lineno += line_incr
    # The line reached by the final table entry has not been reported yet.
    if lineno != lastlineno:
        yield (addr, lineno)
Guido van Rossum | 1fdae12 | 2000-02-04 17:47:55 +0000 | [diff] [blame] | 252 | |
def _test():
    """Simple test program to disassemble a file.

    Reads Python source from the file named by the single command-line
    argument, or from standard input when the argument is missing, empty
    or "-", compiles it and disassembles the result.  With more than one
    argument, prints a usage message to stderr and exits with status 2.

    """
    if sys.argv[1:]:
        if sys.argv[2:]:
            sys.stderr.write("usage: python dis.py [-|file]\n")
            sys.exit(2)
        fn = sys.argv[1]
        if not fn or fn == "-":
            fn = None
    else:
        fn = None
    if fn is None:
        source = sys.stdin.read()
        fn = "<stdin>"
    else:
        # 'with' closes the file even if reading it fails.
        with open(fn) as f:
            source = f.read()
    code = compile(source, fn, "exec")
    dis(code)

if __name__ == "__main__":
    _test()