Guido van Rossum | 421c224 | 1997-11-18 15:47:55 +0000 | [diff] [blame] | 1 | """Disassembler of Python byte code into mnemonics.""" |
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 2 | |
| 3 | import sys |
Guido van Rossum | 18aef3c | 1997-03-14 04:15:43 +0000 | [diff] [blame] | 4 | import types |
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 5 | |
Skip Montanaro | 19c6ba3 | 2003-02-27 21:29:27 +0000 | [diff] [blame] | 6 | from opcode import * |
| 7 | from opcode import __all__ as _opcodes_all |
| 8 | |
# Public API: this module's own entry points plus every name that the
# opcode module exports (those names are re-exported via the star import).
__all__ = ["dis","disassemble","distb","disco"] + _opcodes_all
# The alias was only needed to build __all__; remove it from the namespace.
del _opcodes_all
Skip Montanaro | e99d5ea | 2001-01-20 19:54:20 +0000 | [diff] [blame] | 11 | |
def dis(x=None):
    """Disassemble classes, methods, functions, or code.

    With no argument, disassemble the last traceback.

    Objects exposing __func__ and/or __code__ are unwrapped first.  An
    object that has a __dict__ gets each of its method, function, code
    and class members disassembled in sorted name order.  Code objects
    and raw bytes/bytearray byte code are disassembled directly.
    Anything else raises TypeError.

    """
    if x is None:
        distb()
        return

    # Peel off wrappers: bound method -> function -> code object.
    x = getattr(x, '__func__', x)
    x = getattr(x, '__code__', x)

    if hasattr(x, '__dict__'):
        wanted = (types.MethodType, types.FunctionType,
                  types.CodeType, type)
        for name, member in sorted(x.__dict__.items()):
            if not isinstance(member, wanted):
                continue
            print("Disassembly of %s:" % name)
            try:
                dis(member)
            except TypeError as msg:
                # A member we cannot handle must not abort the listing.
                print("Sorry:", msg)
            print()
        return

    if hasattr(x, 'co_code'):
        disassemble(x)
        return

    if isinstance(x, (bytes, bytearray)):
        disassemble_string(x)
        return

    raise TypeError("don't know how to disassemble %s objects" %
                    type(x).__name__)
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 43 | |
def distb(tb=None):
    """Disassemble a traceback (default: last traceback).

    When no traceback is given, sys.last_traceback is used and followed
    to its innermost entry; RuntimeError is raised if it is not set.
    The frame's code is disassembled with the traceback's tb_lasti
    passed as the instruction to flag.
    """
    if tb is None:
        try:
            innermost = sys.last_traceback
        except AttributeError:
            raise RuntimeError("no last traceback to disassemble")
        # Follow the chain down to the entry with no successor.
        while innermost.tb_next:
            innermost = innermost.tb_next
        tb = innermost
    frame = tb.tb_frame
    disassemble(frame.f_code, tb.tb_lasti)
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 53 | |
# XXX This duplicates information from code.h, also duplicated in inspect.py.
# XXX Maybe this ought to be put in a central location, like opcode.py?
#
# Symbolic name for each known single-bit code flag; consulted by
# pretty_flags() when rendering a flags word.
flag2name = {
    0x01: "OPTIMIZED",
    0x02: "NEWLOCALS",
    0x04: "VARARGS",
    0x08: "VARKEYWORDS",
    0x10: "NESTED",
    0x20: "GENERATOR",
    0x40: "NOFREE",
}
| 65 | |
def pretty_flags(flags):
    """Return pretty representation of code flags.

    Each set bit among the low 32 is rendered by its flag2name entry, or
    in hex when it has none.  Whatever is left once those 32 bits have
    been examined (including a flags value of 0) is appended as a single
    hex number.  The pieces are joined with ", ".
    """
    parts = []
    remaining = flags
    for bit in (1 << shift for shift in range(32)):
        if not remaining & bit:
            continue
        parts.append(flag2name.get(bit, hex(bit)))
        remaining ^= bit
        if not remaining:
            # Every set bit has been named; nothing left to report.
            return ", ".join(parts)
    # Reached only when the scan ran to completion without clearing flags.
    parts.append(hex(remaining))
    return ", ".join(parts)
| 79 | |
def show_code(co):
    """Show details about a code object.

    Prints a summary (name, filename, argument counts, number of locals,
    stack size, flags) with the values aligned in one column, followed
    by an indexed listing of each non-empty table among co_consts,
    co_names, co_varnames, co_freevars and co_cellvars.

    co -- object providing the co_* attributes listed above
    """
    summary = (
        ("Name:", co.co_name),
        ("Filename:", co.co_filename),
        ("Argument count:", co.co_argcount),
        ("Kw-only arguments:", co.co_kwonlyargcount),
        ("Number of locals:", co.co_nlocals),
        ("Stack size:", co.co_stacksize),
        ("Flags:", pretty_flags(co.co_flags)),
    )
    # Pad every label to the longest one so the values line up.
    width = max(len(label) for label, _ in summary)
    for label, value in summary:
        print(label.ljust(width), value)

    # (heading, entries, format); constants use %r because they may be
    # arbitrary objects, the other tables hold names.
    tables = (
        ("Constants:", co.co_consts, "%4d: %r"),
        ("Names:", co.co_names, "%4d: %s"),
        ("Variable names:", co.co_varnames, "%4d: %s"),
        ("Free variables:", co.co_freevars, "%4d: %s"),
        ("Cell variables:", co.co_cellvars, "%4d: %s"),
    )
    for heading, entries, fmt in tables:
        if entries:
            print(heading)
            for index_and_item in enumerate(entries):
                print(fmt % index_and_item)
| 109 | |
def disassemble(co, lasti=-1):
    """Disassemble a code object.

    Prints one row per instruction with these columns: the source line
    number (only on the first instruction of a line), a '-->' marker if
    the instruction's offset equals lasti, a '>>' marker if the offset
    is a jump target, the offset, the opcode name and, for opcodes that
    take one, the numeric argument followed by its meaning in
    parentheses.  A blank row separates source lines.

    co    -- code object; co_code, co_consts, co_names, co_varnames,
             co_cellvars and co_freevars are read here
    lasti -- offset of the instruction to flag (default -1 flags none)
    """
    code = co.co_code
    labels = findlabels(code)
    linestarts = dict(findlinestarts(co))
    n = len(code)
    i = 0
    extended_arg = 0
    free = None
    while i < n:
        op = code[i]
        # Each filler below is exactly as wide as the marker it stands in
        # for, so that the columns stay aligned from row to row.
        if i in linestarts:
            if i > 0:
                print()
            print("%3d" % linestarts[i], end=' ')
        else:
            print('   ', end=' ')

        print('-->' if i == lasti else '   ', end=' ')
        print('>>' if i in labels else '  ', end=' ')
        print(repr(i).rjust(4), end=' ')
        print(opname[op].ljust(20), end=' ')
        i = i+1
        if op >= HAVE_ARGUMENT:
            # Two-byte little-endian argument, plus any pending prefix.
            oparg = code[i] + code[i+1]*256 + extended_arg
            extended_arg = 0
            i = i+2
            if op == EXTENDED_ARG:
                # Supplies the high bits of the next instruction's argument.
                extended_arg = oparg*65536
            print(repr(oparg).rjust(5), end=' ')
            if op in hasconst:
                print('(' + repr(co.co_consts[oparg]) + ')', end=' ')
            elif op in hasname:
                print('(' + co.co_names[oparg] + ')', end=' ')
            elif op in hasjrel:
                # Relative jumps count from the following instruction.
                print('(to ' + repr(i + oparg) + ')', end=' ')
            elif op in haslocal:
                print('(' + co.co_varnames[oparg] + ')', end=' ')
            elif op in hascompare:
                print('(' + cmp_op[oparg] + ')', end=' ')
            elif op in hasfree:
                if free is None:
                    # Built lazily: cell variables first, then free ones.
                    free = co.co_cellvars + co.co_freevars
                print('(' + free[oparg] + ')', end=' ')
        print()
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 157 | |
def disassemble_string(code, lasti=-1, varnames=None, names=None,
                       constants=None):
    """Disassemble raw byte code that has no code object around it.

    Prints one row per instruction: a '-->' marker if the offset equals
    lasti, a '>>' marker if the offset is a jump target, the offset, the
    opcode name and, for opcodes that take one, the numeric argument
    followed by its meaning in parentheses.  When the matching lookup
    table is not supplied the bare index is shown instead.

    code      -- indexable sequence of byte values (e.g. bytes)
    lasti     -- offset of the instruction to flag (default -1: none)
    varnames  -- optional sequence of local variable names
    names     -- optional sequence of global/attribute names
    constants -- optional sequence of constants
    """
    labels = findlabels(code)
    n = len(code)
    i = 0
    extended_arg = 0
    while i < n:
        op = code[i]
        # Fillers are as wide as the markers so the columns stay aligned.
        print('-->' if i == lasti else '   ', end=' ')
        print('>>' if i in labels else '  ', end=' ')
        print(repr(i).rjust(4), end=' ')
        print(opname[op].ljust(15), end=' ')
        i = i+1
        if op >= HAVE_ARGUMENT:
            # Two-byte little-endian argument, plus any pending prefix
            # (same handling as disassemble()).
            oparg = code[i] + code[i+1]*256 + extended_arg
            extended_arg = 0
            i = i+2
            if op == EXTENDED_ARG:
                # Supplies the high bits of the next instruction's argument.
                extended_arg = oparg*65536
            print(repr(oparg).rjust(5), end=' ')
            if op in hasconst:
                if constants:
                    print('(' + repr(constants[oparg]) + ')', end=' ')
                else:
                    print('(%d)'%oparg, end=' ')
            elif op in hasname:
                if names is not None:
                    print('(' + names[oparg] + ')', end=' ')
                else:
                    print('(%d)'%oparg, end=' ')
            elif op in hasjrel:
                # Relative jumps count from the following instruction.
                print('(to ' + repr(i + oparg) + ')', end=' ')
            elif op in haslocal:
                if varnames:
                    print('(' + varnames[oparg] + ')', end=' ')
                else:
                    print('(%d)' % oparg, end=' ')
            elif op in hascompare:
                print('(' + cmp_op[oparg] + ')', end=' ')
        print()
Skip Montanaro | 19c6ba3 | 2003-02-27 21:29:27 +0000 | [diff] [blame] | 196 | |
# Second name bound to the same function object as disassemble(); it is
# also listed in __all__.
disco = disassemble                     # XXX For backwards compatibility
Guido van Rossum | bd30795 | 1997-01-17 20:05:04 +0000 | [diff] [blame] | 198 | |
def findlabels(code):
    """Detect all offsets in a byte code which are jump targets.

    Return the list of offsets, each listed once, in the order in which
    they are first referenced.

    code is an indexable sequence of byte values.  An EXTENDED_ARG
    instruction contributes the high bits of the following instruction's
    argument, exactly as disassemble() interprets it, so targets beyond
    65535 are reported correctly.

    """
    labels = []
    seen = set()            # constant-time duplicate check for labels
    n = len(code)
    i = 0
    extended_arg = 0
    while i < n:
        op = code[i]
        i = i+1
        if op < HAVE_ARGUMENT:
            continue
        # Two-byte little-endian argument, plus any pending prefix.
        oparg = code[i] + code[i+1]*256 + extended_arg
        extended_arg = 0
        i = i+2
        if op == EXTENDED_ARG:
            extended_arg = oparg*65536
            continue
        if op in hasjrel:
            # Relative jumps count from the following instruction.
            label = i+oparg
        elif op in hasjabs:
            label = oparg
        else:
            continue
        if label not in seen:
            seen.add(label)
            labels.append(label)
    return labels
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 223 | |
def findlinestarts(code):
    """Find the offsets in a byte code which are start of lines in the source.

    Generate pairs (offset, lineno) as described in Python/compile.c.

    The code object's co_lnotab is read as alternating (byte increment,
    line increment) entries, starting from offset 0 and co_firstlineno.
    A pair is produced only when the line number differs from the one
    produced last.

    """
    table = code.co_lnotab
    offset = 0
    current_line = code.co_firstlineno
    reported_line = None
    for addr_step, line_step in zip(table[0::2], table[1::2]):
        if addr_step:
            # The offset is about to move on: report the line reached so far.
            if current_line != reported_line:
                yield (offset, current_line)
                reported_line = current_line
            offset += addr_step
        current_line += line_step
    # Report the final line if it has not been reported yet.
    if current_line != reported_line:
        yield (offset, current_line)
Guido van Rossum | 1fdae12 | 2000-02-04 17:47:55 +0000 | [diff] [blame] | 245 | |
def _test():
    """Simple test program to disassemble a file.

    Takes at most one command-line argument: the file to compile and
    disassemble.  With no argument, an empty argument or "-", the source
    is read from standard input and reported under the name "<stdin>".
    More than one argument prints a usage message to stderr and exits
    with status 2.
    """
    args = sys.argv[1:]
    if len(args) > 1:
        sys.stderr.write("usage: python dis.py [-|file]\n")
        sys.exit(2)
    fn = args[0] if args else None
    if not fn or fn == "-":
        source = sys.stdin.read()
        fn = "<stdin>"
    else:
        # The with block closes the file even if reading fails.
        with open(fn) as f:
            source = f.read()
    code = compile(source, fn, "exec")
    dis(code)
Guido van Rossum | 1fdae12 | 2000-02-04 17:47:55 +0000 | [diff] [blame] | 268 | |
# Run the command-line driver only when this file is executed as a script,
# not when it is imported.
if __name__ == "__main__":
    _test()