Guido van Rossum | 421c224 | 1997-11-18 15:47:55 +0000 | [diff] [blame] | 1 | """Disassembler of Python byte code into mnemonics.""" |
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 2 | |
| 3 | import sys |
Guido van Rossum | 18aef3c | 1997-03-14 04:15:43 +0000 | [diff] [blame] | 4 | import types |
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 5 | |
Skip Montanaro | 19c6ba3 | 2003-02-27 21:29:27 +0000 | [diff] [blame] | 6 | from opcode import * |
| 7 | from opcode import __all__ as _opcodes_all |
| 8 | |
# Public API: this module's own entry points, followed by every name that
# the opcode module itself exports (they are re-exported by the star import).
__all__ = [
    "dis",
    "disassemble",
    "distb",
    "disco",
    "findlinestarts",
    "findlabels",
] + _opcodes_all
# The alias was only needed to build __all__; do not leave it in the namespace.
del _opcodes_all

# Types of the __dict__ members that dis() recurses into.
_have_code = (types.MethodType, types.FunctionType, types.CodeType, type)
| 14 | |
def dis(x=None):
    """Disassemble classes, methods, functions, or code.

    With no argument, disassemble the last traceback.

    An object with a ``__func__`` attribute is replaced by that attribute,
    and an object with a ``__code__`` attribute by that attribute, before
    dispatching.  Whatever still has a ``__dict__`` after that is treated as
    a container: its members are visited in sorted name order and each one
    whose type is listed in ``_have_code`` is disassembled recursively (a
    TypeError from a member is reported and skipped).  Objects with a
    ``co_code`` attribute go to disassemble(); ``bytes`` and ``bytearray``
    go to disassemble_string().

    Raises TypeError for any other kind of object.

    """
    if x is None:
        distb()
        return

    # Peel the wrappers off: method -> function -> code object.
    x = getattr(x, '__func__', x)
    x = getattr(x, '__code__', x)

    if hasattr(x, '__dict__'):
        for name, member in sorted(x.__dict__.items()):
            if not isinstance(member, _have_code):
                continue
            print("Disassembly of %s:" % name)
            try:
                dis(member)
            except TypeError as msg:
                print("Sorry:", msg)
            print()
        return

    if hasattr(x, 'co_code'):
        disassemble(x)
        return

    if isinstance(x, (bytes, bytearray)):
        disassemble_string(x)
        return

    raise TypeError("don't know how to disassemble %s objects" %
                    type(x).__name__)
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 45 | |
def distb(tb=None):
    """Disassemble a traceback (default: last traceback).

    When *tb* is omitted, ``sys.last_traceback`` is used and followed down
    its ``tb_next`` chain to the last entry.  The code object of that
    entry's frame is disassembled with ``tb_lasti`` passed as the
    instruction to mark.  An explicitly supplied *tb* is used as given.

    Raises RuntimeError if *tb* is omitted and ``sys.last_traceback`` is
    not set.
    """
    if tb is None:
        try:
            tb = sys.last_traceback
        except AttributeError:
            raise RuntimeError("no last traceback to disassemble")
        # Walk to the end of the chain.
        while tb.tb_next:
            tb = tb.tb_next
    frame_code = tb.tb_frame.f_code
    disassemble(frame_code, tb.tb_lasti)
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 55 | |
# XXX This table repeats information from code.h, and inspect.py holds yet
# XXX another copy.  A single central home (opcode.py?) would be better.
flag2name = {
     1: "OPTIMIZED",
     2: "NEWLOCALS",
     4: "VARARGS",
     8: "VARKEYWORDS",
    16: "NESTED",
    32: "GENERATOR",
    64: "NOFREE",
}

def pretty_flags(flags):
    """Return pretty representation of code flags.

    The 32 low bits are examined from least to most significant.  Each set
    bit contributes its name from ``flag2name``, or its hex value when the
    table has no entry for it.  If anything is left once those bits have
    been examined (including the case where *flags* is 0), the remainder
    is appended in hex.  The pieces are joined with ", ".
    """
    names = []
    remaining = flags
    for bit in range(32):
        mask = 1 << bit
        if not remaining & mask:
            continue
        names.append(flag2name.get(mask, hex(mask)))
        remaining ^= mask
        if not remaining:
            # Every set bit has been accounted for.
            return ", ".join(names)
    # Reached only when no bit within the low 32 cleared the value to zero.
    names.append(hex(remaining))
    return ", ".join(names)
| 81 | |
def show_code(co):
    """Show details about a code object.

    Prints to standard output a summary of *co* (name, filename, argument
    counts, number of locals, stack size and decoded flags) with the values
    aligned in one column, followed by an index-numbered listing of each
    non-empty table: constants, names, variable names, free variables and
    cell variables.
    """
    summary = (
        ("Name:", co.co_name),
        ("Filename:", co.co_filename),
        ("Argument count:", co.co_argcount),
        ("Kw-only arguments:", co.co_kwonlyargcount),
        ("Number of locals:", co.co_nlocals),
        ("Stack size:", co.co_stacksize),
        ("Flags:", pretty_flags(co.co_flags)),
    )
    # Pad every label to the longest one so the values line up.
    width = max(len(label) for label, _ in summary)
    for label, value in summary:
        print(label.ljust(width), value)

    # Constants are shown with repr (%r); the name tables hold plain
    # strings and are shown as-is (%s).
    sections = (
        ("Constants:", co.co_consts, "%4d: %r"),
        ("Names:", co.co_names, "%4d: %s"),
        ("Variable names:", co.co_varnames, "%4d: %s"),
        ("Free variables:", co.co_freevars, "%4d: %s"),
        ("Cell variables:", co.co_cellvars, "%4d: %s"),
    )
    for title, entries, fmt in sections:
        if not entries:
            continue
        print(title)
        for numbered in enumerate(entries):
            print(fmt % numbered)
| 111 | |
def disassemble(co, lasti=-1):
    """Disassemble a code object.

    Prints one line per instruction in ``co.co_code``, made of these
    columns: the source line number (only on the first instruction of a
    line, preceded by a blank line except at offset 0), a ``-->`` marker
    when the offset equals *lasti*, a ``>>`` marker when the offset is a
    jump target, the byte offset, the opcode name and, for opcodes that
    take one, the numeric argument followed by a parenthesised
    interpretation (constant, name, relative jump target, local variable,
    comparison operator or cell/free variable).

    An EXTENDED_ARG instruction contributes the high bits of the argument
    of the instruction that follows it.
    """
    code = co.co_code
    # A set gives constant-time membership tests in the loop below.
    labels = set(findlabels(code))
    linestarts = dict(findlinestarts(co))
    n = len(code)
    i = 0
    extended_arg = 0
    free = None
    while i < n:
        op = code[i]
        # Each blank placeholder is exactly as wide as the marker it stands
        # in for, so that the columns stay aligned from row to row.
        if i in linestarts:
            if i > 0:
                print()
            print("%3d" % linestarts[i], end=' ')
        else:
            print(' ' * 3, end=' ')

        print('-->' if i == lasti else ' ' * 3, end=' ')
        print('>>' if i in labels else ' ' * 2, end=' ')
        print(repr(i).rjust(4), end=' ')
        print(opname[op].ljust(20), end=' ')
        i = i+1
        if op >= HAVE_ARGUMENT:
            # Two-byte little-endian argument, plus any pending high bits.
            oparg = code[i] + code[i+1]*256 + extended_arg
            extended_arg = 0
            i = i+2
            if op == EXTENDED_ARG:
                extended_arg = oparg*65536
            print(repr(oparg).rjust(5), end=' ')
            if op in hasconst:
                print('(' + repr(co.co_consts[oparg]) + ')', end=' ')
            elif op in hasname:
                print('(' + co.co_names[oparg] + ')', end=' ')
            elif op in hasjrel:
                # Relative jumps count from the following instruction.
                print('(to ' + repr(i + oparg) + ')', end=' ')
            elif op in haslocal:
                print('(' + co.co_varnames[oparg] + ')', end=' ')
            elif op in hascompare:
                print('(' + cmp_op[oparg] + ')', end=' ')
            elif op in hasfree:
                # Built lazily: cell variables first, then free variables.
                if free is None:
                    free = co.co_cellvars + co.co_freevars
                print('(' + free[oparg] + ')', end=' ')
        print()
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 159 | |
def disassemble_string(code, lasti=-1, varnames=None, names=None,
                       constants=None):
    """Disassemble a raw byte-code string that has no code object.

    *code* is an indexable sequence of byte values (dis() passes ``bytes``
    or ``bytearray``).  One line is printed per instruction: a ``-->``
    marker when the offset equals *lasti*, a ``>>`` marker when the offset
    is a jump target, the byte offset, the opcode name and, for opcodes
    that take one, the numeric argument followed by a parenthesised
    interpretation.

    *varnames*, *names* and *constants* are optional lookup tables.  When
    a table is missing or empty, the bare index is shown in its place.

    An EXTENDED_ARG instruction contributes the high bits of the argument
    of the instruction that follows it, as in disassemble().
    """
    # A set gives constant-time membership tests in the loop below.
    labels = set(findlabels(code))
    n = len(code)
    i = 0
    extended_arg = 0
    while i < n:
        op = code[i]
        # Each blank placeholder is exactly as wide as the marker it stands
        # in for, so that the columns stay aligned from row to row.
        print('-->' if i == lasti else ' ' * 3, end=' ')
        print('>>' if i in labels else ' ' * 2, end=' ')
        print(repr(i).rjust(4), end=' ')
        print(opname[op].ljust(15), end=' ')
        i = i+1
        if op >= HAVE_ARGUMENT:
            # Two-byte little-endian argument, plus any pending high bits.
            oparg = code[i] + code[i+1]*256 + extended_arg
            extended_arg = 0
            i = i+2
            if op == EXTENDED_ARG:
                extended_arg = oparg*65536
            print(repr(oparg).rjust(5), end=' ')
            if op in hasconst:
                if constants:
                    print('(' + repr(constants[oparg]) + ')', end=' ')
                else:
                    print('(%d)' % oparg, end=' ')
            elif op in hasname:
                if names:
                    print('(' + names[oparg] + ')', end=' ')
                else:
                    print('(%d)' % oparg, end=' ')
            elif op in hasjrel:
                # Relative jumps count from the following instruction.
                print('(to ' + repr(i + oparg) + ')', end=' ')
            elif op in haslocal:
                if varnames:
                    print('(' + varnames[oparg] + ')', end=' ')
                else:
                    print('(%d)' % oparg, end=' ')
            elif op in hascompare:
                print('(' + cmp_op[oparg] + ')', end=' ')
        print()

disco = disassemble                     # XXX For backwards compatibility
Guido van Rossum | bd30795 | 1997-01-17 20:05:04 +0000 | [diff] [blame] | 200 | |
def findlabels(code):
    """Detect all offsets in a byte code which are jump targets.

    *code* is an indexable sequence of byte values.  Instructions whose
    opcode is at least HAVE_ARGUMENT are three bytes long (opcode plus a
    little-endian 16-bit argument); all others are one byte long.  An
    EXTENDED_ARG instruction supplies the high bits of the argument of the
    instruction that follows it.

    Return the list of offsets, without duplicates, in the order in which
    they are first encountered.

    """
    labels = []
    seen = set()            # mirrors `labels` for constant-time lookups
    extended_arg = 0
    n = len(code)
    i = 0
    while i < n:
        op = code[i]
        i = i+1
        if op < HAVE_ARGUMENT:
            continue
        oparg = code[i] + code[i+1]*256 + extended_arg
        extended_arg = 0
        i = i+2
        if op == EXTENDED_ARG:
            # Carry the high 16 bits over to the next instruction.
            extended_arg = oparg*65536
        if op in hasjrel:
            # Relative to the offset of the following instruction.
            label = i + oparg
        elif op in hasjabs:
            label = oparg
        else:
            continue
        if label not in seen:
            seen.add(label)
            labels.append(label)
    return labels
Guido van Rossum | 217a5fa | 1990-12-26 15:40:07 +0000 | [diff] [blame] | 225 | |
def findlinestarts(code):
    """Find the offsets in a byte code which are start of lines in the source.

    Generate pairs (offset, lineno) as described in Python/compile.c.

    ``code.co_lnotab`` is read as alternating (byte increment, line
    increment) values, starting from offset 0 and ``code.co_firstlineno``.
    A pair is produced only once the byte offset is about to move and the
    line differs from the one last reported, so entries with a zero byte
    increment just accumulate into the line number.

    """
    table = code.co_lnotab
    current_line = code.co_firstlineno
    reported_line = None
    offset = 0
    for byte_step, line_step in zip(table[0::2], table[1::2]):
        if byte_step and current_line != reported_line:
            yield (offset, current_line)
            reported_line = current_line
        offset += byte_step
        current_line += line_step
    # Report whatever line is pending after the last table entry.
    if current_line != reported_line:
        yield (offset, current_line)
Guido van Rossum | 1fdae12 | 2000-02-04 17:47:55 +0000 | [diff] [blame] | 247 | |
| 248 | def _test(): |
Tim Peters | 88869f9 | 2001-01-14 23:36:06 +0000 | [diff] [blame] | 249 | """Simple test program to disassemble a file.""" |
| 250 | if sys.argv[1:]: |
| 251 | if sys.argv[2:]: |
| 252 | sys.stderr.write("usage: python dis.py [-|file]\n") |
| 253 | sys.exit(2) |
| 254 | fn = sys.argv[1] |
| 255 | if not fn or fn == "-": |
| 256 | fn = None |
| 257 | else: |
| 258 | fn = None |
Raymond Hettinger | 0f4940c | 2002-06-01 00:57:55 +0000 | [diff] [blame] | 259 | if fn is None: |
Tim Peters | 88869f9 | 2001-01-14 23:36:06 +0000 | [diff] [blame] | 260 | f = sys.stdin |
| 261 | else: |
| 262 | f = open(fn) |
| 263 | source = f.read() |
Raymond Hettinger | 0f4940c | 2002-06-01 00:57:55 +0000 | [diff] [blame] | 264 | if fn is not None: |
Tim Peters | 88869f9 | 2001-01-14 23:36:06 +0000 | [diff] [blame] | 265 | f.close() |
| 266 | else: |
| 267 | fn = "<stdin>" |
| 268 | code = compile(source, fn, "exec") |
| 269 | dis(code) |
Guido van Rossum | 1fdae12 | 2000-02-04 17:47:55 +0000 | [diff] [blame] | 270 | |
| 271 | if __name__ == "__main__": |
Tim Peters | 88869f9 | 2001-01-14 23:36:06 +0000 | [diff] [blame] | 272 | _test() |