Raymond Hettinger | fd2d1f7 | 2004-08-23 23:37:48 +0000 | [diff] [blame] | 1 | import dis |
Antoine Pitrou | b7fbcd3 | 2010-01-16 18:37:38 +0000 | [diff] [blame] | 2 | import re |
Raymond Hettinger | fd2d1f7 | 2004-08-23 23:37:48 +0000 | [diff] [blame] | 3 | import sys |
Guido van Rossum | 34d1928 | 2007-08-09 01:03:29 +0000 | [diff] [blame] | 4 | from io import StringIO |
Raymond Hettinger | fd2d1f7 | 2004-08-23 23:37:48 +0000 | [diff] [blame] | 5 | import unittest |
| 6 | |
def disassemble(func):
    """Return the text that ``dis.dis(func)`` prints, as a string.

    ``dis.dis`` writes to ``sys.stdout``, so the stream is temporarily
    replaced by an in-memory buffer.  The previous stream is restored in a
    ``finally`` clause so that a failure inside ``dis.dis`` (for example an
    object it cannot disassemble) does not leave ``sys.stdout`` redirected
    for everything that runs afterwards.

    func -- any object accepted by ``dis.dis`` (function, code object, ...).
    """
    saved_stdout = sys.stdout
    # The ``with`` block closes the buffer on both the normal and error path.
    with StringIO() as buffer:
        sys.stdout = buffer
        try:
            dis.dis(func)
        finally:
            sys.stdout = saved_stdout
        return buffer.getvalue()
| 16 | |
def dis_single(line):
    """Compile *line* in ``'single'`` mode and return its disassembly text."""
    code = compile(line, '', 'single')
    return disassemble(code)
| 19 | |
class TestTranforms(unittest.TestCase):
    """Check bytecode transformations by inspecting disassembly listings.

    Each test compiles a small snippet, disassembles it with the
    module-level ``disassemble`` / ``dis_single`` helpers and asserts which
    opcode names or constant renderings do (or do not) appear in the text.
    """

    def test_unot(self):
        # UNARY_NOT POP_JUMP_IF_FALSE --> POP_JUMP_IF_TRUE
        def unot(x):
            if not x == 2:
                del x
        asm = disassemble(unot)
        for elem in ('UNARY_NOT', 'POP_JUMP_IF_FALSE'):
            self.assertNotIn(elem, asm)
        for elem in ('POP_JUMP_IF_TRUE',):
            self.assertIn(elem, asm)

    def test_elim_inversion_of_is_or_in(self):
        # 'not' applied to is / in / is not / not in should be absorbed into
        # the inverse comparison, whose name dis shows in parentheses.
        for line, elem in (
            ('not a is b', '(is not)',),
            ('not a in b', '(not in)',),
            ('not a is not b', '(is)',),
            ('not a not in b', '(in)',),
            ):
            asm = dis_single(line)
            self.assertIn(elem, asm)

    def test_global_as_constant(self):
        # LOAD_GLOBAL None/True/False  -->  LOAD_CONST None/True/False
        def f(x):
            None
            None
            return x
        def g(x):
            True
            return x
        def h(x):
            False
            return x
        for func, name in ((f, 'None'), (g, 'True'), (h, 'False')):
            asm = disassemble(func)
            for elem in ('LOAD_GLOBAL',):
                self.assertNotIn(elem, asm)
            for elem in ('LOAD_CONST', '('+name+')'):
                self.assertIn(elem, asm)
        # The docstring below is part of the test input; do not remove it.
        def f():
            'Adding a docstring made this test fail in Py2.5.0'
            return None
        self.assertIn('LOAD_CONST', disassemble(f))
        self.assertNotIn('LOAD_GLOBAL', disassemble(f))

    def test_while_one(self):
        # Skip over:  LOAD_CONST trueconst  POP_JUMP_IF_FALSE xx
        def f():
            while 1:
                pass
            return list
        asm = disassemble(f)
        for elem in ('LOAD_CONST', 'POP_JUMP_IF_FALSE'):
            self.assertNotIn(elem, asm)
        for elem in ('JUMP_ABSOLUTE',):
            self.assertIn(elem, asm)

    def test_pack_unpack(self):
        # Packing a tuple only to unpack it again should be replaced by
        # nothing (one element) or by stack rotations (two/three elements).
        for line, elem in (
            ('a, = a,', 'LOAD_CONST',),
            ('a, b = a, b', 'ROT_TWO',),
            ('a, b, c = a, b, c', 'ROT_THREE',),
            ):
            asm = dis_single(line)
            self.assertIn(elem, asm)
            self.assertNotIn('BUILD_TUPLE', asm)
            # The unpacking opcode is UNPACK_SEQUENCE; the previously checked
            # name 'UNPACK_TUPLE' is not an opcode, so that assertion could
            # never fail.
            self.assertNotIn('UNPACK_SEQUENCE', asm)

    def test_folding_of_tuples_of_constants(self):
        # A tuple display of constants should become one LOAD_CONST whose
        # value dis renders as '(<repr of tuple>)'.
        for line, elem in (
            ('a = 1,2,3', '((1, 2, 3))'),
            ('("a","b","c")', "(('a', 'b', 'c'))"),
            ('a,b,c = 1,2,3', '((1, 2, 3))'),
            ('(None, 1, None)', '((None, 1, None))'),
            ('((1, 2), 3, 4)', '(((1, 2), 3, 4))'),
            ):
            asm = dis_single(line)
            self.assertIn(elem, asm)
            self.assertNotIn('BUILD_TUPLE', asm)

        # Bug 1053819:  Tuple of constants misidentified when presented with:
        # . . . opcode_with_arg 100   unary_opcode   BUILD_TUPLE 1  . . .
        # The following would segfault upon compilation
        # (defining the function is the whole test; it is never called).
        def crater():
            (~[
                0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
                0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
                0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
                0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
                0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
                0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
                0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
                0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
                0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
                0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
            ],)

    def test_folding_of_lists_of_constants(self):
        for line, elem in (
            # in/not in constants with BUILD_LIST should be folded to a tuple:
            # (every expectation uses the full '(<repr>)' constant rendering)
            ('a in [1,2,3]', '((1, 2, 3))'),
            ('a not in ["a","b","c"]', "(('a', 'b', 'c'))"),
            ('a in [None, 1, None]', '((None, 1, None))'),
            ('a not in [(1, 2), 3, 4]', '(((1, 2), 3, 4))'),
            ):
            asm = dis_single(line)
            self.assertIn(elem, asm)
            self.assertNotIn('BUILD_LIST', asm)

    def test_folding_of_sets_of_constants(self):
        for line, elem in (
            # in/not in constants with BUILD_SET should be folded to a frozenset:
            ('a in {1,2,3}', frozenset({1, 2, 3})),
            ('a not in {"a","b","c"}', frozenset({'a', 'c', 'b'})),
            ('a in {None, 1, None}', frozenset({1, None})),
            ('a not in {(1, 2), 3, 4}', frozenset({(1, 2), 3, 4})),
            ('a in {1, 2, 3, 3, 2, 1}', frozenset({1, 2, 3})),
            ):
            asm = dis_single(line)
            self.assertNotIn('BUILD_SET', asm)

            # Verify that the frozenset 'elem' is in the disassembly
            # The ordering of the elements in repr( frozenset ) isn't
            # guaranteed, so we jump through some hoops to ensure that we have
            # the frozenset we expect:
            self.assertIn('frozenset', asm)
            # Extract the frozenset literal from the disassembly:
            m = re.match(r'.*(frozenset\({.*}\)).*', asm, re.DOTALL)
            self.assertIsNotNone(m, asm)
            # eval() only ever sees the repr of a constant built from the
            # literals in the table above, never external input.
            self.assertEqual(eval(m.group(1)), elem)

        # Ensure that the resulting code actually works:
        def f(a):
            return a in {1, 2, 3}

        def g(a):
            return a not in {1, 2, 3}

        self.assertTrue(f(3))
        self.assertFalse(f(4))

        self.assertFalse(g(3))
        self.assertTrue(g(4))

    def test_folding_of_binops_on_constants(self):
        for line, elem in (
            ('a = 2+3+4', '(9)'),                   # chained fold
            ('"@"*4', "('@@@@')"),                  # check string ops
            ('a="abc" + "def"', "('abcdef')"),      # check string ops
            ('a = 3**4', '(81)'),                   # binary power
            ('a = 3*4', '(12)'),                    # binary multiply
            ('a = 13//4', '(3)'),                   # binary floor divide
            ('a = 14%4', '(2)'),                    # binary modulo
            ('a = 2+3', '(5)'),                     # binary add
            ('a = 13-4', '(9)'),                    # binary subtract
            ('a = (12,13)[1]', '(13)'),             # binary subscr
            ('a = 13 << 2', '(52)'),                # binary lshift
            ('a = 13 >> 2', '(3)'),                 # binary rshift
            ('a = 13 & 7', '(5)'),                  # binary and
            ('a = 13 ^ 7', '(10)'),                 # binary xor
            ('a = 13 | 7', '(15)'),                 # binary or
            ):
            asm = dis_single(line)
            self.assertIn(elem, asm, asm)
            self.assertNotIn('BINARY_', asm)

        # Verify that unfoldables are skipped
        # (both operands must still be loaded as separate constants)
        asm = dis_single('a=2+"b"')
        self.assertIn('(2)', asm)
        self.assertIn("('b')", asm)

        # Verify that large sequences do not result from folding
        # (the repeat count is still present as its own constant)
        asm = dis_single('a="x"*1000')
        self.assertIn('(1000)', asm)

    def test_folding_of_unaryops_on_constants(self):
        for line, elem in (
            ('-0.5', '(-0.5)'),                     # unary negative
            ('~-2', '(1)'),                         # unary invert
            ('+1', '(1)'),                          # unary positive
            ):
            asm = dis_single(line)
            self.assertIn(elem, asm, asm)
            self.assertNotIn('UNARY_', asm)

        # Verify that unfoldables are skipped
        for line, elem in (
            ('-"abc"', "('abc')"),                  # unary negative
            ('~"abc"', "('abc')"),                  # unary invert
            ):
            asm = dis_single(line)
            self.assertIn(elem, asm, asm)
            self.assertIn('UNARY_', asm)

    def test_elim_extra_return(self):
        # RETURN LOAD_CONST None RETURN  -->  RETURN
        def f(x):
            return x
        asm = disassemble(f)
        self.assertNotIn('LOAD_CONST', asm)
        self.assertNotIn('(None)', asm)
        self.assertEqual(asm.split().count('RETURN_VALUE'), 1)

    def test_elim_jump_to_return(self):
        # JUMP_FORWARD to RETURN -->  RETURN
        def f(cond, true_value, false_value):
            return true_value if cond else false_value
        asm = disassemble(f)
        self.assertNotIn('JUMP_FORWARD', asm)
        self.assertNotIn('JUMP_ABSOLUTE', asm)
        self.assertEqual(asm.split().count('RETURN_VALUE'), 2)

    def test_elim_jump_after_return1(self):
        # Eliminate dead code: jumps immediately after returns can't be reached
        def f(cond1, cond2):
            if cond1: return 1
            if cond2: return 2
            while 1:
                return 3
            while 1:
                if cond1: return 4
                return 5
            return 6
        asm = disassemble(f)
        self.assertNotIn('JUMP_FORWARD', asm)
        self.assertNotIn('JUMP_ABSOLUTE', asm)
        self.assertEqual(asm.split().count('RETURN_VALUE'), 6)

    def test_elim_jump_after_return2(self):
        # Eliminate dead code: jumps immediately after returns can't be reached
        def f(cond1, cond2):
            while 1:
                if cond1: return 4
        asm = disassemble(f)
        self.assertNotIn('JUMP_FORWARD', asm)
        # There should be one jump for the while loop.
        self.assertEqual(asm.split().count('JUMP_ABSOLUTE'), 1)
        self.assertEqual(asm.split().count('RETURN_VALUE'), 2)

    def test_make_function_doesnt_bail(self):
        # A constant expression in a return annotation should still be
        # folded inside a function that builds another function.
        def f():
            def g()->1+1:
                pass
            return g
        asm = disassemble(f)
        self.assertNotIn('BINARY_ADD', asm)
Raymond Hettinger | fd2d1f7 | 2004-08-23 23:37:48 +0000 | [diff] [blame] | 269 | |
| 270 | |
def test_main(verbose=None):
    """Run the test classes of this module through ``support.run_unittest``.

    When *verbose* is true and the interpreter provides
    ``sys.gettotalrefcount``, the suite is run five more times and the total
    reference count after each run is printed as a list.
    """
    import sys
    from test import support

    suites = (TestTranforms,)
    support.run_unittest(*suites)

    # verify reference counting
    if not (verbose and hasattr(sys, "gettotalrefcount")):
        return

    import gc
    # The list is sized up front and filled by index, as in the original.
    refcounts = [None] * 5
    for slot, _ in enumerate(refcounts):
        support.run_unittest(*suites)
        gc.collect()
        refcounts[slot] = sys.gettotalrefcount()
    print(refcounts)
Raymond Hettinger | fd2d1f7 | 2004-08-23 23:37:48 +0000 | [diff] [blame] | 286 | |
# When executed directly as a script, run the suite with verbose=True so the
# reference-count check inside test_main() is attempted as well.
if __name__ == "__main__":
    test_main(verbose=True)