Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 1 | #!/usr/bin/env python |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 2 | from __future__ import print_function |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 3 | # Capstone Python bindings, by Nguyen Anh Quynnh <aquynh@gmail.com> |
| 4 | |
| 5 | from capstone import * |
Joxean | 114df0e | 2013-12-04 07:11:32 +0100 | [diff] [blame] | 6 | import binascii |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 7 | import sys |
| 8 | _python3 = sys.version_info.major == 3 |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 9 | |
Nguyen Anh Quynh | 749046b | 2014-04-12 01:15:10 +0800 | [diff] [blame^] | 10 | |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 11 | X86_CODE16 = b"\x8d\x4c\x32\x08\x01\xd8\x81\xc6\x34\x12\x00\x00" |
| 12 | X86_CODE32 = b"\x8d\x4c\x32\x08\x01\xd8\x81\xc6\x34\x12\x00\x00" |
| 13 | X86_CODE64 = b"\x55\x48\x8b\x05\xb8\x13\x00\x00" |
| 14 | ARM_CODE = b"\xED\xFF\xFF\xEB\x04\xe0\x2d\xe5\x00\x00\x00\x00\xe0\x83\x22\xe5\xf1\x02\x03\x0e\x00\x00\xa0\xe3\x02\x30\xc1\xe7\x00\x00\x53\xe3" |
| 15 | ARM_CODE2 = b"\x10\xf1\x10\xe7\x11\xf2\x31\xe7\xdc\xa1\x2e\xf3\xe8\x4e\x62\xf3" |
| 16 | THUMB_CODE = b"\x70\x47\xeb\x46\x83\xb0\xc9\x68" |
| 17 | THUMB_CODE2 = b"\x4f\xf0\x00\x01\xbd\xe8\x00\x88\xd1\xe8\x00\xf0" |
| 18 | MIPS_CODE = b"\x0C\x10\x00\x97\x00\x00\x00\x00\x24\x02\x00\x0c\x8f\xa2\x00\x00\x34\x21\x34\x56" |
| 19 | MIPS_CODE2 = b"\x56\x34\x21\x34\xc2\x17\x01\x00" |
| 20 | ARM64_CODE = b"\x21\x7c\x02\x9b\x21\x7c\x00\x53\x00\x40\x21\x4b\xe1\x0b\x40\xb9" |
| 21 | PPC_CODE = b"\x80\x20\x00\x00\x80\x3f\x00\x00\x10\x43\x23\x0e\xd0\x44\x00\x80\x4c\x43\x22\x02\x2d\x03\x00\x80\x7c\x43\x20\x14\x7c\x43\x20\x93\x4f\x20\x00\x21\x4c\xc8\x00\x21" |
Nguyen Anh Quynh | 749046b | 2014-04-12 01:15:10 +0800 | [diff] [blame^] | 22 | SPARC_CODE = b"\x80\xa0\x40\x02\x85\xc2\x60\x08\x85\xe8\x20\x01\x81\xe8\x00\x00\x90\x10\x20\x01\xd5\xf6\x10\x16\x21\x00\x00\x0a\x86\x00\x40\x02\x01\x00\x00\x00\x12\xbf\xff\xff\x10\xbf\xff\xff\xa0\x02\x00\x09\x0d\xbf\xff\xff\xd4\x20\x60\x00\xd4\x4e\x00\x16\x2a\xc2\x80\x03" |
| 23 | SPARCV9_CODE = b"\x81\xa8\x0a\x24\x89\xa0\x10\x20\x89\xa0\x1a\x60\x89\xa0\x00\xe0" |
| 24 | SYSZ_CODE = b"\xed\x00\x00\x00\x00\x1a\x5a\x0f\x1f\xff\xc2\x09\x80\x00\x00\x00\x07\xf7\xeb\x2a\xff\xff\x7f\x57\xe3\x01\xff\xff\x7f\x57\xeb\x00\xf0\x00\x00\x24\xb2\x4f\x00\x78" |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 25 | |
| 26 | all_tests = ( |
Nguyen Anh Quynh | 4649071 | 2013-12-06 00:44:44 +0800 | [diff] [blame] | 27 | (CS_ARCH_X86, CS_MODE_16, X86_CODE16, "X86 16bit (Intel syntax)", 0), |
| 28 | (CS_ARCH_X86, CS_MODE_32, X86_CODE32, "X86 32bit (ATT syntax)", CS_OPT_SYNTAX_ATT), |
| 29 | (CS_ARCH_X86, CS_MODE_32, X86_CODE32, "X86 32 (Intel syntax)", 0), |
| 30 | (CS_ARCH_X86, CS_MODE_64, X86_CODE64, "X86 64 (Intel syntax)", 0), |
| 31 | (CS_ARCH_ARM, CS_MODE_ARM, ARM_CODE, "ARM", 0), |
| 32 | (CS_ARCH_ARM, CS_MODE_THUMB, THUMB_CODE2, "THUMB-2", 0), |
| 33 | (CS_ARCH_ARM, CS_MODE_ARM, ARM_CODE2, "ARM: Cortex-A15 + NEON", 0), |
| 34 | (CS_ARCH_ARM, CS_MODE_THUMB, THUMB_CODE, "THUMB", 0), |
| 35 | (CS_ARCH_MIPS, CS_MODE_32 + CS_MODE_BIG_ENDIAN, MIPS_CODE, "MIPS-32 (Big-endian)", 0), |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 36 | (CS_ARCH_MIPS, CS_MODE_64 + CS_MODE_LITTLE_ENDIAN, MIPS_CODE2, "MIPS-64-EL (Little-endian)", 0), |
Nguyen Anh Quynh | fc4bc12 | 2014-01-08 10:21:04 +0800 | [diff] [blame] | 37 | (CS_ARCH_ARM64, CS_MODE_ARM, ARM64_CODE, "ARM-64", 0), |
Nguyen Anh Quynh | 5f1f90c | 2014-01-01 23:28:05 +0800 | [diff] [blame] | 38 | (CS_ARCH_PPC, CS_MODE_BIG_ENDIAN, PPC_CODE, "PPC-64", 0), |
Nguyen Anh Quynh | fc4bc12 | 2014-01-08 10:21:04 +0800 | [diff] [blame] | 39 | (CS_ARCH_PPC, CS_MODE_BIG_ENDIAN, PPC_CODE, "PPC-64, print register with number only", CS_OPT_SYNTAX_NOREGNAME), |
Nguyen Anh Quynh | 30a9d54 | 2014-03-10 14:40:48 +0800 | [diff] [blame] | 40 | (CS_ARCH_SPARC, CS_MODE_BIG_ENDIAN, SPARC_CODE, "Sparc", 0), |
Nguyen Anh Quynh | ea9f4b1 | 2014-03-10 20:38:01 +0800 | [diff] [blame] | 41 | (CS_ARCH_SPARC, CS_MODE_BIG_ENDIAN + CS_MODE_V9, SPARCV9_CODE, "SparcV9", 0), |
Nguyen Anh Quynh | 1c8405d | 2014-03-23 11:17:24 +0800 | [diff] [blame] | 42 | (CS_ARCH_SYSZ, 0, SYSZ_CODE, "SystemZ", 0), |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 43 | ) |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 44 | |
| 45 | |
| 46 | def to_hex(s): |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 47 | if _python3: |
| 48 | return " ".join("0x{0:02x}".format(c) for c in s) # <-- Python 3 is OK |
| 49 | else: |
| 50 | return " ".join("0x{0:02x}".format(ord(c)) for c in s) |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 51 | |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 52 | def to_x(s): |
| 53 | from struct import pack |
| 54 | if not s: return '0' |
| 55 | x = pack(">q", s) |
| 56 | while x[0] in ('0', 0): x = x[1:] |
| 57 | return x |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 58 | |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 59 | def to_x_32(s): |
| 60 | from struct import pack |
| 61 | if not s: return '0' |
| 62 | x = pack(">i", s) |
| 63 | while x[0] in ('0', 0): x = x[1:] |
| 64 | return x |
| 65 | |
| 66 | # ## Test cs_disasm_quick() |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 67 | def test_cs_disasm_quick(): |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 68 | for arch, mode, code, comment, syntax in all_tests: |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 69 | print('*' * 40) |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 70 | print("Platform: %s" % comment) |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 71 | print("Disasm:"), |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 72 | print(to_hex(code)) |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 73 | for insn in cs_disasm_quick(arch, mode, code, 0x1000): |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 74 | print("0x%x:\t%s\t%s" % (insn.address, insn.mnemonic, insn.op_str)) |
| 75 | print() |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 76 | |
| 77 | |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 78 | # ## Test class Cs |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 79 | def test_class(): |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 80 | for arch, mode, code, comment, syntax in all_tests: |
danghvu | 1a7c449 | 2013-11-27 22:51:11 -0600 | [diff] [blame] | 81 | print('*' * 16) |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 82 | print("Platform: %s" % comment) |
danghvu | 1a7c449 | 2013-11-27 22:51:11 -0600 | [diff] [blame] | 83 | print("Code: %s" % to_hex(code)) |
| 84 | print("Disasm:") |
| 85 | |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 86 | try: |
Nguyen Anh Quynh | 520c361 | 2013-12-06 15:26:07 +0800 | [diff] [blame] | 87 | md = Cs(arch, mode) |
Nguyen Anh Quynh | daaed13 | 2013-12-03 22:18:28 +0800 | [diff] [blame] | 88 | |
Nguyen Anh Quynh | 4649071 | 2013-12-06 00:44:44 +0800 | [diff] [blame] | 89 | if syntax != 0: |
| 90 | md.syntax = syntax |
Nguyen Anh Quynh | daaed13 | 2013-12-03 22:18:28 +0800 | [diff] [blame] | 91 | |
Nguyen Anh Quynh | e099ede | 2013-12-06 18:06:11 +0800 | [diff] [blame] | 92 | for insn in md.disasm(code, 0x1000): |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 93 | # bytes = binascii.hexlify(insn.bytes) |
| 94 | # print("0x%x:\t%s\t%s\t// hex-code: %s" %(insn.address, insn.mnemonic, insn.op_str, bytes)) |
| 95 | print("0x%x:\t%s\t%s" % (insn.address, insn.mnemonic, insn.op_str)) |
danghvu | 1a7c449 | 2013-11-27 22:51:11 -0600 | [diff] [blame] | 96 | |
Nguyen Anh Quynh | e099ede | 2013-12-06 18:06:11 +0800 | [diff] [blame] | 97 | print("0x%x:" % (insn.address + insn.size)) |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 98 | print() |
Nguyen Anh Quynh | f1618bc | 2013-12-06 20:58:04 +0800 | [diff] [blame] | 99 | except CsError as e: |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 100 | print("ERROR: %s" % e) |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 101 | |
| 102 | |
fenuks | 110ab1d | 2014-04-11 11:00:33 +0200 | [diff] [blame] | 103 | # test_cs_disasm_quick() |
| 104 | # print ("*" * 40) |
| 105 | if __name__ == '__main__': |
| 106 | test_class() |