blob: f471f3f9c6e2f4e094d0a2e9e014228ed10974bd [file] [log] [blame]
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +08001#!/usr/bin/env python
fenuks110ab1d2014-04-11 11:00:33 +02002from __future__ import print_function
# Capstone Python bindings, by Nguyen Anh Quynh <aquynh@gmail.com>
4
5from capstone import *
Joxean114df0e2013-12-04 07:11:32 +01006import binascii
fenuks110ab1d2014-04-11 11:00:33 +02007import sys
# True when running under Python 3. Index access is used instead of the
# `.major` attribute because the named fields of sys.version_info only exist
# on Python 2.7 and later, while indexing works on every version.
_python3 = sys.version_info[0] == 3
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +08009
Nguyen Anh Quynh749046b2014-04-12 01:15:10 +080010
# Raw machine-code samples, one byte string per architecture/mode.
# Each constant is referenced by one or more rows of the all_tests table and
# is passed unchanged to the disassembler by the test functions.
X86_CODE16 = b"\x8d\x4c\x32\x08\x01\xd8\x81\xc6\x34\x12\x00\x00"
# Same bytes as X86_CODE16; all_tests pairs them with a different mode.
X86_CODE32 = b"\x8d\x4c\x32\x08\x01\xd8\x81\xc6\x34\x12\x00\x00"
X86_CODE64 = b"\x55\x48\x8b\x05\xb8\x13\x00\x00"
ARM_CODE = b"\xED\xFF\xFF\xEB\x04\xe0\x2d\xe5\x00\x00\x00\x00\xe0\x83\x22\xe5\xf1\x02\x03\x0e\x00\x00\xa0\xe3\x02\x30\xc1\xe7\x00\x00\x53\xe3"
ARM_CODE2 = b"\x10\xf1\x10\xe7\x11\xf2\x31\xe7\xdc\xa1\x2e\xf3\xe8\x4e\x62\xf3"
THUMB_CODE = b"\x70\x47\xeb\x46\x83\xb0\xc9\x68"
THUMB_CODE2 = b"\x4f\xf0\x00\x01\xbd\xe8\x00\x88\xd1\xe8\x00\xf0"
MIPS_CODE = b"\x0C\x10\x00\x97\x00\x00\x00\x00\x24\x02\x00\x0c\x8f\xa2\x00\x00\x34\x21\x34\x56"
MIPS_CODE2 = b"\x56\x34\x21\x34\xc2\x17\x01\x00"
ARM64_CODE = b"\x21\x7c\x02\x9b\x21\x7c\x00\x53\x00\x40\x21\x4b\xe1\x0b\x40\xb9"
PPC_CODE = b"\x80\x20\x00\x00\x80\x3f\x00\x00\x10\x43\x23\x0e\xd0\x44\x00\x80\x4c\x43\x22\x02\x2d\x03\x00\x80\x7c\x43\x20\x14\x7c\x43\x20\x93\x4f\x20\x00\x21\x4c\xc8\x00\x21"
SPARC_CODE = b"\x80\xa0\x40\x02\x85\xc2\x60\x08\x85\xe8\x20\x01\x81\xe8\x00\x00\x90\x10\x20\x01\xd5\xf6\x10\x16\x21\x00\x00\x0a\x86\x00\x40\x02\x01\x00\x00\x00\x12\xbf\xff\xff\x10\xbf\xff\xff\xa0\x02\x00\x09\x0d\xbf\xff\xff\xd4\x20\x60\x00\xd4\x4e\x00\x16\x2a\xc2\x80\x03"
SPARCV9_CODE = b"\x81\xa8\x0a\x24\x89\xa0\x10\x20\x89\xa0\x1a\x60\x89\xa0\x00\xe0"
SYSZ_CODE = b"\xed\x00\x00\x00\x00\x1a\x5a\x0f\x1f\xff\xc2\x09\x80\x00\x00\x00\x07\xf7\xeb\x2a\xff\xff\x7f\x57\xe3\x01\xff\xff\x7f\x57\xeb\x00\xf0\x00\x00\x24\xb2\x4f\x00\x78"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080025
# Table of disassembly test cases. Each row is a 5-tuple that the test
# functions unpack as (arch, mode, code, comment, syntax):
#   arch    - CS_ARCH_* constant selecting the architecture
#   mode    - CS_MODE_* constant(s), combined with + where several apply
#   code    - byte string to disassemble
#   comment - label printed as the "Platform:" heading
#   syntax  - CS_OPT_SYNTAX_* value assigned to Cs.syntax by test_class();
#             0 leaves the syntax setting untouched
all_tests = (
    (CS_ARCH_X86, CS_MODE_16, X86_CODE16, "X86 16bit (Intel syntax)", 0),
    (CS_ARCH_X86, CS_MODE_32, X86_CODE32, "X86 32bit (ATT syntax)", CS_OPT_SYNTAX_ATT),
    (CS_ARCH_X86, CS_MODE_32, X86_CODE32, "X86 32 (Intel syntax)", 0),
    (CS_ARCH_X86, CS_MODE_64, X86_CODE64, "X86 64 (Intel syntax)", 0),
    (CS_ARCH_ARM, CS_MODE_ARM, ARM_CODE, "ARM", 0),
    (CS_ARCH_ARM, CS_MODE_THUMB, THUMB_CODE2, "THUMB-2", 0),
    (CS_ARCH_ARM, CS_MODE_ARM, ARM_CODE2, "ARM: Cortex-A15 + NEON", 0),
    (CS_ARCH_ARM, CS_MODE_THUMB, THUMB_CODE, "THUMB", 0),
    (CS_ARCH_MIPS, CS_MODE_32 + CS_MODE_BIG_ENDIAN, MIPS_CODE, "MIPS-32 (Big-endian)", 0),
    (CS_ARCH_MIPS, CS_MODE_64 + CS_MODE_LITTLE_ENDIAN, MIPS_CODE2, "MIPS-64-EL (Little-endian)", 0),
    (CS_ARCH_ARM64, CS_MODE_ARM, ARM64_CODE, "ARM-64", 0),
    (CS_ARCH_PPC, CS_MODE_BIG_ENDIAN, PPC_CODE, "PPC-64", 0),
    (CS_ARCH_PPC, CS_MODE_BIG_ENDIAN, PPC_CODE, "PPC-64, print register with number only", CS_OPT_SYNTAX_NOREGNAME),
    (CS_ARCH_SPARC, CS_MODE_BIG_ENDIAN, SPARC_CODE, "Sparc", 0),
    (CS_ARCH_SPARC, CS_MODE_BIG_ENDIAN + CS_MODE_V9, SPARCV9_CODE, "SparcV9", 0),
    (CS_ARCH_SYSZ, 0, SYSZ_CODE, "SystemZ", 0),
)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080044
45
def to_hex(s):
    """Return the bytes of *s* as space-separated ``0x..`` hex pairs.

    *s* is a byte string (``bytes`` on Python 3, ``str`` on Python 2) or any
    other object ``bytearray()`` accepts, such as a ``bytearray``. An empty
    input gives an empty string.

    Example: ``to_hex(b"\\x8d\\x4c")`` returns ``"0x8d 0x4c"``.
    """
    # bytearray() yields integers on both Python 2 and Python 3, so no
    # version check or ord() call is needed.
    return " ".join("0x{0:02x}".format(byte) for byte in bytearray(s))
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080051
def to_x(s):
    """Pack integer *s* as a big-endian signed 64-bit value without leading zero bytes.

    Returns the text string ``'0'`` when *s* is falsy (0 or None). Otherwise
    returns the packed byte string with leading NUL bytes removed, so
    ``to_x(0x1000)`` gives ``b"\\x10\\x00"``. Negative values keep all eight
    bytes because their leading bytes are 0xff.

    ``struct.pack`` raises ``struct.error`` when *s* does not fit in a
    signed 64-bit integer.
    """
    from struct import pack

    if not s:
        return '0'
    # Strip NUL bytes, not the ASCII digit '0' (0x30). The earlier comparison
    # against '0' never matched a zero byte on Python 2 and could drop a
    # genuine leading 0x30 byte.
    return pack(">q", s).lstrip(b"\x00")
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080058
def to_x_32(s):
    """Pack integer *s* as a big-endian signed 32-bit value without leading zero bytes.

    Returns the text string ``'0'`` when *s* is falsy (0 or None). Otherwise
    returns the packed byte string with leading NUL bytes removed, so
    ``to_x_32(0x1000)`` gives ``b"\\x10\\x00"``. Negative values keep all four
    bytes because their leading bytes are 0xff.

    ``struct.pack`` raises ``struct.error`` when *s* does not fit in a
    signed 32-bit integer.
    """
    from struct import pack

    if not s:
        return '0'
    # Strip NUL bytes, not the ASCII digit '0' (0x30). The earlier comparison
    # against '0' never matched a zero byte on Python 2 and could drop a
    # genuine leading 0x30 byte.
    return pack(">i", s).lstrip(b"\x00")
65
# ## Test cs_disasm_quick()
def test_cs_disasm_quick():
    """Disassemble every row of all_tests with cs_disasm_quick() and print it.

    For each row this prints a separator, the platform label, the input
    bytes as hex, then one line per instruction (address, mnemonic,
    operands) with disassembly starting at address 0x1000. The per-row
    syntax option is not used by this quick interface.
    """
    for arch, mode, code, comment, _syntax in all_tests:
        print('*' * 40)
        print("Platform: %s" % comment)
        # Label and hex dump share one line. The old `print("Disasm:"),`
        # was a Python 2 print-statement idiom that no longer suppresses
        # the newline once print is a function.
        print("Disasm:", to_hex(code))
        for insn in cs_disasm_quick(arch, mode, code, 0x1000):
            print("0x%x:\t%s\t%s" % (insn.address, insn.mnemonic, insn.op_str))
        print()
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080076
77
# ## Test class Cs
def test_class():
    """Disassemble every row of all_tests through a Cs object and print it.

    For each row this prints a separator, the platform label and the input
    bytes as hex. It then creates ``Cs(arch, mode)``, applies the row's
    syntax option when it is non-zero, and prints one line per instruction
    (address, mnemonic, operands) with disassembly starting at 0x1000.
    After the last instruction it prints the address just past it. A
    CsError is reported as an "ERROR:" line and the loop moves on to the
    next row.
    """
    for arch, mode, code, comment, syntax in all_tests:
        print('*' * 16)
        print("Platform: %s" % comment)
        print("Code: %s" % to_hex(code))
        print("Disasm:")

        try:
            md = Cs(arch, mode)

            if syntax != 0:
                md.syntax = syntax

            # Track the final instruction explicitly: reading the loop
            # variable after the loop would raise NameError (or reuse the
            # previous row's instruction) when nothing is disassembled.
            last_insn = None
            for insn in md.disasm(code, 0x1000):
                # To also show the raw bytes, append
                # binascii.hexlify(insn.bytes) to the line below.
                print("0x%x:\t%s\t%s" % (insn.address, insn.mnemonic, insn.op_str))
                last_insn = insn

            if last_insn is not None:
                # Address immediately following the last decoded instruction.
                print("0x%x:" % (last_insn.address + last_insn.size))
            print()
        except CsError as e:
            print("ERROR: %s" % e)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800101
102
# The cs_disasm_quick() demo is currently disabled; uncomment the next two
# lines to run it (followed by a separator) as well.
# test_cs_disasm_quick()
# print ("*" * 40)
if __name__ == '__main__':
    # Run the Cs class demo only when this file is executed as a script.
    test_class()