blob: 2aefdf11247ea59d3daab13e4e4e5261f1bc2b04 [file] [log] [blame]
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +08001/* Capstone Disassembler Engine */
2/* By Nguyen Anh Quynh <aquynh@gmail.com>, 2013> */
3
4#include <stdio.h>
5#include <stdlib.h>
6#include <inttypes.h>
7
8#include <capstone.h>
9
10static csh handle;
11
12struct platform {
13 cs_arch arch;
14 cs_mode mode;
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080015 unsigned char *code;
16 size_t size;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080017 char *comment;
Nguyen Anh Quynh2ff665a2014-03-11 00:18:50 +080018 int syntax;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080019};
20
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080021static void print_string_hex(char *comment, unsigned char *str, int len)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080022{
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080023 unsigned char *c;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080024
25 printf("%s", comment);
26 for (c = str; c < str + len; c++) {
27 printf("0x%02x ", *c & 0xff);
28 }
29
30 printf("\n");
31}
32
Nguyen Anh Quynh397d0de2013-12-16 23:37:08 +080033static void print_insn_detail(cs_insn *ins)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080034{
Nguyen Anh Quynh4fe224b2013-12-24 16:49:36 +080035 cs_arm *arm = &(ins->detail->arm);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080036
37 if (arm->op_count)
38 printf("\top_count: %u\n", arm->op_count);
39
40 int i;
41 for (i = 0; i < arm->op_count; i++) {
42 cs_arm_op *op = &(arm->operands[i]);
43 switch((int)op->type) {
44 default:
45 break;
46 case ARM_OP_REG:
47 printf("\t\toperands[%u].type: REG = %s\n", i, cs_reg_name(handle, op->reg));
48 break;
49 case ARM_OP_IMM:
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080050 printf("\t\toperands[%u].type: IMM = 0x%x\n", i, op->imm);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080051 break;
52 case ARM_OP_FP:
53 printf("\t\toperands[%u].type: FP = %f\n", i, op->fp);
54 break;
55 case ARM_OP_MEM:
56 printf("\t\toperands[%u].type: MEM\n", i);
57 if (op->mem.base != X86_REG_INVALID)
58 printf("\t\t\toperands[%u].mem.base: REG = %s\n",
59 i, cs_reg_name(handle, op->mem.base));
60 if (op->mem.index != X86_REG_INVALID)
61 printf("\t\t\toperands[%u].mem.index: REG = %s\n",
62 i, cs_reg_name(handle, op->mem.index));
63 if (op->mem.scale != 1)
64 printf("\t\t\toperands[%u].mem.scale: %u\n", i, op->mem.scale);
65 if (op->mem.disp != 0)
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080066 printf("\t\t\toperands[%u].mem.disp: 0x%x\n", i, op->mem.disp);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080067
68 break;
69 case ARM_OP_PIMM:
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080070 printf("\t\toperands[%u].type: P-IMM = %u\n", i, op->imm);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080071 break;
72 case ARM_OP_CIMM:
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080073 printf("\t\toperands[%u].type: C-IMM = %u\n", i, op->imm);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080074 break;
75 }
76
77 if (op->shift.type != ARM_SFT_INVALID && op->shift.value) {
78 if (op->shift.type < ARM_SFT_ASR_REG)
79 // shift with constant value
80 printf("\t\t\tShift: %u = %u\n", op->shift.type, op->shift.value);
81 else
82 // shift with register
83 printf("\t\t\tShift: %u = %s\n", op->shift.type,
84 cs_reg_name(handle, op->shift.value));
85 }
86 }
87
88 if (arm->cc != ARM_CC_AL && arm->cc != ARM_CC_INVALID)
Nguyen Anh Quynhf122ae02014-01-05 21:45:30 +080089 printf("\tCode condition: %u\n", arm->cc);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080090
91 if (arm->update_flags)
92 printf("\tUpdate-flags: True\n");
93
94 if (arm->writeback)
95 printf("\tWrite-back: True\n");
96
97 printf("\n");
98}
99
100static void test()
101{
102//#define ARM_CODE "\x04\xe0\x2d\xe5" // str lr, [sp, #-0x4]!
103//#define ARM_CODE "\xe0\x83\x22\xe5" // str r8, [r2, #-0x3e0]!
104//#define ARM_CODE "\xf1\x02\x03\x0e" // mcreq p0x2, #0x0, r0, c0x3, c0x1, #0x7
105//#define ARM_CODE "\x00\x00\xa0\xe3" // mov r0, #0x0
106//#define ARM_CODE "\x02\x30\xc1\xe7" // strb r3, [r1, r2]
107//#define ARM_CODE "\x00\x00\x53\xe3" // cmp r3, #0x0
108//#define ARM_CODE "\x02\x00\xa1\xe2" // adc r0, r1, r2
109//#define ARM_CODE "\x21\x01\xa0\xe0" // adc r0, r0, r1, lsr #2
110//#define ARM_CODE "\x21\x01\xb0\xe0" // adcs r0, r0, r1, lsr #2
111//#define ARM_CODE "\x32\x03\xa1\xe0" // adc r0, r1, r2, lsr r3
112//#define ARM_CODE "\x22\x01\xa1\xe0" // adc r0, r1, r2, lsr #2
113//#define ARM_CODE "\x65\x61\x4f\x50" // subpl r6, pc, r5, ror #2
114//#define ARM_CODE "\x30\x30\x53\xe5" // ldrb r3, [r3, #-0x30]
115//#define ARM_CODE "\xb6\x10\xdf\xe1" // ldrh r1, [pc, #0x6]
116//#define ARM_CODE "\x02\x00\x9f\xef" // svc #0x9f0002
117//#define ARM_CODE "\x00\xc0\x27\xea" // b 0x9F0002: FIXME: disasm as "b #0x9f0000"
118//#define ARM_CODE "\x12\x13\xa0\xe1" // lsl r1, r2, r3
119//#define ARM_CODE "\x82\x11\xa0\xe1" // lsl r1, r2, #0x3
120//#define ARM_CODE "\x00\xc0\xa0\xe1" // mov ip, r0
121//#define ARM_CODE "\x02\x00\x12\xe3" // tst r2, #2
122//#define ARM_CODE "\x51\x12\xa0\xe1" // asr r1, r2
123//#define ARM_CODE "\x72\x10\xef\xe6" // uxtb r1, r2
124//#define ARM_CODE "\xe0\x0a\xb7\xee" // vcvt.f64.f32 d0, s1
125//#define ARM_CODE "\x9f\x0f\x91\xe1" // ldrex r0, [r1]
126//#define ARM_CODE "\x0f\x06\x20\xf4" // vld1.8 {d0, d1, d2}, [r0]
127//#define ARM_CODE "\x72\x00\xa1\xe6" // sxtab r0, r1, r2
128//#define ARM_CODE "\x50\x06\x84\xf2" // vmov.i32 q0, #0x40000000
129//#define ARM_CODE "\x73\xe0\xb8\xee" // mrc p0, #5, lr, c8, c3, #3
130//#define ARM_CODE "\x12\x02\x81\xe6" // pkhbt r0, r1, r2, lsl #0x4
131//#define ARM_CODE "\x12\x00\xa0\xe6" // ssat r0, #0x1, r2
132//#define ARM_CODE "\x03\x60\x2d\xe9" // push {r0, r1, sp, lr}
133//#define ARM_CODE "\x8f\x40\x60\xf4" // vld4.32 {d20, d21, d22, d23}, [r0]
134//#define ARM_CODE "\xd0\x00\xc2\xe1" // ldrd r0, r1, [r2]
135//#define ARM_CODE "\x08\xf0\xd0\xf5" // pld [r0, #0x8]
136//#define ARM_CODE "\x10\x8b\xbc\xec" // ldc p11, c8, [r12], #64
137//#define ARM_CODE "\xd4\x30\xd2\xe1" // ldrsb r3, [r2, #0x4]
138//#define ARM_CODE "\x11\x0f\xbe\xf2" // vcvt.s32.f32 d0, d1, #2
139//#define ARM_CODE "\x01\x01\x70\xe1" // cmn r0, r1, lsl #2
140//#define ARM_CODE "\x06\x00\x91\xe2" // adds r0, r1, #6
141//#define ARM_CODE "\x5b\xf0\x7f\xf5" // dmb ish
142//#define ARM_CODE "\xf7\xff\xff\xfe"
Nguyen Anh Quynh524194a2013-12-01 23:23:37 +0800143//#define ARM_CODE "\x00\x20\xbd\xe8" // ldm sp!, {sp}
144//#define ARM_CODE "\x00\xa0\xbd\xe8" // pop {sp, pc}
145//#define ARM_CODE "\x90\x04\x0E\x00" // muleq lr, r0, r4
146//#define ARM_CODE "\x90\x24\x0E\x00" // muleq lr, r0, r4
Nguyen Anh Quynh6677b992013-12-08 22:20:35 +0800147//#define ARM_CODE "\xb6\x10\x5f\xe1" // ldrh r1, [pc, #-6]
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800148#define ARM_CODE "\xED\xFF\xFF\xEB\x04\xe0\x2d\xe5\x00\x00\x00\x00\xe0\x83\x22\xe5\xf1\x02\x03\x0e\x00\x00\xa0\xe3\x02\x30\xc1\xe7\x00\x00\x53\xe3"
149//#define ARM_CODE2 "\xf0\x24"
150//#define ARM_CODE2 "\x83\xb0"
151#define ARM_CODE2 "\xd1\xe8\x00\xf0\xf0\x24\x04\x07\x1f\x3c\xf2\xc0\x00\x00\x4f\xf0\x00\x01\x46\x6c"
152//#define THUMB_CODE "\x70\x47" // bl 0x26
153//#define THUMB_CODE "\x07\xdd" // ble 0x1c
Nguyen Anh Quynhbc38a282013-12-01 23:14:17 +0800154//#define THUMB_CODE "\x00\x47" // bx r0
155//#define THUMB_CODE "\x01\x47" // bx r0
156//#define THUMB_CODE "\x02\x47" // bx r0
Nguyen Anh Quynhf1c2eee2013-12-02 12:29:07 +0800157//#define THUMB_CODE "\x0a\xbf" // itet eq
Nguyen Anh Quynh7c7a8bc2013-12-02 13:16:44 +0800158#define THUMB_CODE "\x70\x47\xeb\x46\x83\xb0\xc9\x68\x1f\xb1"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800159#define THUMB_CODE2 "\x4f\xf0\x00\x01\xbd\xe8\x00\x88\xd1\xe8\x00\xf0"
160
161 struct platform platforms[] = {
162 {
163 .arch = CS_ARCH_ARM,
164 .mode = CS_MODE_ARM,
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +0800165 .code = (unsigned char *)ARM_CODE,
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800166 .size = sizeof(ARM_CODE) - 1,
167 .comment = "ARM"
168 },
169 {
170 .arch = CS_ARCH_ARM,
171 .mode = CS_MODE_THUMB,
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +0800172 .code = (unsigned char *)THUMB_CODE,
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800173 .size = sizeof(THUMB_CODE) - 1,
174 .comment = "Thumb"
175 },
176 {
177 .arch = CS_ARCH_ARM,
178 .mode = CS_MODE_THUMB,
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +0800179 .code = (unsigned char *)ARM_CODE2,
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800180 .size = sizeof(ARM_CODE2) - 1,
181 .comment = "Thumb-mixed"
182 },
183 {
184 .arch = CS_ARCH_ARM,
185 .mode = CS_MODE_THUMB,
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +0800186 .code = (unsigned char *)THUMB_CODE2,
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800187 .size = sizeof(THUMB_CODE2) - 1,
Nguyen Anh Quynh2ff665a2014-03-11 00:18:50 +0800188 .comment = "Thumb-2 & register named with numbers",
189 .syntax = CS_OPT_SYNTAX_NOREGNAME
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800190 },
191 };
192
Nguyen Anh Quynh5df9e4b2013-12-03 15:02:12 +0800193 uint64_t address = 0x1000;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800194 cs_insn *insn;
195 int i;
196
197 for (i = 0; i < sizeof(platforms)/sizeof(platforms[0]); i++) {
Nguyen Anh Quynhceae16d2014-01-19 16:04:23 +0800198 cs_err err = cs_open(platforms[i].arch, platforms[i].mode, &handle);
199 if (err) {
200 printf("Failed on cs_open() with error returned: %u\n", err);
Nguyen Anh Quynh49146912014-02-22 16:54:44 +0800201 continue;
Nguyen Anh Quynhceae16d2014-01-19 16:04:23 +0800202 }
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800203
Nguyen Anh Quynh39b812d2014-01-07 23:36:26 +0800204 cs_option(handle, CS_OPT_DETAIL, CS_OPT_ON);
205
Nguyen Anh Quynh2ff665a2014-03-11 00:18:50 +0800206 if (platforms[i].syntax)
207 cs_option(handle, CS_OPT_SYNTAX, platforms[i].syntax);
208
Nguyen Anh Quynh04c19be2013-12-25 13:26:22 +0800209 size_t count = cs_disasm_ex(handle, platforms[i].code, platforms[i].size, address, 0, &insn);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800210 if (count) {
211 printf("****************\n");
212 printf("Platform: %s\n", platforms[i].comment);
213 print_string_hex("Code:", platforms[i].code, platforms[i].size);
214 printf("Disasm:\n");
215
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +0800216 size_t j;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800217 for (j = 0; j < count; j++) {
Nguyen Anh Quynh7b7b40c2013-12-03 12:24:06 +0800218 printf("0x%"PRIx64":\t%s\t%s\n", insn[j].address, insn[j].mnemonic, insn[j].op_str);
Nguyen Anh Quynh397d0de2013-12-16 23:37:08 +0800219 print_insn_detail(&insn[j]);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800220 }
Nguyen Anh Quynh7b7b40c2013-12-03 12:24:06 +0800221 printf("0x%"PRIx64":\n", insn[j-1].address + insn[j-1].size);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800222
Nguyen Anh Quynh04c19be2013-12-25 13:26:22 +0800223 // free memory allocated by cs_disasm_ex()
Nguyen Anh Quynh4fe224b2013-12-24 16:49:36 +0800224 cs_free(insn, count);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800225 } else {
226 printf("****************\n");
227 printf("Platform: %s\n", platforms[i].comment);
228 print_string_hex("Code:", platforms[i].code, platforms[i].size);
229 printf("ERROR: Failed to disasm given code!\n");
230 }
231
232 printf("\n");
233
Nguyen Anh Quynh226d7dc2014-02-27 22:20:39 +0800234 cs_close(&handle);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800235 }
236}
237
238int main()
239{
240 test();
241
242 return 0;
243}
244