blob: 1c2fdf3680a1b46d279df617e97315ea8b94e5c7 [file] [log] [blame]
/* Capstone Disassembler Engine */
/* By Nguyen Anh Quynh <aquynh@gmail.com>, 2013 */
3
4#include <stdio.h>
5#include <stdlib.h>
Cr4sh19ee2d12015-03-29 18:29:06 +08006#include "../myinttypes.h"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +08007
pancake9c10ace2015-02-24 04:55:55 +01008#include <capstone/capstone.h>
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +08009
10static csh handle;
11
12struct platform {
13 cs_arch arch;
14 cs_mode mode;
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080015 unsigned char *code;
16 size_t size;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080017 char *comment;
Nguyen Anh Quynh2ff665a2014-03-11 00:18:50 +080018 int syntax;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080019};
20
/*
 * Print `comment`, then each of the `len` bytes at `str` as "0xNN " (two
 * lowercase hex digits followed by a space), then a newline.
 *
 * Neither argument is written through, so both are const-qualified; callers
 * passing non-const pointers are unaffected.
 */
static void print_string_hex(const char *comment, const unsigned char *str, size_t len)
{
	size_t i;

	printf("%s", comment);
	// index loop: never forms str + len, so len == 0 performs no pointer arithmetic
	for (i = 0; i < len; i++) {
		printf("0x%02x ", str[i] & 0xff);
	}

	printf("\n");
}
32
Nguyen Anh Quynh29f777b2015-04-07 11:59:26 +080033static void print_insn_detail(csh handle, cs_insn *ins)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080034{
Nguyen Anh Quynh54015f42014-04-10 00:02:04 +080035 cs_arm *arm;
Nguyen Anh Quynh5b556e52014-04-11 10:15:26 +080036 int i;
Nguyen Anh Quynh29f777b2015-04-07 11:59:26 +080037 cs_regs regs_read, regs_write;
38 uint8_t regs_read_count, regs_write_count;
Nguyen Anh Quynh54015f42014-04-10 00:02:04 +080039
40 // detail can be NULL on "data" instruction if SKIPDATA option is turned ON
41 if (ins->detail == NULL)
42 return;
43
44 arm = &(ins->detail->arm);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080045
46 if (arm->op_count)
47 printf("\top_count: %u\n", arm->op_count);
48
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080049 for (i = 0; i < arm->op_count; i++) {
50 cs_arm_op *op = &(arm->operands[i]);
51 switch((int)op->type) {
52 default:
53 break;
54 case ARM_OP_REG:
55 printf("\t\toperands[%u].type: REG = %s\n", i, cs_reg_name(handle, op->reg));
56 break;
57 case ARM_OP_IMM:
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080058 printf("\t\toperands[%u].type: IMM = 0x%x\n", i, op->imm);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080059 break;
60 case ARM_OP_FP:
61 printf("\t\toperands[%u].type: FP = %f\n", i, op->fp);
62 break;
63 case ARM_OP_MEM:
64 printf("\t\toperands[%u].type: MEM\n", i);
65 if (op->mem.base != X86_REG_INVALID)
66 printf("\t\t\toperands[%u].mem.base: REG = %s\n",
67 i, cs_reg_name(handle, op->mem.base));
68 if (op->mem.index != X86_REG_INVALID)
69 printf("\t\t\toperands[%u].mem.index: REG = %s\n",
70 i, cs_reg_name(handle, op->mem.index));
71 if (op->mem.scale != 1)
72 printf("\t\t\toperands[%u].mem.scale: %u\n", i, op->mem.scale);
73 if (op->mem.disp != 0)
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080074 printf("\t\t\toperands[%u].mem.disp: 0x%x\n", i, op->mem.disp);
Nguyen Anh Quynh6c34c662015-01-12 15:38:06 +080075 if (op->mem.lshift != 0)
76 printf("\t\t\toperands[%u].mem.lshift: 0x%x\n", i, op->mem.lshift);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080077
78 break;
79 case ARM_OP_PIMM:
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080080 printf("\t\toperands[%u].type: P-IMM = %u\n", i, op->imm);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080081 break;
82 case ARM_OP_CIMM:
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080083 printf("\t\toperands[%u].type: C-IMM = %u\n", i, op->imm);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080084 break;
Nguyen Anh Quynh04d9f8e2014-09-01 23:27:24 +080085 case ARM_OP_SETEND:
86 printf("\t\toperands[%u].type: SETEND = %s\n", i, op->setend == ARM_SETEND_BE? "be" : "le");
87 break;
88 case ARM_OP_SYSREG:
89 printf("\t\toperands[%u].type: SYSREG = %u\n", i, op->reg);
90 break;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080091 }
92
Nguyen Anh Quynh29f777b2015-04-07 11:59:26 +080093 if (op->neon_lane != -1) {
94 printf("\t\toperands[%u].neon_lane = %u\n", i, op->neon_lane);
95 }
96
97 switch(op->access) {
98 default:
99 break;
100 case CS_AC_READ:
101 printf("\t\toperands[%u].access: READ\n", i);
102 break;
103 case CS_AC_WRITE:
104 printf("\t\toperands[%u].access: WRITE\n", i);
105 break;
106 case CS_AC_READ | CS_AC_WRITE:
107 printf("\t\toperands[%u].access: READ | WRITE\n", i);
108 break;
109 }
110
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800111 if (op->shift.type != ARM_SFT_INVALID && op->shift.value) {
112 if (op->shift.type < ARM_SFT_ASR_REG)
113 // shift with constant value
114 printf("\t\t\tShift: %u = %u\n", op->shift.type, op->shift.value);
115 else
116 // shift with register
117 printf("\t\t\tShift: %u = %s\n", op->shift.type,
118 cs_reg_name(handle, op->shift.value));
119 }
Nguyen Anh Quynh04d9f8e2014-09-01 23:27:24 +0800120
121 if (op->vector_index != -1) {
122 printf("\t\toperands[%u].vector_index = %u\n", i, op->vector_index);
123 }
Nguyen Anh Quynh8fb2eab2014-10-06 20:27:25 +0800124
125 if (op->subtracted)
126 printf("\t\tSubtracted: True\n");
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800127 }
128
129 if (arm->cc != ARM_CC_AL && arm->cc != ARM_CC_INVALID)
Nguyen Anh Quynhf122ae02014-01-05 21:45:30 +0800130 printf("\tCode condition: %u\n", arm->cc);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800131
132 if (arm->update_flags)
133 printf("\tUpdate-flags: True\n");
134
135 if (arm->writeback)
136 printf("\tWrite-back: True\n");
137
Nguyen Anh Quynh04d9f8e2014-09-01 23:27:24 +0800138 if (arm->cps_mode)
139 printf("\tCPSI-mode: %u\n", arm->cps_mode);
140
141 if (arm->cps_flag)
142 printf("\tCPSI-flag: %u\n", arm->cps_flag);
143
144 if (arm->vector_data)
145 printf("\tVector-data: %u\n", arm->vector_data);
146
147 if (arm->vector_size)
148 printf("\tVector-size: %u\n", arm->vector_size);
149
150 if (arm->usermode)
151 printf("\tUser-mode: True\n");
152
Nguyen Anh Quynh8cdafda2014-11-11 22:30:30 +0800153 if (arm->mem_barrier)
154 printf("\tMemory-barrier: %u\n", arm->mem_barrier);
155
Nguyen Anh Quynh29f777b2015-04-07 11:59:26 +0800156 // Print out all registers accessed by this instruction (either implicit or explicit)
157 if (!cs_regs_access(handle, ins,
158 regs_read, &regs_read_count,
159 regs_write, &regs_write_count)) {
160 if (regs_read_count) {
161 printf("\tRegisters read:");
162 for(i = 0; i < regs_read_count; i++) {
163 printf(" %s", cs_reg_name(handle, regs_read[i]));
164 }
165 printf("\n");
166 }
167
168 if (regs_write_count) {
169 printf("\tRegisters modified:");
170 for(i = 0; i < regs_write_count; i++) {
171 printf(" %s", cs_reg_name(handle, regs_write[i]));
172 }
173 printf("\n");
174 }
175 }
176
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800177 printf("\n");
178}
179
180static void test()
181{
182//#define ARM_CODE "\x04\xe0\x2d\xe5" // str lr, [sp, #-0x4]!
183//#define ARM_CODE "\xe0\x83\x22\xe5" // str r8, [r2, #-0x3e0]!
184//#define ARM_CODE "\xf1\x02\x03\x0e" // mcreq p0x2, #0x0, r0, c0x3, c0x1, #0x7
185//#define ARM_CODE "\x00\x00\xa0\xe3" // mov r0, #0x0
186//#define ARM_CODE "\x02\x30\xc1\xe7" // strb r3, [r1, r2]
187//#define ARM_CODE "\x00\x00\x53\xe3" // cmp r3, #0x0
188//#define ARM_CODE "\x02\x00\xa1\xe2" // adc r0, r1, r2
189//#define ARM_CODE "\x21\x01\xa0\xe0" // adc r0, r0, r1, lsr #2
190//#define ARM_CODE "\x21\x01\xb0\xe0" // adcs r0, r0, r1, lsr #2
191//#define ARM_CODE "\x32\x03\xa1\xe0" // adc r0, r1, r2, lsr r3
192//#define ARM_CODE "\x22\x01\xa1\xe0" // adc r0, r1, r2, lsr #2
193//#define ARM_CODE "\x65\x61\x4f\x50" // subpl r6, pc, r5, ror #2
194//#define ARM_CODE "\x30\x30\x53\xe5" // ldrb r3, [r3, #-0x30]
195//#define ARM_CODE "\xb6\x10\xdf\xe1" // ldrh r1, [pc, #0x6]
196//#define ARM_CODE "\x02\x00\x9f\xef" // svc #0x9f0002
197//#define ARM_CODE "\x00\xc0\x27\xea" // b 0x9F0002: FIXME: disasm as "b #0x9f0000"
198//#define ARM_CODE "\x12\x13\xa0\xe1" // lsl r1, r2, r3
199//#define ARM_CODE "\x82\x11\xa0\xe1" // lsl r1, r2, #0x3
200//#define ARM_CODE "\x00\xc0\xa0\xe1" // mov ip, r0
201//#define ARM_CODE "\x02\x00\x12\xe3" // tst r2, #2
202//#define ARM_CODE "\x51\x12\xa0\xe1" // asr r1, r2
203//#define ARM_CODE "\x72\x10\xef\xe6" // uxtb r1, r2
204//#define ARM_CODE "\xe0\x0a\xb7\xee" // vcvt.f64.f32 d0, s1
205//#define ARM_CODE "\x9f\x0f\x91\xe1" // ldrex r0, [r1]
206//#define ARM_CODE "\x0f\x06\x20\xf4" // vld1.8 {d0, d1, d2}, [r0]
207//#define ARM_CODE "\x72\x00\xa1\xe6" // sxtab r0, r1, r2
208//#define ARM_CODE "\x50\x06\x84\xf2" // vmov.i32 q0, #0x40000000
209//#define ARM_CODE "\x73\xe0\xb8\xee" // mrc p0, #5, lr, c8, c3, #3
210//#define ARM_CODE "\x12\x02\x81\xe6" // pkhbt r0, r1, r2, lsl #0x4
211//#define ARM_CODE "\x12\x00\xa0\xe6" // ssat r0, #0x1, r2
212//#define ARM_CODE "\x03\x60\x2d\xe9" // push {r0, r1, sp, lr}
213//#define ARM_CODE "\x8f\x40\x60\xf4" // vld4.32 {d20, d21, d22, d23}, [r0]
214//#define ARM_CODE "\xd0\x00\xc2\xe1" // ldrd r0, r1, [r2]
215//#define ARM_CODE "\x08\xf0\xd0\xf5" // pld [r0, #0x8]
216//#define ARM_CODE "\x10\x8b\xbc\xec" // ldc p11, c8, [r12], #64
217//#define ARM_CODE "\xd4\x30\xd2\xe1" // ldrsb r3, [r2, #0x4]
218//#define ARM_CODE "\x11\x0f\xbe\xf2" // vcvt.s32.f32 d0, d1, #2
219//#define ARM_CODE "\x01\x01\x70\xe1" // cmn r0, r1, lsl #2
220//#define ARM_CODE "\x06\x00\x91\xe2" // adds r0, r1, #6
221//#define ARM_CODE "\x5b\xf0\x7f\xf5" // dmb ish
222//#define ARM_CODE "\xf7\xff\xff\xfe"
Nguyen Anh Quynh524194a2013-12-01 23:23:37 +0800223//#define ARM_CODE "\x00\x20\xbd\xe8" // ldm sp!, {sp}
224//#define ARM_CODE "\x00\xa0\xbd\xe8" // pop {sp, pc}
225//#define ARM_CODE "\x90\x04\x0E\x00" // muleq lr, r0, r4
226//#define ARM_CODE "\x90\x24\x0E\x00" // muleq lr, r0, r4
Nguyen Anh Quynh6677b992013-12-08 22:20:35 +0800227//#define ARM_CODE "\xb6\x10\x5f\xe1" // ldrh r1, [pc, #-6]
Nguyen Anh Quynh29f777b2015-04-07 11:59:26 +0800228
229#define ARM_CODE "\x86\x48\x60\xf4\x4d\x0f\xe2\xf4\xED\xFF\xFF\xEB\x04\xe0\x2d\xe5\x00\x00\x00\x00\xe0\x83\x22\xe5\xf1\x02\x03\x0e\x00\x00\xa0\xe3\x02\x30\xc1\xe7\x00\x00\x53\xe3\x00\x02\x01\xf1\x05\x40\xd0\xe8\xf4\x80\x00\x00"
230
231//#define ARM_CODE "\x86\x48\x60\xf4"
232
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800233//#define ARM_CODE2 "\xf0\x24"
234//#define ARM_CODE2 "\x83\xb0"
235#define ARM_CODE2 "\xd1\xe8\x00\xf0\xf0\x24\x04\x07\x1f\x3c\xf2\xc0\x00\x00\x4f\xf0\x00\x01\x46\x6c"
236//#define THUMB_CODE "\x70\x47" // bl 0x26
237//#define THUMB_CODE "\x07\xdd" // ble 0x1c
Nguyen Anh Quynhbc38a282013-12-01 23:14:17 +0800238//#define THUMB_CODE "\x00\x47" // bx r0
239//#define THUMB_CODE "\x01\x47" // bx r0
240//#define THUMB_CODE "\x02\x47" // bx r0
Nguyen Anh Quynhf1c2eee2013-12-02 12:29:07 +0800241//#define THUMB_CODE "\x0a\xbf" // itet eq
Nguyen Anh Quynh29f777b2015-04-07 11:59:26 +0800242
243#define THUMB_CODE "\x60\xf9\x1f\x04\xe0\xf9\x4f\x07\x70\x47\xeb\x46\x83\xb0\xc9\x68\x1f\xb1\x30\xbf\xaf\xf3\x20\x84\x52\xf8\x23\xf0"
244//#define THUMB_CODE "\xe0\xf9\x4f\x07"
245
Nguyen Anh Quynh04d9f8e2014-09-01 23:27:24 +0800246#define THUMB_CODE2 "\x4f\xf0\x00\x01\xbd\xe8\x00\x88\xd1\xe8\x00\xf0\x18\xbf\xad\xbf\xf3\xff\x0b\x0c\x86\xf3\x00\x89\x80\xf3\x00\x8c\x4f\xfa\x99\xf6\xd0\xff\xa2\x01"
Nguyen Anh Quynh83466d42014-11-11 21:44:42 +0800247#define THUMB_MCLASS "\xef\xf3\x02\x80"
248#define ARMV8 "\xe0\x3b\xb2\xee\x42\x00\x01\xe1\x51\xf0\x7f\xf5"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800249
250 struct platform platforms[] = {
251 {
Axel 0vercl0k Souchet6b2395f2014-05-09 21:08:40 +0100252 CS_ARCH_ARM,
253 CS_MODE_ARM,
254 (unsigned char *)ARM_CODE,
255 sizeof(ARM_CODE) - 1,
256 "ARM"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800257 },
258 {
Axel 0vercl0k Souchet6b2395f2014-05-09 21:08:40 +0100259 CS_ARCH_ARM,
260 CS_MODE_THUMB,
261 (unsigned char *)THUMB_CODE,
262 sizeof(THUMB_CODE) - 1,
263 "Thumb"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800264 },
265 {
Axel 0vercl0k Souchet6b2395f2014-05-09 21:08:40 +0100266 CS_ARCH_ARM,
267 CS_MODE_THUMB,
268 (unsigned char *)ARM_CODE2,
269 sizeof(ARM_CODE2) - 1,
270 "Thumb-mixed"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800271 },
272 {
Axel 0vercl0k Souchet6b2395f2014-05-09 21:08:40 +0100273 CS_ARCH_ARM,
274 CS_MODE_THUMB,
275 (unsigned char *)THUMB_CODE2,
276 sizeof(THUMB_CODE2) - 1,
277 "Thumb-2 & register named with numbers",
278 CS_OPT_SYNTAX_NOREGNAME
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800279 },
Nguyen Anh Quynh83466d42014-11-11 21:44:42 +0800280 {
281 CS_ARCH_ARM,
282 (cs_mode)(CS_MODE_THUMB + CS_MODE_MCLASS),
283 (unsigned char*)THUMB_MCLASS,
284 sizeof(THUMB_MCLASS) - 1,
285 "Thumb-MClass"
286 },
287 {
288 CS_ARCH_ARM,
289 (cs_mode)(CS_MODE_ARM + CS_MODE_V8),
290 (unsigned char*)ARMV8,
291 sizeof(ARMV8) - 1,
292 "Arm-V8"
293 },
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800294 };
295
Nguyen Anh Quynh5df9e4b2013-12-03 15:02:12 +0800296 uint64_t address = 0x1000;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800297 cs_insn *insn;
298 int i;
Nguyen Anh Quynh5b556e52014-04-11 10:15:26 +0800299 size_t count;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800300
301 for (i = 0; i < sizeof(platforms)/sizeof(platforms[0]); i++) {
Nguyen Anh Quynhceae16d2014-01-19 16:04:23 +0800302 cs_err err = cs_open(platforms[i].arch, platforms[i].mode, &handle);
303 if (err) {
304 printf("Failed on cs_open() with error returned: %u\n", err);
Nguyen Anh Quynh49146912014-02-22 16:54:44 +0800305 continue;
Nguyen Anh Quynhceae16d2014-01-19 16:04:23 +0800306 }
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800307
Nguyen Anh Quynh39b812d2014-01-07 23:36:26 +0800308 cs_option(handle, CS_OPT_DETAIL, CS_OPT_ON);
309
Nguyen Anh Quynh2ff665a2014-03-11 00:18:50 +0800310 if (platforms[i].syntax)
311 cs_option(handle, CS_OPT_SYNTAX, platforms[i].syntax);
312
Nguyen Anh Quynh0beb0d42014-08-27 22:55:29 +0800313 count = cs_disasm(handle, platforms[i].code, platforms[i].size, address, 0, &insn);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800314 if (count) {
Nguyen Anh Quynh5b556e52014-04-11 10:15:26 +0800315 size_t j;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800316 printf("****************\n");
317 printf("Platform: %s\n", platforms[i].comment);
318 print_string_hex("Code:", platforms[i].code, platforms[i].size);
319 printf("Disasm:\n");
320
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800321 for (j = 0; j < count; j++) {
Nguyen Anh Quynh7b7b40c2013-12-03 12:24:06 +0800322 printf("0x%"PRIx64":\t%s\t%s\n", insn[j].address, insn[j].mnemonic, insn[j].op_str);
Nguyen Anh Quynh29f777b2015-04-07 11:59:26 +0800323 print_insn_detail(handle, &insn[j]);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800324 }
Nguyen Anh Quynh7b7b40c2013-12-03 12:24:06 +0800325 printf("0x%"PRIx64":\n", insn[j-1].address + insn[j-1].size);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800326
Nguyen Anh Quynh0beb0d42014-08-27 22:55:29 +0800327 // free memory allocated by cs_disasm()
Nguyen Anh Quynh4fe224b2013-12-24 16:49:36 +0800328 cs_free(insn, count);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800329 } else {
330 printf("****************\n");
331 printf("Platform: %s\n", platforms[i].comment);
332 print_string_hex("Code:", platforms[i].code, platforms[i].size);
333 printf("ERROR: Failed to disasm given code!\n");
334 }
335
336 printf("\n");
337
Nguyen Anh Quynh226d7dc2014-02-27 22:20:39 +0800338 cs_close(&handle);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800339 }
340}
341
/* Program entry point: run the ARM disassembly test and exit with status 0. */
int main(void)
{
	test();

	return 0;
}
348