Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 1 | /* Capstone Disassembler Engine */ |
| 2 | /* By Nguyen Anh Quynh <aquynh@gmail.com>, 2013> */ |
| 3 | |
| 4 | #include <stdio.h> |
| 5 | #include <stdlib.h> |
| 6 | #include <inttypes.h> |
| 7 | |
| 8 | #include <capstone.h> |
| 9 | |
| 10 | static csh handle; |
| 11 | |
| 12 | struct platform { |
| 13 | cs_arch arch; |
| 14 | cs_mode mode; |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 15 | unsigned char *code; |
| 16 | size_t size; |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 17 | char *comment; |
Nguyen Anh Quynh | 2ff665a | 2014-03-11 00:18:50 +0800 | [diff] [blame] | 18 | int syntax; |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 19 | }; |
| 20 | |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 21 | static void print_string_hex(char *comment, unsigned char *str, int len) |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 22 | { |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 23 | unsigned char *c; |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 24 | |
| 25 | printf("%s", comment); |
| 26 | for (c = str; c < str + len; c++) { |
| 27 | printf("0x%02x ", *c & 0xff); |
| 28 | } |
| 29 | |
| 30 | printf("\n"); |
| 31 | } |
| 32 | |
Nguyen Anh Quynh | 397d0de | 2013-12-16 23:37:08 +0800 | [diff] [blame] | 33 | static void print_insn_detail(cs_insn *ins) |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 34 | { |
Nguyen Anh Quynh | 4fe224b | 2013-12-24 16:49:36 +0800 | [diff] [blame] | 35 | cs_arm *arm = &(ins->detail->arm); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 36 | |
| 37 | if (arm->op_count) |
| 38 | printf("\top_count: %u\n", arm->op_count); |
| 39 | |
| 40 | int i; |
| 41 | for (i = 0; i < arm->op_count; i++) { |
| 42 | cs_arm_op *op = &(arm->operands[i]); |
| 43 | switch((int)op->type) { |
| 44 | default: |
| 45 | break; |
| 46 | case ARM_OP_REG: |
| 47 | printf("\t\toperands[%u].type: REG = %s\n", i, cs_reg_name(handle, op->reg)); |
| 48 | break; |
| 49 | case ARM_OP_IMM: |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 50 | printf("\t\toperands[%u].type: IMM = 0x%x\n", i, op->imm); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 51 | break; |
| 52 | case ARM_OP_FP: |
| 53 | printf("\t\toperands[%u].type: FP = %f\n", i, op->fp); |
| 54 | break; |
| 55 | case ARM_OP_MEM: |
| 56 | printf("\t\toperands[%u].type: MEM\n", i); |
| 57 | if (op->mem.base != X86_REG_INVALID) |
| 58 | printf("\t\t\toperands[%u].mem.base: REG = %s\n", |
| 59 | i, cs_reg_name(handle, op->mem.base)); |
| 60 | if (op->mem.index != X86_REG_INVALID) |
| 61 | printf("\t\t\toperands[%u].mem.index: REG = %s\n", |
| 62 | i, cs_reg_name(handle, op->mem.index)); |
| 63 | if (op->mem.scale != 1) |
| 64 | printf("\t\t\toperands[%u].mem.scale: %u\n", i, op->mem.scale); |
| 65 | if (op->mem.disp != 0) |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 66 | printf("\t\t\toperands[%u].mem.disp: 0x%x\n", i, op->mem.disp); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 67 | |
| 68 | break; |
| 69 | case ARM_OP_PIMM: |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 70 | printf("\t\toperands[%u].type: P-IMM = %u\n", i, op->imm); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 71 | break; |
| 72 | case ARM_OP_CIMM: |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 73 | printf("\t\toperands[%u].type: C-IMM = %u\n", i, op->imm); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 74 | break; |
| 75 | } |
| 76 | |
| 77 | if (op->shift.type != ARM_SFT_INVALID && op->shift.value) { |
| 78 | if (op->shift.type < ARM_SFT_ASR_REG) |
| 79 | // shift with constant value |
| 80 | printf("\t\t\tShift: %u = %u\n", op->shift.type, op->shift.value); |
| 81 | else |
| 82 | // shift with register |
| 83 | printf("\t\t\tShift: %u = %s\n", op->shift.type, |
| 84 | cs_reg_name(handle, op->shift.value)); |
| 85 | } |
| 86 | } |
| 87 | |
| 88 | if (arm->cc != ARM_CC_AL && arm->cc != ARM_CC_INVALID) |
Nguyen Anh Quynh | f122ae0 | 2014-01-05 21:45:30 +0800 | [diff] [blame] | 89 | printf("\tCode condition: %u\n", arm->cc); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 90 | |
| 91 | if (arm->update_flags) |
| 92 | printf("\tUpdate-flags: True\n"); |
| 93 | |
| 94 | if (arm->writeback) |
| 95 | printf("\tWrite-back: True\n"); |
| 96 | |
| 97 | printf("\n"); |
| 98 | } |
| 99 | |
| 100 | static void test() |
| 101 | { |
| 102 | //#define ARM_CODE "\x04\xe0\x2d\xe5" // str lr, [sp, #-0x4]! |
| 103 | //#define ARM_CODE "\xe0\x83\x22\xe5" // str r8, [r2, #-0x3e0]! |
| 104 | //#define ARM_CODE "\xf1\x02\x03\x0e" // mcreq p0x2, #0x0, r0, c0x3, c0x1, #0x7 |
| 105 | //#define ARM_CODE "\x00\x00\xa0\xe3" // mov r0, #0x0 |
| 106 | //#define ARM_CODE "\x02\x30\xc1\xe7" // strb r3, [r1, r2] |
| 107 | //#define ARM_CODE "\x00\x00\x53\xe3" // cmp r3, #0x0 |
| 108 | //#define ARM_CODE "\x02\x00\xa1\xe2" // adc r0, r1, r2 |
| 109 | //#define ARM_CODE "\x21\x01\xa0\xe0" // adc r0, r0, r1, lsr #2 |
| 110 | //#define ARM_CODE "\x21\x01\xb0\xe0" // adcs r0, r0, r1, lsr #2 |
| 111 | //#define ARM_CODE "\x32\x03\xa1\xe0" // adc r0, r1, r2, lsr r3 |
| 112 | //#define ARM_CODE "\x22\x01\xa1\xe0" // adc r0, r1, r2, lsr #2 |
| 113 | //#define ARM_CODE "\x65\x61\x4f\x50" // subpl r6, pc, r5, ror #2 |
| 114 | //#define ARM_CODE "\x30\x30\x53\xe5" // ldrb r3, [r3, #-0x30] |
| 115 | //#define ARM_CODE "\xb6\x10\xdf\xe1" // ldrh r1, [pc, #0x6] |
| 116 | //#define ARM_CODE "\x02\x00\x9f\xef" // svc #0x9f0002 |
| 117 | //#define ARM_CODE "\x00\xc0\x27\xea" // b 0x9F0002: FIXME: disasm as "b #0x9f0000" |
| 118 | //#define ARM_CODE "\x12\x13\xa0\xe1" // lsl r1, r2, r3 |
| 119 | //#define ARM_CODE "\x82\x11\xa0\xe1" // lsl r1, r2, #0x3 |
| 120 | //#define ARM_CODE "\x00\xc0\xa0\xe1" // mov ip, r0 |
| 121 | //#define ARM_CODE "\x02\x00\x12\xe3" // tst r2, #2 |
| 122 | //#define ARM_CODE "\x51\x12\xa0\xe1" // asr r1, r2 |
| 123 | //#define ARM_CODE "\x72\x10\xef\xe6" // uxtb r1, r2 |
| 124 | //#define ARM_CODE "\xe0\x0a\xb7\xee" // vcvt.f64.f32 d0, s1 |
| 125 | //#define ARM_CODE "\x9f\x0f\x91\xe1" // ldrex r0, [r1] |
| 126 | //#define ARM_CODE "\x0f\x06\x20\xf4" // vld1.8 {d0, d1, d2}, [r0] |
| 127 | //#define ARM_CODE "\x72\x00\xa1\xe6" // sxtab r0, r1, r2 |
| 128 | //#define ARM_CODE "\x50\x06\x84\xf2" // vmov.i32 q0, #0x40000000 |
| 129 | //#define ARM_CODE "\x73\xe0\xb8\xee" // mrc p0, #5, lr, c8, c3, #3 |
| 130 | //#define ARM_CODE "\x12\x02\x81\xe6" // pkhbt r0, r1, r2, lsl #0x4 |
| 131 | //#define ARM_CODE "\x12\x00\xa0\xe6" // ssat r0, #0x1, r2 |
| 132 | //#define ARM_CODE "\x03\x60\x2d\xe9" // push {r0, r1, sp, lr} |
| 133 | //#define ARM_CODE "\x8f\x40\x60\xf4" // vld4.32 {d20, d21, d22, d23}, [r0] |
| 134 | //#define ARM_CODE "\xd0\x00\xc2\xe1" // ldrd r0, r1, [r2] |
| 135 | //#define ARM_CODE "\x08\xf0\xd0\xf5" // pld [r0, #0x8] |
| 136 | //#define ARM_CODE "\x10\x8b\xbc\xec" // ldc p11, c8, [r12], #64 |
| 137 | //#define ARM_CODE "\xd4\x30\xd2\xe1" // ldrsb r3, [r2, #0x4] |
| 138 | //#define ARM_CODE "\x11\x0f\xbe\xf2" // vcvt.s32.f32 d0, d1, #2 |
| 139 | //#define ARM_CODE "\x01\x01\x70\xe1" // cmn r0, r1, lsl #2 |
| 140 | //#define ARM_CODE "\x06\x00\x91\xe2" // adds r0, r1, #6 |
| 141 | //#define ARM_CODE "\x5b\xf0\x7f\xf5" // dmb ish |
| 142 | //#define ARM_CODE "\xf7\xff\xff\xfe" |
Nguyen Anh Quynh | 524194a | 2013-12-01 23:23:37 +0800 | [diff] [blame] | 143 | //#define ARM_CODE "\x00\x20\xbd\xe8" // ldm sp!, {sp} |
| 144 | //#define ARM_CODE "\x00\xa0\xbd\xe8" // pop {sp, pc} |
| 145 | //#define ARM_CODE "\x90\x04\x0E\x00" // muleq lr, r0, r4 |
| 146 | //#define ARM_CODE "\x90\x24\x0E\x00" // muleq lr, r0, r4 |
Nguyen Anh Quynh | 6677b99 | 2013-12-08 22:20:35 +0800 | [diff] [blame] | 147 | //#define ARM_CODE "\xb6\x10\x5f\xe1" // ldrh r1, [pc, #-6] |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 148 | #define ARM_CODE "\xED\xFF\xFF\xEB\x04\xe0\x2d\xe5\x00\x00\x00\x00\xe0\x83\x22\xe5\xf1\x02\x03\x0e\x00\x00\xa0\xe3\x02\x30\xc1\xe7\x00\x00\x53\xe3" |
| 149 | //#define ARM_CODE2 "\xf0\x24" |
| 150 | //#define ARM_CODE2 "\x83\xb0" |
| 151 | #define ARM_CODE2 "\xd1\xe8\x00\xf0\xf0\x24\x04\x07\x1f\x3c\xf2\xc0\x00\x00\x4f\xf0\x00\x01\x46\x6c" |
| 152 | //#define THUMB_CODE "\x70\x47" // bl 0x26 |
| 153 | //#define THUMB_CODE "\x07\xdd" // ble 0x1c |
Nguyen Anh Quynh | bc38a28 | 2013-12-01 23:14:17 +0800 | [diff] [blame] | 154 | //#define THUMB_CODE "\x00\x47" // bx r0 |
| 155 | //#define THUMB_CODE "\x01\x47" // bx r0 |
| 156 | //#define THUMB_CODE "\x02\x47" // bx r0 |
Nguyen Anh Quynh | f1c2eee | 2013-12-02 12:29:07 +0800 | [diff] [blame] | 157 | //#define THUMB_CODE "\x0a\xbf" // itet eq |
Nguyen Anh Quynh | 7c7a8bc | 2013-12-02 13:16:44 +0800 | [diff] [blame] | 158 | #define THUMB_CODE "\x70\x47\xeb\x46\x83\xb0\xc9\x68\x1f\xb1" |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 159 | #define THUMB_CODE2 "\x4f\xf0\x00\x01\xbd\xe8\x00\x88\xd1\xe8\x00\xf0" |
| 160 | |
| 161 | struct platform platforms[] = { |
| 162 | { |
| 163 | .arch = CS_ARCH_ARM, |
| 164 | .mode = CS_MODE_ARM, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 165 | .code = (unsigned char *)ARM_CODE, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 166 | .size = sizeof(ARM_CODE) - 1, |
| 167 | .comment = "ARM" |
| 168 | }, |
| 169 | { |
| 170 | .arch = CS_ARCH_ARM, |
| 171 | .mode = CS_MODE_THUMB, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 172 | .code = (unsigned char *)THUMB_CODE, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 173 | .size = sizeof(THUMB_CODE) - 1, |
| 174 | .comment = "Thumb" |
| 175 | }, |
| 176 | { |
| 177 | .arch = CS_ARCH_ARM, |
| 178 | .mode = CS_MODE_THUMB, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 179 | .code = (unsigned char *)ARM_CODE2, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 180 | .size = sizeof(ARM_CODE2) - 1, |
| 181 | .comment = "Thumb-mixed" |
| 182 | }, |
| 183 | { |
| 184 | .arch = CS_ARCH_ARM, |
| 185 | .mode = CS_MODE_THUMB, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 186 | .code = (unsigned char *)THUMB_CODE2, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 187 | .size = sizeof(THUMB_CODE2) - 1, |
Nguyen Anh Quynh | 2ff665a | 2014-03-11 00:18:50 +0800 | [diff] [blame] | 188 | .comment = "Thumb-2 & register named with numbers", |
| 189 | .syntax = CS_OPT_SYNTAX_NOREGNAME |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 190 | }, |
| 191 | }; |
| 192 | |
Nguyen Anh Quynh | 5df9e4b | 2013-12-03 15:02:12 +0800 | [diff] [blame] | 193 | uint64_t address = 0x1000; |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 194 | cs_insn *insn; |
| 195 | int i; |
| 196 | |
| 197 | for (i = 0; i < sizeof(platforms)/sizeof(platforms[0]); i++) { |
Nguyen Anh Quynh | ceae16d | 2014-01-19 16:04:23 +0800 | [diff] [blame] | 198 | cs_err err = cs_open(platforms[i].arch, platforms[i].mode, &handle); |
| 199 | if (err) { |
| 200 | printf("Failed on cs_open() with error returned: %u\n", err); |
Nguyen Anh Quynh | 4914691 | 2014-02-22 16:54:44 +0800 | [diff] [blame] | 201 | continue; |
Nguyen Anh Quynh | ceae16d | 2014-01-19 16:04:23 +0800 | [diff] [blame] | 202 | } |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 203 | |
Nguyen Anh Quynh | 39b812d | 2014-01-07 23:36:26 +0800 | [diff] [blame] | 204 | cs_option(handle, CS_OPT_DETAIL, CS_OPT_ON); |
| 205 | |
Nguyen Anh Quynh | 2ff665a | 2014-03-11 00:18:50 +0800 | [diff] [blame] | 206 | if (platforms[i].syntax) |
| 207 | cs_option(handle, CS_OPT_SYNTAX, platforms[i].syntax); |
| 208 | |
Nguyen Anh Quynh | 04c19be | 2013-12-25 13:26:22 +0800 | [diff] [blame] | 209 | size_t count = cs_disasm_ex(handle, platforms[i].code, platforms[i].size, address, 0, &insn); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 210 | if (count) { |
| 211 | printf("****************\n"); |
| 212 | printf("Platform: %s\n", platforms[i].comment); |
| 213 | print_string_hex("Code:", platforms[i].code, platforms[i].size); |
| 214 | printf("Disasm:\n"); |
| 215 | |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 216 | size_t j; |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 217 | for (j = 0; j < count; j++) { |
Nguyen Anh Quynh | 7b7b40c | 2013-12-03 12:24:06 +0800 | [diff] [blame] | 218 | printf("0x%"PRIx64":\t%s\t%s\n", insn[j].address, insn[j].mnemonic, insn[j].op_str); |
Nguyen Anh Quynh | 397d0de | 2013-12-16 23:37:08 +0800 | [diff] [blame] | 219 | print_insn_detail(&insn[j]); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 220 | } |
Nguyen Anh Quynh | 7b7b40c | 2013-12-03 12:24:06 +0800 | [diff] [blame] | 221 | printf("0x%"PRIx64":\n", insn[j-1].address + insn[j-1].size); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 222 | |
Nguyen Anh Quynh | 04c19be | 2013-12-25 13:26:22 +0800 | [diff] [blame] | 223 | // free memory allocated by cs_disasm_ex() |
Nguyen Anh Quynh | 4fe224b | 2013-12-24 16:49:36 +0800 | [diff] [blame] | 224 | cs_free(insn, count); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 225 | } else { |
| 226 | printf("****************\n"); |
| 227 | printf("Platform: %s\n", platforms[i].comment); |
| 228 | print_string_hex("Code:", platforms[i].code, platforms[i].size); |
| 229 | printf("ERROR: Failed to disasm given code!\n"); |
| 230 | } |
| 231 | |
| 232 | printf("\n"); |
| 233 | |
Nguyen Anh Quynh | 226d7dc | 2014-02-27 22:20:39 +0800 | [diff] [blame] | 234 | cs_close(&handle); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 235 | } |
| 236 | } |
| 237 | |
| 238 | int main() |
| 239 | { |
| 240 | test(); |
| 241 | |
| 242 | return 0; |
| 243 | } |
| 244 | |