Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 1 | /* Capstone Disassembler Engine */ |
| 2 | /* By Nguyen Anh Quynh <aquynh@gmail.com>, 2013 */ |
| 3 | |
| 4 | #include <stdio.h> |
| 5 | #include <stdlib.h> |
| 6 | #include <inttypes.h> |
| 7 | |
| 8 | #include <capstone.h> |
| 9 | |
| 10 | struct platform { |
| 11 | cs_arch arch; |
| 12 | cs_mode mode; |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 13 | unsigned char *code; |
| 14 | size_t size; |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 15 | char *comment; |
Nguyen Anh Quynh | b8ce68e | 2013-12-03 23:45:08 +0800 | [diff] [blame] | 16 | cs_opt_type opt_type; |
| 17 | cs_opt_value opt_value; |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 18 | }; |
| 19 | |
/*
 * Print `len` bytes starting at `str` on one line, in the form
 * "Code: 0x.. 0x.. ...\n" (each byte as two lowercase hex digits followed
 * by a space).
 *
 * A `len` of zero or less prints just the "Code: " prefix and the newline.
 * The buffer is only read, never written.
 */
static void print_string_hex(const unsigned char *str, int len)
{
	int i;

	printf("Code: ");
	/*
	 * Index-based loop: never forms a pointer outside the buffer, even
	 * when len is negative or str is NULL with len == 0.
	 */
	for (i = 0; i < len; i++) {
		printf("0x%02x ", (unsigned int)str[i]);
	}
	printf("\n");
}
| 30 | |
| 31 | static void test() |
| 32 | { |
| 33 | #define X86_CODE16 "\x8d\x4c\x32\x08\x01\xd8\x81\xc6\x34\x12\x00\x00" |
| 34 | #define X86_CODE32 "\x8d\x4c\x32\x08\x01\xd8\x81\xc6\x34\x12\x00\x00" |
Nguyen Anh Quynh | b4ce383 | 2013-12-06 08:06:21 +0800 | [diff] [blame] | 35 | //#define X86_CODE32 "\x0f\xa7\xc0" // xstorerng |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 36 | #define X86_CODE64 "\x55\x48\x8b\x05\xb8\x13\x00\x00" |
| 37 | //#define ARM_CODE "\x04\xe0\x2d\xe5" |
| 38 | #define ARM_CODE "\xED\xFF\xFF\xEB\x04\xe0\x2d\xe5\x00\x00\x00\x00\xe0\x83\x22\xe5\xf1\x02\x03\x0e\x00\x00\xa0\xe3\x02\x30\xc1\xe7\x00\x00\x53\xe3" |
| 39 | #define ARM_CODE2 "\x10\xf1\x10\xe7\x11\xf2\x31\xe7\xdc\xa1\x2e\xf3\xe8\x4e\x62\xf3" |
| 40 | #define THUMB_CODE "\x70\x47\xeb\x46\x83\xb0\xc9\x68" |
| 41 | #define THUMB_CODE2 "\x4f\xf0\x00\x01\xbd\xe8\x00\x88\xd1\xe8\x00\xf0" |
| 42 | #define MIPS_CODE "\x0C\x10\x00\x97\x00\x00\x00\x00\x24\x02\x00\x0c\x8f\xa2\x00\x00\x34\x21\x34\x56" |
| 43 | #define MIPS_CODE2 "\x56\x34\x21\x34\xc2\x17\x01\x00" |
| 44 | //#define ARM64_CODE "\x00\x40\x21\x4b" // sub w0, w0, w1, uxtw |
| 45 | //#define ARM64_CODE "\x21\x7c\x02\x9b" // mul x1, x1, x2 |
| 46 | //#define ARM64_CODE "\x20\x74\x0b\xd5" // dc zva, x0 |
| 47 | //#define ARM64_CODE "\xe1\x0b\x40\xb9" // ldr w1, [sp, #0x8] |
| 48 | #define ARM64_CODE "\x21\x7c\x02\x9b\x21\x7c\x00\x53\x00\x40\x21\x4b\xe1\x0b\x40\xb9" |
Nguyen Anh Quynh | f1d489b | 2014-01-05 00:00:05 +0800 | [diff] [blame] | 49 | #define PPC_CODE "\x80\x20\x00\x00\x80\x3f\x00\x00\x10\x43\x23\x0e\xd0\x44\x00\x80\x4c\x43\x22\x02\x2d\x03\x00\x80\x7c\x43\x20\x14\x7c\x43\x20\x93\x4f\x20\x00\x21\x4c\xc8\x00\x21" |
Nguyen Anh Quynh | 05e2713 | 2014-03-10 11:58:57 +0800 | [diff] [blame] | 50 | #define SPARC_CODE "\x80\xa0\x40\x02\x85\xc2\x60\x08\x85\xe8\x20\x01\x81\xe8\x00\x00\x90\x10\x20\x01\xd5\xf6\x10\x16\x21\x00\x00\x0a\x86\x00\x40\x02\x01\x00\x00\x00\x12\xbf\xff\xff\x10\xbf\xff\xff\xa0\x02\x00\x09\x0d\xbf\xff\xff\xd4\x20\x60\x00\xd4\x4e\x00\x16\x2a\xc2\x80\x03" |
Nguyen Anh Quynh | ea9f4b1 | 2014-03-10 20:38:01 +0800 | [diff] [blame] | 51 | #define SPARCV9_CODE "\x81\xa8\x0a\x24\x89\xa0\x10\x20\x89\xa0\x1a\x60\x89\xa0\x00\xe0" |
Nguyen Anh Quynh | da1e833 | 2014-03-23 11:12:07 +0800 | [diff] [blame] | 52 | #define SYSZ_CODE "\xed\x00\x00\x00\x00\x1a\x5a\x0f\x1f\xff\xc2\x09\x80\x00\x00\x00\x07\xf7\xeb\x2a\xff\xff\x7f\x57\xe3\x01\xff\xff\x7f\x57\xeb\x00\xf0\x00\x00\x24\xb2\x4f\x00\x78" |
Nguyen Anh Quynh | ea9f4b1 | 2014-03-10 20:38:01 +0800 | [diff] [blame] | 53 | |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 54 | struct platform platforms[] = { |
| 55 | { |
| 56 | .arch = CS_ARCH_X86, |
| 57 | .mode = CS_MODE_16, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 58 | .code = (unsigned char*)X86_CODE16, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 59 | .size = sizeof(X86_CODE16) - 1, |
| 60 | .comment = "X86 16bit (Intel syntax)" |
| 61 | }, |
| 62 | { |
| 63 | .arch = CS_ARCH_X86, |
Nguyen Anh Quynh | 01aba00 | 2013-12-03 21:00:09 +0800 | [diff] [blame] | 64 | .mode = CS_MODE_32, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 65 | .code = (unsigned char*)X86_CODE32, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 66 | .size = sizeof(X86_CODE32) - 1, |
Nguyen Anh Quynh | 01aba00 | 2013-12-03 21:00:09 +0800 | [diff] [blame] | 67 | .comment = "X86 32bit (ATT syntax)", |
Nguyen Anh Quynh | b8ce68e | 2013-12-03 23:45:08 +0800 | [diff] [blame] | 68 | .opt_type = CS_OPT_SYNTAX, |
Nguyen Anh Quynh | c618db4 | 2013-12-04 00:05:04 +0800 | [diff] [blame] | 69 | .opt_value = CS_OPT_SYNTAX_ATT, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 70 | }, |
| 71 | { |
| 72 | .arch = CS_ARCH_X86, |
| 73 | .mode = CS_MODE_32, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 74 | .code = (unsigned char*)X86_CODE32, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 75 | .size = sizeof(X86_CODE32) - 1, |
| 76 | .comment = "X86 32 (Intel syntax)" |
| 77 | }, |
| 78 | { |
| 79 | .arch = CS_ARCH_X86, |
| 80 | .mode = CS_MODE_64, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 81 | .code = (unsigned char*)X86_CODE64, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 82 | .size = sizeof(X86_CODE64) - 1, |
| 83 | .comment = "X86 64 (Intel syntax)" |
| 84 | }, |
| 85 | { |
| 86 | .arch = CS_ARCH_ARM, |
| 87 | .mode = CS_MODE_ARM, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 88 | .code = (unsigned char*)ARM_CODE, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 89 | .size = sizeof(ARM_CODE) - 1, |
| 90 | .comment = "ARM" |
| 91 | }, |
| 92 | { |
| 93 | .arch = CS_ARCH_ARM, |
| 94 | .mode = CS_MODE_THUMB, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 95 | .code = (unsigned char*)THUMB_CODE2, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 96 | .size = sizeof(THUMB_CODE2) - 1, |
| 97 | .comment = "THUMB-2" |
| 98 | }, |
| 99 | { |
| 100 | .arch = CS_ARCH_ARM, |
| 101 | .mode = CS_MODE_ARM, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 102 | .code = (unsigned char*)ARM_CODE2, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 103 | .size = sizeof(ARM_CODE2) - 1, |
| 104 | .comment = "ARM: Cortex-A15 + NEON" |
| 105 | }, |
| 106 | { |
| 107 | .arch = CS_ARCH_ARM, |
| 108 | .mode = CS_MODE_THUMB, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 109 | .code = (unsigned char*)THUMB_CODE, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 110 | .size = sizeof(THUMB_CODE) - 1, |
| 111 | .comment = "THUMB" |
| 112 | }, |
| 113 | { |
| 114 | .arch = CS_ARCH_MIPS, |
| 115 | .mode = CS_MODE_32 + CS_MODE_BIG_ENDIAN, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 116 | .code = (unsigned char*)MIPS_CODE, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 117 | .size = sizeof(MIPS_CODE) - 1, |
| 118 | .comment = "MIPS-32 (Big-endian)" |
| 119 | }, |
| 120 | { |
| 121 | .arch = CS_ARCH_MIPS, |
| 122 | .mode = CS_MODE_64+ CS_MODE_LITTLE_ENDIAN, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 123 | .code = (unsigned char*)MIPS_CODE2, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 124 | .size = sizeof(MIPS_CODE2) - 1, |
| 125 | .comment = "MIPS-64-EL (Little-endian)" |
| 126 | }, |
| 127 | { |
| 128 | .arch = CS_ARCH_ARM64, |
| 129 | .mode = CS_MODE_ARM, |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 130 | .code = (unsigned char*)ARM64_CODE, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 131 | .size = sizeof(ARM64_CODE) - 1, |
| 132 | .comment = "ARM-64" |
| 133 | }, |
Nguyen Anh Quynh | 42c6b1a | 2013-12-30 00:15:25 +0800 | [diff] [blame] | 134 | { |
| 135 | .arch = CS_ARCH_PPC, |
Nguyen Anh Quynh | 5f1f90c | 2014-01-01 23:28:05 +0800 | [diff] [blame] | 136 | .mode = CS_MODE_BIG_ENDIAN, |
| 137 | .code = (unsigned char*)PPC_CODE, |
| 138 | .size = sizeof(PPC_CODE) - 1, |
Nguyen Anh Quynh | 42c6b1a | 2013-12-30 00:15:25 +0800 | [diff] [blame] | 139 | .comment = "PPC-64" |
| 140 | }, |
| 141 | { |
| 142 | .arch = CS_ARCH_PPC, |
Nguyen Anh Quynh | 5f1f90c | 2014-01-01 23:28:05 +0800 | [diff] [blame] | 143 | .mode = CS_MODE_BIG_ENDIAN, |
| 144 | .code = (unsigned char*)PPC_CODE, |
| 145 | .size = sizeof(PPC_CODE) - 1, |
Nguyen Anh Quynh | 42c6b1a | 2013-12-30 00:15:25 +0800 | [diff] [blame] | 146 | .opt_type = CS_OPT_SYNTAX, |
Nguyen Anh Quynh | f1d489b | 2014-01-05 00:00:05 +0800 | [diff] [blame] | 147 | .opt_value = CS_OPT_SYNTAX_NOREGNAME, |
| 148 | .comment = "PPC-64, print register with number only" |
Nguyen Anh Quynh | 42c6b1a | 2013-12-30 00:15:25 +0800 | [diff] [blame] | 149 | }, |
Nguyen Anh Quynh | 05e2713 | 2014-03-10 11:58:57 +0800 | [diff] [blame] | 150 | { |
| 151 | .arch = CS_ARCH_SPARC, |
| 152 | .mode = CS_MODE_BIG_ENDIAN, |
| 153 | .code = (unsigned char*)SPARC_CODE, |
| 154 | .size = sizeof(SPARC_CODE) - 1, |
| 155 | .comment = "Sparc" |
| 156 | }, |
Nguyen Anh Quynh | ea9f4b1 | 2014-03-10 20:38:01 +0800 | [diff] [blame] | 157 | { |
| 158 | .arch = CS_ARCH_SPARC, |
| 159 | .mode = CS_MODE_BIG_ENDIAN + CS_MODE_V9, |
| 160 | .code = (unsigned char*)SPARCV9_CODE, |
| 161 | .size = sizeof(SPARCV9_CODE) - 1, |
| 162 | .comment = "SparcV9" |
| 163 | }, |
Nguyen Anh Quynh | 48a14ca | 2014-03-23 08:35:45 +0800 | [diff] [blame] | 164 | { |
| 165 | .arch = CS_ARCH_SYSZ, |
| 166 | .mode = 0, |
| 167 | .code = (unsigned char*)SYSZ_CODE, |
| 168 | .size = sizeof(SYSZ_CODE) - 1, |
| 169 | .comment = "SystemZ" |
| 170 | }, |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 171 | }; |
| 172 | |
| 173 | csh handle; |
Nguyen Anh Quynh | 5df9e4b | 2013-12-03 15:02:12 +0800 | [diff] [blame] | 174 | uint64_t address = 0x1000; |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 175 | cs_insn *insn; |
| 176 | int i; |
| 177 | |
| 178 | for (i = 0; i < sizeof(platforms)/sizeof(platforms[0]); i++) { |
Nguyen Anh Quynh | 48a14ca | 2014-03-23 08:35:45 +0800 | [diff] [blame] | 179 | printf("****************\n"); |
| 180 | printf("Platform: %s\n", platforms[i].comment); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 181 | cs_err err = cs_open(platforms[i].arch, platforms[i].mode, &handle); |
| 182 | if (err) { |
| 183 | printf("Failed on cs_open() with error returned: %u\n", err); |
Nguyen Anh Quynh | 4914691 | 2014-02-22 16:54:44 +0800 | [diff] [blame] | 184 | continue; |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 185 | } |
| 186 | |
Nguyen Anh Quynh | b8ce68e | 2013-12-03 23:45:08 +0800 | [diff] [blame] | 187 | if (platforms[i].opt_type) |
| 188 | cs_option(handle, platforms[i].opt_type, platforms[i].opt_value); |
Nguyen Anh Quynh | 01aba00 | 2013-12-03 21:00:09 +0800 | [diff] [blame] | 189 | |
Nguyen Anh Quynh | 04c19be | 2013-12-25 13:26:22 +0800 | [diff] [blame] | 190 | size_t count = cs_disasm_ex(handle, platforms[i].code, platforms[i].size, address, 0, &insn); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 191 | if (count) { |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 192 | print_string_hex(platforms[i].code, platforms[i].size); |
| 193 | printf("Disasm:\n"); |
| 194 | |
Nguyen Anh Quynh | b42a657 | 2013-11-29 17:40:07 +0800 | [diff] [blame] | 195 | size_t j; |
Nguyen Anh Quynh | 723687e | 2013-11-29 22:36:45 +0800 | [diff] [blame] | 196 | |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 197 | for (j = 0; j < count; j++) { |
Nguyen Anh Quynh | 723687e | 2013-11-29 22:36:45 +0800 | [diff] [blame] | 198 | printf("0x%"PRIx64":\t%s\t\t%s\n", |
Nguyen Anh Quynh | 7b7b40c | 2013-12-03 12:24:06 +0800 | [diff] [blame] | 199 | insn[j].address, insn[j].mnemonic, insn[j].op_str); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 200 | } |
| 201 | |
| 202 | // print out the next offset, after the last insn |
Nguyen Anh Quynh | 7b7b40c | 2013-12-03 12:24:06 +0800 | [diff] [blame] | 203 | printf("0x%"PRIx64":\n", insn[j-1].address + insn[j-1].size); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 204 | |
Nguyen Anh Quynh | 04c19be | 2013-12-25 13:26:22 +0800 | [diff] [blame] | 205 | // free memory allocated by cs_disasm_ex() |
Nguyen Anh Quynh | 4fe224b | 2013-12-24 16:49:36 +0800 | [diff] [blame] | 206 | cs_free(insn, count); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 207 | } else { |
| 208 | printf("****************\n"); |
| 209 | printf("Platform: %s\n", platforms[i].comment); |
| 210 | print_string_hex(platforms[i].code, platforms[i].size); |
| 211 | printf("ERROR: Failed to disasm given code!\n"); |
| 212 | } |
| 213 | |
| 214 | printf("\n"); |
| 215 | |
Nguyen Anh Quynh | 226d7dc | 2014-02-27 22:20:39 +0800 | [diff] [blame] | 216 | cs_close(&handle); |
Nguyen Anh Quynh | 26ee41a | 2013-11-27 12:11:31 +0800 | [diff] [blame] | 217 | } |
| 218 | } |
| 219 | |
/* Program entry point: runs the disassembly demo and returns 0. */
int main(void)
{
	test();

#if 0
	/*
	 * Disabled diagnostic: prints sizeof(cs_insn) and the byte offset of
	 * each of its fields. sizeof/offsetof yield size_t, hence %zu.
	 */
	#define offsetof(st, m) __builtin_offsetof(st, m)

	cs_insn insn;
	printf("size: %zu\n", sizeof(insn));
	printf("@id: %zu\n", offsetof(cs_insn, id));
	printf("@address: %zu\n", offsetof(cs_insn, address));
	printf("@size: %zu\n", offsetof(cs_insn, size));
	printf("@bytes: %zu\n", offsetof(cs_insn, bytes));
	printf("@mnemonic: %zu\n", offsetof(cs_insn, mnemonic));
	printf("@op_str: %zu\n", offsetof(cs_insn, op_str));
	printf("@regs_read: %zu\n", offsetof(cs_insn, regs_read));
	printf("@regs_read_count: %zu\n", offsetof(cs_insn, regs_read_count));
	printf("@regs_write: %zu\n", offsetof(cs_insn, regs_write));
	printf("@regs_write_count: %zu\n", offsetof(cs_insn, regs_write_count));
	printf("@groups: %zu\n", offsetof(cs_insn, groups));
	printf("@groups_count: %zu\n", offsetof(cs_insn, groups_count));
	printf("@arch: %zu\n", offsetof(cs_insn, x86));
#endif

	return 0;
}