/* Capstone Disassembler Engine */
/* By Nguyen Anh Quynh <aquynh@gmail.com>, 2013 */
3
4#include <stdio.h>
5#include <stdlib.h>
Yegor Derevenetsced9d242014-09-21 17:27:11 +02006#include "../inttypes.h"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +08007
8#include <capstone.h>
9
10struct platform {
11 cs_arch arch;
12 cs_mode mode;
Nguyen Anh Quynhb42a6572013-11-29 17:40:07 +080013 unsigned char *code;
14 size_t size;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080015 char *comment;
Nguyen Anh Quynhb8ce68e2013-12-03 23:45:08 +080016 cs_opt_type opt_type;
17 cs_opt_value opt_value;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080018};
19
/*
 * Print a byte buffer to stdout on one line, in the form
 * "Code: 0x8d 0x4c ... " followed by a newline.
 *
 * str: bytes to print (only read, never modified)
 * len: number of bytes to print; with len == 0 only "Code: " and the
 *      newline are written and 'str' is not touched
 */
static void print_string_hex(const unsigned char *str, size_t len)
{
	size_t i;

	printf("Code: ");
	// Index-based loop: avoids forming 'str + len' when str is NULL and len is 0.
	for (i = 0; i < len; i++) {
		printf("0x%02x ", (unsigned int)str[i]);
	}
	printf("\n");
}
30
31static void test()
32{
33#define X86_CODE16 "\x8d\x4c\x32\x08\x01\xd8\x81\xc6\x34\x12\x00\x00"
34#define X86_CODE32 "\x8d\x4c\x32\x08\x01\xd8\x81\xc6\x34\x12\x00\x00"
Nguyen Anh Quynhb4ce3832013-12-06 08:06:21 +080035//#define X86_CODE32 "\x0f\xa7\xc0" // xstorerng
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080036#define X86_CODE64 "\x55\x48\x8b\x05\xb8\x13\x00\x00"
37//#define ARM_CODE "\x04\xe0\x2d\xe5"
38#define ARM_CODE "\xED\xFF\xFF\xEB\x04\xe0\x2d\xe5\x00\x00\x00\x00\xe0\x83\x22\xe5\xf1\x02\x03\x0e\x00\x00\xa0\xe3\x02\x30\xc1\xe7\x00\x00\x53\xe3"
39#define ARM_CODE2 "\x10\xf1\x10\xe7\x11\xf2\x31\xe7\xdc\xa1\x2e\xf3\xe8\x4e\x62\xf3"
Nguyen Anh Quynh83466d42014-11-11 21:44:42 +080040#define ARMV8 "\xe0\x3b\xb2\xee\x42\x00\x01\xe1\x51\xf0\x7f\xf5"
41#define THUMB_MCLASS "\xef\xf3\x02\x80"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080042#define THUMB_CODE "\x70\x47\xeb\x46\x83\xb0\xc9\x68"
43#define THUMB_CODE2 "\x4f\xf0\x00\x01\xbd\xe8\x00\x88\xd1\xe8\x00\xf0"
44#define MIPS_CODE "\x0C\x10\x00\x97\x00\x00\x00\x00\x24\x02\x00\x0c\x8f\xa2\x00\x00\x34\x21\x34\x56"
45#define MIPS_CODE2 "\x56\x34\x21\x34\xc2\x17\x01\x00"
Nguyen Anh Quynh248519e2014-11-09 14:07:07 +080046#define MIPS_32R6M "\x00\x07\x00\x07\x00\x11\x93\x7c\x01\x8c\x8b\x7c\x00\xc7\x48\xd0"
47#define MIPS_32R6 "\xec\x80\x00\x19\x7c\x43\x22\xa0"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080048//#define ARM64_CODE "\x00\x40\x21\x4b" // sub w0, w0, w1, uxtw
49//#define ARM64_CODE "\x21\x7c\x02\x9b" // mul x1, x1, x2
50//#define ARM64_CODE "\x20\x74\x0b\xd5" // dc zva, x0
51//#define ARM64_CODE "\xe1\x0b\x40\xb9" // ldr w1, [sp, #0x8]
52#define ARM64_CODE "\x21\x7c\x02\x9b\x21\x7c\x00\x53\x00\x40\x21\x4b\xe1\x0b\x40\xb9"
Nguyen Anh Quynhf1d489b2014-01-05 00:00:05 +080053#define PPC_CODE "\x80\x20\x00\x00\x80\x3f\x00\x00\x10\x43\x23\x0e\xd0\x44\x00\x80\x4c\x43\x22\x02\x2d\x03\x00\x80\x7c\x43\x20\x14\x7c\x43\x20\x93\x4f\x20\x00\x21\x4c\xc8\x00\x21"
Nguyen Anh Quynh05e27132014-03-10 11:58:57 +080054#define SPARC_CODE "\x80\xa0\x40\x02\x85\xc2\x60\x08\x85\xe8\x20\x01\x81\xe8\x00\x00\x90\x10\x20\x01\xd5\xf6\x10\x16\x21\x00\x00\x0a\x86\x00\x40\x02\x01\x00\x00\x00\x12\xbf\xff\xff\x10\xbf\xff\xff\xa0\x02\x00\x09\x0d\xbf\xff\xff\xd4\x20\x60\x00\xd4\x4e\x00\x16\x2a\xc2\x80\x03"
Nguyen Anh Quynhea9f4b12014-03-10 20:38:01 +080055#define SPARCV9_CODE "\x81\xa8\x0a\x24\x89\xa0\x10\x20\x89\xa0\x1a\x60\x89\xa0\x00\xe0"
Nguyen Anh Quynhda1e8332014-03-23 11:12:07 +080056#define SYSZ_CODE "\xed\x00\x00\x00\x00\x1a\x5a\x0f\x1f\xff\xc2\x09\x80\x00\x00\x00\x07\xf7\xeb\x2a\xff\xff\x7f\x57\xe3\x01\xff\xff\x7f\x57\xeb\x00\xf0\x00\x00\x24\xb2\x4f\x00\x78"
Nguyen Anh Quynhc80d8402014-05-26 23:02:48 +080057#define XCORE_CODE "\xfe\x0f\xfe\x17\x13\x17\xc6\xfe\xec\x17\x97\xf8\xec\x4f\x1f\xfd\xec\x37\x07\xf2\x45\x5b\xf9\xfa\x02\x06\x1b\x10"
Nguyen Anh Quynh42706a32014-05-09 07:33:35 +080058 struct platform {
59 cs_arch arch;
60 cs_mode mode;
61 unsigned char *code;
62 size_t size;
63 char *comment;
64 cs_opt_type opt_type;
65 cs_opt_value opt_value;
66 };
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080067 struct platform platforms[] = {
68 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +010069 CS_ARCH_X86,
70 CS_MODE_16,
71 (unsigned char*)X86_CODE16,
72 sizeof(X86_CODE16) - 1,
73 "X86 16bit (Intel syntax)"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080074 },
75 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +010076 CS_ARCH_X86,
77 CS_MODE_32,
78 (unsigned char*)X86_CODE32,
79 sizeof(X86_CODE32) - 1,
80 "X86 32bit (ATT syntax)",
81 CS_OPT_SYNTAX,
82 CS_OPT_SYNTAX_ATT,
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080083 },
84 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +010085 CS_ARCH_X86,
86 CS_MODE_32,
87 (unsigned char*)X86_CODE32,
88 sizeof(X86_CODE32) - 1,
89 "X86 32 (Intel syntax)"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080090 },
91 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +010092 CS_ARCH_X86,
93 CS_MODE_64,
94 (unsigned char*)X86_CODE64,
95 sizeof(X86_CODE64) - 1,
96 "X86 64 (Intel syntax)"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080097 },
98 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +010099 CS_ARCH_ARM,
100 CS_MODE_ARM,
101 (unsigned char*)ARM_CODE,
102 sizeof(ARM_CODE) - 1,
103 "ARM"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800104 },
105 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100106 CS_ARCH_ARM,
107 CS_MODE_THUMB,
108 (unsigned char*)THUMB_CODE2,
109 sizeof(THUMB_CODE2) - 1,
110 "THUMB-2"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800111 },
112 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100113 CS_ARCH_ARM,
114 CS_MODE_ARM,
115 (unsigned char*)ARM_CODE2,
116 sizeof(ARM_CODE2) - 1,
117 "ARM: Cortex-A15 + NEON"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800118 },
119 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100120 CS_ARCH_ARM,
121 CS_MODE_THUMB,
122 (unsigned char*)THUMB_CODE,
123 sizeof(THUMB_CODE) - 1,
124 "THUMB"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800125 },
126 {
Nguyen Anh Quynh83466d42014-11-11 21:44:42 +0800127 CS_ARCH_ARM,
128 (cs_mode)(CS_MODE_THUMB + CS_MODE_MCLASS),
129 (unsigned char*)THUMB_MCLASS,
130 sizeof(THUMB_MCLASS) - 1,
131 "Thumb-MClass"
132 },
133 {
134 CS_ARCH_ARM,
135 (cs_mode)(CS_MODE_ARM + CS_MODE_V8),
136 (unsigned char*)ARMV8,
137 sizeof(ARMV8) - 1,
138 "Arm-V8"
139 },
140 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100141 CS_ARCH_MIPS,
142 (cs_mode)(CS_MODE_32 + CS_MODE_BIG_ENDIAN),
143 (unsigned char*)MIPS_CODE,
144 sizeof(MIPS_CODE) - 1,
145 "MIPS-32 (Big-endian)"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800146 },
147 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100148 CS_ARCH_MIPS,
149 (cs_mode)(CS_MODE_64 + CS_MODE_LITTLE_ENDIAN),
150 (unsigned char*)MIPS_CODE2,
151 sizeof(MIPS_CODE2) - 1,
152 "MIPS-64-EL (Little-endian)"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800153 },
154 {
Nguyen Anh Quynh5720cb72014-10-29 22:35:02 +0800155 CS_ARCH_MIPS,
Nguyen Anh Quynh5720cb72014-10-29 22:35:02 +0800156 (cs_mode)(CS_MODE_32 + CS_MODE_MIPS32R6 + CS_MODE_MICRO + CS_MODE_BIG_ENDIAN),
Nguyen Anh Quynh248519e2014-11-09 14:07:07 +0800157 (unsigned char*)MIPS_32R6M,
158 sizeof(MIPS_32R6M) - 1,
159 "MIPS-32R6 | Micro (Big-endian)"
160 },
161 {
162 CS_ARCH_MIPS,
163 (cs_mode)(CS_MODE_32 + CS_MODE_MIPS32R6 + CS_MODE_BIG_ENDIAN),
Nguyen Anh Quynh5720cb72014-10-29 22:35:02 +0800164 (unsigned char*)MIPS_32R6,
165 sizeof(MIPS_32R6) - 1,
Nguyen Anh Quynh248519e2014-11-09 14:07:07 +0800166 "MIPS-32R6 (Big-endian)"
Nguyen Anh Quynh5720cb72014-10-29 22:35:02 +0800167 },
168 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100169 CS_ARCH_ARM64,
170 CS_MODE_ARM,
171 (unsigned char*)ARM64_CODE,
172 sizeof(ARM64_CODE) - 1,
173 "ARM-64"
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800174 },
Nguyen Anh Quynh42c6b1a2013-12-30 00:15:25 +0800175 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100176 CS_ARCH_PPC,
177 CS_MODE_BIG_ENDIAN,
178 (unsigned char*)PPC_CODE,
179 sizeof(PPC_CODE) - 1,
Nguyen Anh Quynh42706a32014-05-09 07:33:35 +0800180 "PPC-64"
Nguyen Anh Quynh42c6b1a2013-12-30 00:15:25 +0800181 },
182 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100183 CS_ARCH_PPC,
184 CS_MODE_BIG_ENDIAN,
185 (unsigned char*)PPC_CODE,
186 sizeof(PPC_CODE) - 1,
Nguyen Anh Quynh42706a32014-05-09 07:33:35 +0800187 "PPC-64, print register with number only",
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100188 CS_OPT_SYNTAX,
189 CS_OPT_SYNTAX_NOREGNAME
Nguyen Anh Quynh42c6b1a2013-12-30 00:15:25 +0800190 },
Nguyen Anh Quynh05e27132014-03-10 11:58:57 +0800191 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100192 CS_ARCH_SPARC,
193 CS_MODE_BIG_ENDIAN,
194 (unsigned char*)SPARC_CODE,
195 sizeof(SPARC_CODE) - 1,
196 "Sparc"
Nguyen Anh Quynh05e27132014-03-10 11:58:57 +0800197 },
Nguyen Anh Quynhea9f4b12014-03-10 20:38:01 +0800198 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100199 CS_ARCH_SPARC,
200 (cs_mode)(CS_MODE_BIG_ENDIAN + CS_MODE_V9),
201 (unsigned char*)SPARCV9_CODE,
202 sizeof(SPARCV9_CODE) - 1,
203 "SparcV9"
Nguyen Anh Quynhea9f4b12014-03-10 20:38:01 +0800204 },
Nguyen Anh Quynh48a14ca2014-03-23 08:35:45 +0800205 {
Axel 0vercl0k Souchet779d4c72014-05-08 23:44:49 +0100206 CS_ARCH_SYSZ,
207 (cs_mode)0,
208 (unsigned char*)SYSZ_CODE,
209 sizeof(SYSZ_CODE) - 1,
210 "SystemZ"
Nguyen Anh Quynh48a14ca2014-03-23 08:35:45 +0800211 },
Nguyen Anh Quynhc80d8402014-05-26 23:02:48 +0800212 {
213 CS_ARCH_XCORE,
214 (cs_mode)0,
215 (unsigned char*)XCORE_CODE,
216 sizeof(XCORE_CODE) - 1,
217 "XCore"
218 },
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800219 };
220
221 csh handle;
Nguyen Anh Quynh5df9e4b2013-12-03 15:02:12 +0800222 uint64_t address = 0x1000;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800223 cs_insn *insn;
224 int i;
Nguyen Anh Quynh5b556e52014-04-11 10:15:26 +0800225 size_t count;
Nguyen Anh Quynh655c7022014-04-11 12:15:33 +0800226 cs_err err;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800227
228 for (i = 0; i < sizeof(platforms)/sizeof(platforms[0]); i++) {
Nguyen Anh Quynh48a14ca2014-03-23 08:35:45 +0800229 printf("****************\n");
230 printf("Platform: %s\n", platforms[i].comment);
Nguyen Anh Quynh655c7022014-04-11 12:15:33 +0800231 err = cs_open(platforms[i].arch, platforms[i].mode, &handle);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800232 if (err) {
233 printf("Failed on cs_open() with error returned: %u\n", err);
Nguyen Anh Quynh49146912014-02-22 16:54:44 +0800234 continue;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800235 }
236
Nguyen Anh Quynhb8ce68e2013-12-03 23:45:08 +0800237 if (platforms[i].opt_type)
238 cs_option(handle, platforms[i].opt_type, platforms[i].opt_value);
Nguyen Anh Quynh01aba002013-12-03 21:00:09 +0800239
Nguyen Anh Quynh0beb0d42014-08-27 22:55:29 +0800240 count = cs_disasm(handle, platforms[i].code, platforms[i].size, address, 0, &insn);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800241 if (count) {
Nguyen Anh Quynh5b556e52014-04-11 10:15:26 +0800242 size_t j;
243
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800244 print_string_hex(platforms[i].code, platforms[i].size);
245 printf("Disasm:\n");
246
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800247 for (j = 0; j < count; j++) {
Nguyen Anh Quynh723687e2013-11-29 22:36:45 +0800248 printf("0x%"PRIx64":\t%s\t\t%s\n",
Nguyen Anh Quynh7b7b40c2013-12-03 12:24:06 +0800249 insn[j].address, insn[j].mnemonic, insn[j].op_str);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800250 }
251
252 // print out the next offset, after the last insn
Nguyen Anh Quynh7b7b40c2013-12-03 12:24:06 +0800253 printf("0x%"PRIx64":\n", insn[j-1].address + insn[j-1].size);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800254
Nguyen Anh Quynh0beb0d42014-08-27 22:55:29 +0800255 // free memory allocated by cs_disasm()
Nguyen Anh Quynh4fe224b2013-12-24 16:49:36 +0800256 cs_free(insn, count);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800257 } else {
258 printf("****************\n");
259 printf("Platform: %s\n", platforms[i].comment);
260 print_string_hex(platforms[i].code, platforms[i].size);
261 printf("ERROR: Failed to disasm given code!\n");
262 }
263
264 printf("\n");
265
Nguyen Anh Quynh226d7dc2014-02-27 22:20:39 +0800266 cs_close(&handle);
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800267 }
268}
269
/*
 * Program entry point: run the disassembly test table once and exit with
 * status 0.
 */
int main(void)
{
	test();

#if 0
	// Disabled debugging aid: dumps the size of cs_insn and the byte offset
	// of each of its fields.
	// NOTE(review): this section is not compiled, so the field list below is
	// not checked against the current cs_insn definition.
#ifndef offsetof
#define offsetof(st, m) __builtin_offsetof(st, m)
#endif

	cs_insn insn;
	// size_t values are cast to unsigned long to match the %lu conversions.
	printf("size: %lu\n", (unsigned long)sizeof(insn));
	printf("@id: %lu\n", (unsigned long)offsetof(cs_insn, id));
	printf("@address: %lu\n", (unsigned long)offsetof(cs_insn, address));
	printf("@size: %lu\n", (unsigned long)offsetof(cs_insn, size));
	printf("@bytes: %lu\n", (unsigned long)offsetof(cs_insn, bytes));
	printf("@mnemonic: %lu\n", (unsigned long)offsetof(cs_insn, mnemonic));
	printf("@op_str: %lu\n", (unsigned long)offsetof(cs_insn, op_str));
	printf("@regs_read: %lu\n", (unsigned long)offsetof(cs_insn, regs_read));
	printf("@regs_read_count: %lu\n", (unsigned long)offsetof(cs_insn, regs_read_count));
	printf("@regs_write: %lu\n", (unsigned long)offsetof(cs_insn, regs_write));
	printf("@regs_write_count: %lu\n", (unsigned long)offsetof(cs_insn, regs_write_count));
	printf("@groups: %lu\n", (unsigned long)offsetof(cs_insn, groups));
	printf("@groups_count: %lu\n", (unsigned long)offsetof(cs_insn, groups_count));
	printf("@arch: %lu\n", (unsigned long)offsetof(cs_insn, x86));
#endif

	return 0;
}