blob: 9d7a8dbc30197389a045db017eb5db888ba05f24 [file] [log] [blame]
Nguyen Anh Quynh81a97c62014-09-26 23:38:53 +08001(* Capstone Disassembly Engine
2 * By Nguyen Anh Quynh <aquynh@gmail.com>, 2013-2014 *)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +08003
4open Arm
5open Arm64
6open Mips
Guillaume Jeannee002ac72014-06-30 15:46:04 +02007open Ppc
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +08008open X86
Guillaume Jeanneae48c972014-08-19 14:46:06 +02009open Sparc
10open Systemz
11open Xcore
Wolfgang Schwotzer22b4d0e2017-10-21 15:44:36 +020012open M680x
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080013open Printf (* debug *)
14
Nguyen Anh Quynh69271dd2014-10-31 14:32:34 +080015(* Hardware architectures *)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080016type arch =
17 | CS_ARCH_ARM
18 | CS_ARCH_ARM64
19 | CS_ARCH_MIPS
20 | CS_ARCH_X86
Guillaume Jeanneae48c972014-08-19 14:46:06 +020021 | CS_ARCH_PPC
22 | CS_ARCH_SPARC
23 | CS_ARCH_SYSZ
24 | CS_ARCH_XCORE
Wolfgang Schwotzer22b4d0e2017-10-21 15:44:36 +020025 | CS_ARCH_M68K
26 | CS_ARCH_TMS320C64X
27 | CS_ARCH_M680X
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080028
Nguyen Anh Quynh69271dd2014-10-31 14:32:34 +080029(* Hardware modes *)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080030type mode =
31 | CS_MODE_LITTLE_ENDIAN (* little-endian mode (default mode) *)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080032 | CS_MODE_ARM (* ARM mode *)
Nguyen Anh Quynhff9a5742014-11-13 12:09:49 +080033 | CS_MODE_16 (* 16-bit mode (for X86) *)
34 | CS_MODE_32 (* 32-bit mode (for X86) *)
35 | CS_MODE_64 (* 64-bit mode (for X86, PPC) *)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080036 | CS_MODE_THUMB (* ARM's Thumb mode, including Thumb-2 *)
Nguyen Anh Quynh77d93e92014-09-25 23:03:36 +080037 | CS_MODE_MCLASS (* ARM's MClass mode *)
Nguyen Anh Quynh8e538902014-11-10 22:06:23 +080038 | CS_MODE_V8 (* ARMv8 A32 encodings for ARM *)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080039 | CS_MODE_MICRO (* MicroMips mode (MIPS architecture) *)
Nguyen Anh Quynh77d93e92014-09-25 23:03:36 +080040 | CS_MODE_MIPS3 (* Mips3 mode (MIPS architecture) *)
41 | CS_MODE_MIPS32R6 (* Mips32-R6 mode (MIPS architecture) *)
Francesco Tamagni1fb2b532017-06-27 14:56:54 +020042 | CS_MODE_MIPS2 (* Mips2 mode (MIPS architecture) *)
Nguyen Anh Quynh77d93e92014-09-25 23:03:36 +080043 | CS_MODE_V9 (* SparcV9 mode (Sparc architecture) *)
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080044 | CS_MODE_BIG_ENDIAN (* big-endian mode *)
Nguyen Anh Quynhff9a5742014-11-13 12:09:49 +080045 | CS_MODE_MIPS32 (* Mips32 mode (for Mips) *)
46 | CS_MODE_MIPS64 (* Mips64 mode (for Mips) *)
Wolfgang Schwotzer22b4d0e2017-10-21 15:44:36 +020047 | CS_MODE_QPX (* Quad Processing eXtensions mode (PowerPC) *)
48 | CS_MODE_M680X_6301 (* M680X Hitachi 6301,6303 mode *)
49 | CS_MODE_M680X_6309 (* M680X Hitachi 6309 mode *)
50 | CS_MODE_M680X_6800 (* M680X Motorola 6800,6802 mode *)
51 | CS_MODE_M680X_6801 (* M680X Motorola 6801,6803 mode *)
52 | CS_MODE_M680X_6805 (* M680X Motorola 6805 mode *)
53 | CS_MODE_M680X_6808 (* M680X Motorola 6808 mode *)
54 | CS_MODE_M680X_6809 (* M680X Motorola 6809 mode *)
55 | CS_MODE_M680X_6811 (* M680X Motorola/Freescale 68HC11 mode *)
56 | CS_MODE_M680X_CPU12 (* M680X Motorola/Freescale/NXP CPU12 mode *)
57 | CS_MODE_M680X_HCS08 (* M680X Freescale HCS08 mode *)
Nguyen Anh Quynhcac770a2015-03-12 17:03:33 +080058
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +080059
Guillaume Jeanneae48c972014-08-19 14:46:06 +020060
Nguyen Anh Quynh69271dd2014-10-31 14:32:34 +080061(* Runtime option for the disassembled engine *)
Guillaume Jeanneae48c972014-08-19 14:46:06 +020062type opt_type =
63 | CS_OPT_SYNTAX (* Asssembly output syntax *)
64 | CS_OPT_DETAIL (* Break down instruction structure into details *)
65 | CS_OPT_MODE (* Change engine's mode at run-time *)
66 | CS_OPT_MEM (* User-defined dynamic memory related functions *)
67 | CS_OPT_SKIPDATA (* Skip data when disassembling. Then engine is in SKIPDATA mode. *)
68 | CS_OPT_SKIPDATA_SETUP (* Setup user-defined function for SKIPDATA option *)
69
70
Nguyen Anh Quynh10647ae2015-03-25 17:35:59 +080071(* Common instruction operand access types - to be consistent across all architectures. *)
72(* It is possible to combine access types, for example: CS_AC_READ | CS_AC_WRITE *)
73let _CS_AC_INVALID = 0;; (* Uninitialized/invalid access type. *)
74let _CS_AC_READ = 1 lsl 0;; (* Operand read from memory or register. *)
75let _CS_AC_WRITE = 1 lsl 1;; (* Operand write to memory or register. *)
76
Nguyen Anh Quynh69271dd2014-10-31 14:32:34 +080077(* Runtime option value (associated with option type above) *)
Nguyen Anh Quynhfe4822c2014-10-04 16:30:02 +080078let _CS_OPT_OFF = 0L;; (* Turn OFF an option - default option of CS_OPT_DETAIL, CS_OPT_SKIPDATA. *)
79let _CS_OPT_ON = 3L;; (* Turn ON an option (CS_OPT_DETAIL, CS_OPT_SKIPDATA). *)
80let _CS_OPT_SYNTAX_DEFAULT = 0L;; (* Default asm syntax (CS_OPT_SYNTAX). *)
81let _CS_OPT_SYNTAX_INTEL = 1L;; (* X86 Intel asm syntax - default on X86 (CS_OPT_SYNTAX). *)
82let _CS_OPT_SYNTAX_ATT = 2L;; (* X86 ATT asm syntax (CS_OPT_SYNTAX). *)
83let _CS_OPT_SYNTAX_NOREGNAME = 3L;; (* Prints register name with only number (CS_OPT_SYNTAX) *)
Guillaume Jeanneae48c972014-08-19 14:46:06 +020084
Nguyen Anh Quynh69271dd2014-10-31 14:32:34 +080085(* Common instruction operand types - to be consistent across all architectures. *)
86let _CS_OP_INVALID = 0;; (* uninitialized/invalid operand. *)
87let _CS_OP_REG = 1;; (* Register operand. *)
88let _CS_OP_IMM = 2;; (* Immediate operand. *)
89let _CS_OP_MEM = 3;; (* Memory operand. *)
90let _CS_OP_FP = 4;; (* Floating-Point operand. *)
Nguyen Anh Quynh82354b62014-09-28 23:56:02 +080091
Nguyen Anh Quynha65d7ef2014-10-31 15:47:17 +080092(* Common instruction groups - to be consistent across all architectures. *)
93let _CS_GRP_INVALID = 0;; (* uninitialized/invalid group. *)
94let _CS_GRP_JUMP = 1;; (* all jump instructions (conditional+direct+indirect jumps) *)
95let _CS_GRP_CALL = 2;; (* all call instructions *)
96let _CS_GRP_RET = 3;; (* all return instructions *)
97let _CS_GRP_INT = 4;; (* all interrupt instructions (int+syscall) *)
98let _CS_GRP_IRET = 5;; (* all interrupt return instructions *)
Nguyen Anh Quynh4dd0dcb2015-03-09 00:04:45 +080099let _CS_GRP_PRIVILEGE = 6;; (* all privileged instructions *)
Nguyen Anh Quynha65d7ef2014-10-31 15:47:17 +0800100
Jay Oster79e253c2014-10-12 16:03:12 -0700101type cs_arch =
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800102 | CS_INFO_ARM of cs_arm
103 | CS_INFO_ARM64 of cs_arm64
104 | CS_INFO_MIPS of cs_mips
105 | CS_INFO_X86 of cs_x86
Guillaume Jeanneae48c972014-08-19 14:46:06 +0200106 | CS_INFO_PPC of cs_ppc
107 | CS_INFO_SPARC of cs_sparc
108 | CS_INFO_SYSZ of cs_sysz
109 | CS_INFO_XCORE of cs_xcore
Wolfgang Schwotzer22b4d0e2017-10-21 15:44:36 +0200110 | CS_INFO_M680X of cs_m680x
Guillaume Jeanneae48c972014-08-19 14:46:06 +0200111
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800112
Nguyen Anh Quynhfe4822c2014-10-04 16:30:02 +0800113type csh = {
114 h: Int64.t;
115 a: arch;
116}
117
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800118type cs_insn0 = {
119 id: int;
120 address: int;
121 size: int;
Guillaume Jeannecece24e2014-06-26 15:35:06 +0200122 bytes: int array;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800123 mnemonic: string;
124 op_str: string;
125 regs_read: int array;
126 regs_write: int array;
127 groups: int array;
128 arch: cs_arch;
129}
130
Nguyen Anh Quynhfe4822c2014-10-04 16:30:02 +0800131external _cs_open: arch -> mode list -> Int64.t option = "ocaml_open"
Nguyen Anh Quynh82354b62014-09-28 23:56:02 +0800132external cs_disasm_quick: arch -> mode list -> string -> Int64.t -> Int64.t -> cs_insn0 list = "ocaml_cs_disasm"
Nguyen Anh Quynh77d93e92014-09-25 23:03:36 +0800133external _cs_disasm_internal: arch -> Int64.t -> string -> Int64.t -> Int64.t -> cs_insn0 list = "ocaml_cs_disasm_internal"
Nguyen Anh Quynhfe4822c2014-10-04 16:30:02 +0800134external _cs_reg_name: Int64.t -> int -> string = "ocaml_register_name"
135external _cs_insn_name: Int64.t -> int -> string = "ocaml_instruction_name"
136external _cs_group_name: Int64.t -> int -> string = "ocaml_group_name"
Nguyen Anh Quynh77d93e92014-09-25 23:03:36 +0800137external cs_version: unit -> int = "ocaml_version"
Nguyen Anh Quynhfe4822c2014-10-04 16:30:02 +0800138external _cs_option: Int64.t -> opt_type -> Int64.t -> int = "ocaml_option"
139external _cs_close: Int64.t -> int = "ocaml_close"
140
141
142let cs_open _arch _mode: csh = (
143 let _handle = _cs_open _arch _mode in (
144 match _handle with
145 | None -> { h = 0L; a = _arch }
146 | Some v -> { h = v; a = _arch }
147 );
148);;
149
150let cs_close handle = (
151 _cs_close handle.h;
152)
153
154let cs_option handle opt value = (
155 _cs_option handle.h opt value;
156);;
157
158let cs_disasm handle code address count = (
159 _cs_disasm_internal handle.a handle.h code address count;
160);;
161
162let cs_reg_name handle id = (
163 _cs_reg_name handle.h id;
164);;
165
166let cs_insn_name handle id = (
167 _cs_insn_name handle.h id;
168);;
169
170let cs_group_name handle id = (
171 _cs_group_name handle.h id;
172);;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800173
174class cs_insn c a =
175 let csh = c in
Nguyen Anh Quynh6dc1dd52014-09-27 00:40:34 +0800176 let (id, address, size, bytes, mnemonic, op_str, regs_read,
177 regs_write, groups, arch) =
Guillaume Jeannecece24e2014-06-26 15:35:06 +0200178 (a.id, a.address, a.size, a.bytes, a.mnemonic, a.op_str,
Nguyen Anh Quynh6dc1dd52014-09-27 00:40:34 +0800179 a.regs_read, a.regs_write, a.groups, a.arch) in
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800180 object
181 method id = id;
182 method address = address;
183 method size = size;
Guillaume Jeannecece24e2014-06-26 15:35:06 +0200184 method bytes = bytes;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800185 method mnemonic = mnemonic;
186 method op_str = op_str;
187 method regs_read = regs_read;
188 method regs_write = regs_write;
189 method groups = groups;
190 method arch = arch;
Nguyen Anh Quynhfe4822c2014-10-04 16:30:02 +0800191 method reg_name id = _cs_reg_name csh.h id;
192 method insn_name id = _cs_insn_name csh.h id;
193 method group_name id = _cs_group_name csh.h id;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800194 end;;
195
196let cs_insn_group handle insn group_id =
197 List.exists (fun g -> g == group_id) (Array.to_list insn.groups);;
198
199let cs_reg_read handle insn reg_id =
200 List.exists (fun g -> g == reg_id) (Array.to_list insn.regs_read);;
201
202let cs_reg_write handle insn reg_id =
203 List.exists (fun g -> g == reg_id) (Array.to_list insn.regs_write);;
204
205
206class cs a m =
207 let mode = m and arch = a in
Nguyen Anh Quynhfe4822c2014-10-04 16:30:02 +0800208 let handle = cs_open arch mode in
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800209 object
210 method disasm code offset count =
Nguyen Anh Quynhfe4822c2014-10-04 16:30:02 +0800211 let insns = (_cs_disasm_internal arch handle.h code offset count) in
Guillaume Jeannecece24e2014-06-26 15:35:06 +0200212 List.map (fun x -> new cs_insn handle x) insns;
Nguyen Anh Quynh26ee41a2013-11-27 12:11:31 +0800213
214 end;;