blob: 4a03ebea0ca9a38fc03e1a8a9dac64024621c420 [file] [log] [blame]
Ian Rogers706a10e2012-03-23 17:00:55 -07001/*
2 * Copyright (C) 2012 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#include "disassembler_x86.h"
18
Ian Rogers706a10e2012-03-23 17:00:55 -070019#include <iostream>
20
Elliott Hughes07ed66b2012-12-12 18:34:25 -080021#include "base/logging.h"
Elliott Hughese222ee02012-12-13 14:41:43 -080022#include "base/stringprintf.h"
Elliott Hughes92301d92012-04-10 15:57:52 -070023#include "thread.h"
Elliott Hughes0f3c5532012-03-30 14:51:51 -070024
Ian Rogers706a10e2012-03-23 17:00:55 -070025namespace art {
26namespace x86 {
27
Ian Rogersb23a7722012-10-09 16:54:26 -070028size_t DisassemblerX86::Dump(std::ostream& os, const uint8_t* begin) {
29 return DumpInstruction(os, begin);
30}
31
Ian Rogers706a10e2012-03-23 17:00:55 -070032void DisassemblerX86::Dump(std::ostream& os, const uint8_t* begin, const uint8_t* end) {
33 size_t length = 0;
34 for (const uint8_t* cur = begin; cur < end; cur += length) {
35 length = DumpInstruction(os, cur);
36 }
37}
38
39static const char* gReg8Names[] = { "al", "cl", "dl", "bl", "ah", "ch", "dh", "bh" };
jeffhao703f2cd2012-07-13 17:25:52 -070040static const char* gReg16Names[] = { "ax", "cx", "dx", "bx", "sp", "bp", "si", "di" };
41static const char* gReg32Names[] = { "eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi" };
Ian Rogers38e12032014-03-14 14:06:14 -070042static const char* gReg64Names[] = {
43 "rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi",
44 "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"
45};
Ian Rogers706a10e2012-03-23 17:00:55 -070046
Ian Rogers38e12032014-03-14 14:06:14 -070047static void DumpReg0(std::ostream& os, uint8_t rex, size_t reg,
Ian Rogers706a10e2012-03-23 17:00:55 -070048 bool byte_operand, uint8_t size_override) {
Ian Rogers38e12032014-03-14 14:06:14 -070049 DCHECK_LT(reg, (rex == 0) ? 8u : 16u);
50 bool rex_w = (rex & 0b1000) != 0;
51 size_t size = byte_operand ? 1 : (size_override == 0x66 ? 2 : (rex_w ? 8 :4));
Ian Rogers706a10e2012-03-23 17:00:55 -070052 switch (size) {
53 case 1: os << gReg8Names[reg]; break;
54 case 2: os << gReg16Names[reg]; break;
55 case 4: os << gReg32Names[reg]; break;
Ian Rogers38e12032014-03-14 14:06:14 -070056 case 8: os << gReg64Names[reg]; break;
Ian Rogers706a10e2012-03-23 17:00:55 -070057 default: LOG(FATAL) << "unexpected size " << size;
58 }
59}
60
Ian Rogersbf989802012-04-16 16:07:49 -070061enum RegFile { GPR, MMX, SSE };
62
Ian Rogers706a10e2012-03-23 17:00:55 -070063static void DumpReg(std::ostream& os, uint8_t rex, uint8_t reg,
Ian Rogersbf989802012-04-16 16:07:49 -070064 bool byte_operand, uint8_t size_override, RegFile reg_file) {
Ian Rogers38e12032014-03-14 14:06:14 -070065 bool rex_r = (rex & 0b0100) != 0;
66 size_t reg_num = rex_r ? (reg + 8) : reg;
Ian Rogersbf989802012-04-16 16:07:49 -070067 if (reg_file == GPR) {
68 DumpReg0(os, rex, reg_num, byte_operand, size_override);
69 } else if (reg_file == SSE) {
70 os << "xmm" << reg_num;
71 } else {
72 os << "mm" << reg_num;
73 }
Ian Rogers706a10e2012-03-23 17:00:55 -070074}
75
Ian Rogers7caad772012-03-30 01:07:54 -070076static void DumpBaseReg(std::ostream& os, uint8_t rex, uint8_t reg) {
Ian Rogers38e12032014-03-14 14:06:14 -070077 bool rex_b = (rex & 0b0001) != 0;
78 size_t reg_num = rex_b ? (reg + 8) : reg;
Ian Rogers7caad772012-03-30 01:07:54 -070079 DumpReg0(os, rex, reg_num, false, 0);
Ian Rogers706a10e2012-03-23 17:00:55 -070080}
81
Ian Rogers7caad772012-03-30 01:07:54 -070082static void DumpIndexReg(std::ostream& os, uint8_t rex, uint8_t reg) {
Ian Rogers38e12032014-03-14 14:06:14 -070083 bool rex_x = (rex & 0b0010) != 0;
84 uint8_t reg_num = rex_x ? (reg + 8) : reg;
Ian Rogers7caad772012-03-30 01:07:54 -070085 DumpReg0(os, rex, reg_num, false, 0);
Ian Rogers706a10e2012-03-23 17:00:55 -070086}
87
Elliott Hughes92301d92012-04-10 15:57:52 -070088enum SegmentPrefix {
89 kCs = 0x2e,
90 kSs = 0x36,
91 kDs = 0x3e,
92 kEs = 0x26,
93 kFs = 0x64,
94 kGs = 0x65,
95};
96
Ian Rogers706a10e2012-03-23 17:00:55 -070097static void DumpSegmentOverride(std::ostream& os, uint8_t segment_prefix) {
98 switch (segment_prefix) {
Elliott Hughes92301d92012-04-10 15:57:52 -070099 case kCs: os << "cs:"; break;
100 case kSs: os << "ss:"; break;
101 case kDs: os << "ds:"; break;
102 case kEs: os << "es:"; break;
103 case kFs: os << "fs:"; break;
104 case kGs: os << "gs:"; break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700105 default: break;
106 }
107}
108
109size_t DisassemblerX86::DumpInstruction(std::ostream& os, const uint8_t* instr) {
110 const uint8_t* begin_instr = instr;
111 bool have_prefixes = true;
112 uint8_t prefix[4] = {0, 0, 0, 0};
113 const char** modrm_opcodes = NULL;
114 do {
115 switch (*instr) {
Ian Rogers7caad772012-03-30 01:07:54 -0700116 // Group 1 - lock and repeat prefixes:
Ian Rogers706a10e2012-03-23 17:00:55 -0700117 case 0xF0:
118 case 0xF2:
119 case 0xF3:
120 prefix[0] = *instr;
121 break;
122 // Group 2 - segment override prefixes:
Elliott Hughes92301d92012-04-10 15:57:52 -0700123 case kCs:
124 case kSs:
125 case kDs:
126 case kEs:
127 case kFs:
128 case kGs:
Ian Rogers706a10e2012-03-23 17:00:55 -0700129 prefix[1] = *instr;
130 break;
131 // Group 3 - operand size override:
132 case 0x66:
133 prefix[2] = *instr;
134 break;
135 // Group 4 - address size override:
136 case 0x67:
137 prefix[3] = *instr;
138 break;
139 default:
140 have_prefixes = false;
141 break;
142 }
143 if (have_prefixes) {
144 instr++;
145 }
146 } while (have_prefixes);
Ian Rogers38e12032014-03-14 14:06:14 -0700147 uint8_t rex = (supports_rex_ && (*instr >= 0x40) && (*instr <= 0x4F)) ? *instr : 0;
Ian Rogers706a10e2012-03-23 17:00:55 -0700148 bool has_modrm = false;
149 bool reg_is_opcode = false;
150 size_t immediate_bytes = 0;
151 size_t branch_bytes = 0;
152 std::ostringstream opcode;
153 bool store = false; // stores to memory (ie rm is on the left)
154 bool load = false; // loads from memory (ie rm is on the right)
155 bool byte_operand = false;
156 bool ax = false; // implicit use of ax
jeffhaoe2962482012-06-28 11:29:57 -0700157 bool cx = false; // implicit use of cx
Ian Rogers706a10e2012-03-23 17:00:55 -0700158 bool reg_in_opcode = false; // low 3-bits of opcode encode register parameter
jeffhao703f2cd2012-07-13 17:25:52 -0700159 bool no_ops = false;
Ian Rogersbf989802012-04-16 16:07:49 -0700160 RegFile src_reg_file = GPR;
161 RegFile dst_reg_file = GPR;
Ian Rogers706a10e2012-03-23 17:00:55 -0700162 switch (*instr) {
163#define DISASSEMBLER_ENTRY(opname, \
164 rm8_r8, rm32_r32, \
165 r8_rm8, r32_rm32, \
166 ax8_i8, ax32_i32) \
167 case rm8_r8: opcode << #opname; store = true; has_modrm = true; byte_operand = true; break; \
168 case rm32_r32: opcode << #opname; store = true; has_modrm = true; break; \
169 case r8_rm8: opcode << #opname; load = true; has_modrm = true; byte_operand = true; break; \
170 case r32_rm32: opcode << #opname; load = true; has_modrm = true; break; \
171 case ax8_i8: opcode << #opname; ax = true; immediate_bytes = 1; byte_operand = true; break; \
172 case ax32_i32: opcode << #opname; ax = true; immediate_bytes = 4; break;
173
174DISASSEMBLER_ENTRY(add,
175 0x00 /* RegMem8/Reg8 */, 0x01 /* RegMem32/Reg32 */,
176 0x02 /* Reg8/RegMem8 */, 0x03 /* Reg32/RegMem32 */,
177 0x04 /* Rax8/imm8 opcode */, 0x05 /* Rax32/imm32 */)
178DISASSEMBLER_ENTRY(or,
179 0x08 /* RegMem8/Reg8 */, 0x09 /* RegMem32/Reg32 */,
180 0x0A /* Reg8/RegMem8 */, 0x0B /* Reg32/RegMem32 */,
181 0x0C /* Rax8/imm8 opcode */, 0x0D /* Rax32/imm32 */)
182DISASSEMBLER_ENTRY(adc,
183 0x10 /* RegMem8/Reg8 */, 0x11 /* RegMem32/Reg32 */,
184 0x12 /* Reg8/RegMem8 */, 0x13 /* Reg32/RegMem32 */,
185 0x14 /* Rax8/imm8 opcode */, 0x15 /* Rax32/imm32 */)
186DISASSEMBLER_ENTRY(sbb,
187 0x18 /* RegMem8/Reg8 */, 0x19 /* RegMem32/Reg32 */,
188 0x1A /* Reg8/RegMem8 */, 0x1B /* Reg32/RegMem32 */,
189 0x1C /* Rax8/imm8 opcode */, 0x1D /* Rax32/imm32 */)
190DISASSEMBLER_ENTRY(and,
191 0x20 /* RegMem8/Reg8 */, 0x21 /* RegMem32/Reg32 */,
192 0x22 /* Reg8/RegMem8 */, 0x23 /* Reg32/RegMem32 */,
193 0x24 /* Rax8/imm8 opcode */, 0x25 /* Rax32/imm32 */)
194DISASSEMBLER_ENTRY(sub,
195 0x28 /* RegMem8/Reg8 */, 0x29 /* RegMem32/Reg32 */,
196 0x2A /* Reg8/RegMem8 */, 0x2B /* Reg32/RegMem32 */,
197 0x2C /* Rax8/imm8 opcode */, 0x2D /* Rax32/imm32 */)
198DISASSEMBLER_ENTRY(xor,
199 0x30 /* RegMem8/Reg8 */, 0x31 /* RegMem32/Reg32 */,
200 0x32 /* Reg8/RegMem8 */, 0x33 /* Reg32/RegMem32 */,
201 0x34 /* Rax8/imm8 opcode */, 0x35 /* Rax32/imm32 */)
202DISASSEMBLER_ENTRY(cmp,
203 0x38 /* RegMem8/Reg8 */, 0x39 /* RegMem32/Reg32 */,
204 0x3A /* Reg8/RegMem8 */, 0x3B /* Reg32/RegMem32 */,
205 0x3C /* Rax8/imm8 opcode */, 0x3D /* Rax32/imm32 */)
206
207#undef DISASSEMBLER_ENTRY
208 case 0x50: case 0x51: case 0x52: case 0x53: case 0x54: case 0x55: case 0x56: case 0x57:
209 opcode << "push";
210 reg_in_opcode = true;
211 break;
212 case 0x58: case 0x59: case 0x5A: case 0x5B: case 0x5C: case 0x5D: case 0x5E: case 0x5F:
213 opcode << "pop";
214 reg_in_opcode = true;
215 break;
216 case 0x68: opcode << "push"; immediate_bytes = 4; break;
Mark Mendelld19b55a2013-12-12 09:55:34 -0800217 case 0x69: opcode << "imul"; load = true; has_modrm = true; immediate_bytes = 4; break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700218 case 0x6A: opcode << "push"; immediate_bytes = 1; break;
Mark Mendelld19b55a2013-12-12 09:55:34 -0800219 case 0x6B: opcode << "imul"; load = true; has_modrm = true; immediate_bytes = 1; break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700220 case 0x70: case 0x71: case 0x72: case 0x73: case 0x74: case 0x75: case 0x76: case 0x77:
221 case 0x78: case 0x79: case 0x7A: case 0x7B: case 0x7C: case 0x7D: case 0x7E: case 0x7F:
222 static const char* condition_codes[] =
Elliott Hughesb25c3f62012-03-26 16:35:06 -0700223 {"o", "no", "b/nae/c", "nb/ae/nc", "z/eq", "nz/ne", "be/na", "nbe/a",
224 "s", "ns", "p/pe", "np/po", "l/nge", "nl/ge", "le/ng", "nle/g"
Ian Rogers706a10e2012-03-23 17:00:55 -0700225 };
226 opcode << "j" << condition_codes[*instr & 0xF];
227 branch_bytes = 1;
228 break;
Razvan A Lupusoru99ad7232014-02-25 17:41:08 -0800229 case 0x86: case 0x87:
230 opcode << "xchg";
231 store = true;
232 has_modrm = true;
233 byte_operand = (*instr == 0x86);
234 break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700235 case 0x88: opcode << "mov"; store = true; has_modrm = true; byte_operand = true; break;
236 case 0x89: opcode << "mov"; store = true; has_modrm = true; break;
237 case 0x8A: opcode << "mov"; load = true; has_modrm = true; byte_operand = true; break;
238 case 0x8B: opcode << "mov"; load = true; has_modrm = true; break;
239
240 case 0x0F: // 2 byte extended opcode
241 instr++;
242 switch (*instr) {
Ian Rogers7caad772012-03-30 01:07:54 -0700243 case 0x10: case 0x11:
244 if (prefix[0] == 0xF2) {
245 opcode << "movsd";
jeffhaofdffdf82012-07-11 16:08:43 -0700246 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogers7caad772012-03-30 01:07:54 -0700247 } else if (prefix[0] == 0xF3) {
248 opcode << "movss";
jeffhaofdffdf82012-07-11 16:08:43 -0700249 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogers7caad772012-03-30 01:07:54 -0700250 } else if (prefix[2] == 0x66) {
251 opcode << "movupd";
jeffhaofdffdf82012-07-11 16:08:43 -0700252 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogers7caad772012-03-30 01:07:54 -0700253 } else {
254 opcode << "movups";
255 }
256 has_modrm = true;
Ian Rogersbf989802012-04-16 16:07:49 -0700257 src_reg_file = dst_reg_file = SSE;
Ian Rogers7caad772012-03-30 01:07:54 -0700258 load = *instr == 0x10;
259 store = !load;
260 break;
Razvan A Lupusoru2c498d12014-01-29 16:02:57 -0800261 case 0x12: case 0x13:
262 if (prefix[2] == 0x66) {
263 opcode << "movlpd";
264 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
265 } else if (prefix[0] == 0) {
266 opcode << "movlps";
267 }
268 has_modrm = true;
269 src_reg_file = dst_reg_file = SSE;
270 load = *instr == 0x12;
271 store = !load;
272 break;
273 case 0x16: case 0x17:
274 if (prefix[2] == 0x66) {
275 opcode << "movhpd";
276 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
277 } else if (prefix[0] == 0) {
278 opcode << "movhps";
279 }
280 has_modrm = true;
281 src_reg_file = dst_reg_file = SSE;
282 load = *instr == 0x16;
283 store = !load;
284 break;
285 case 0x28: case 0x29:
286 if (prefix[2] == 0x66) {
287 opcode << "movapd";
288 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
289 } else if (prefix[0] == 0) {
290 opcode << "movaps";
291 }
292 has_modrm = true;
293 src_reg_file = dst_reg_file = SSE;
294 load = *instr == 0x28;
295 store = !load;
296 break;
jeffhaofdffdf82012-07-11 16:08:43 -0700297 case 0x2A:
298 if (prefix[2] == 0x66) {
299 opcode << "cvtpi2pd";
300 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
301 } else if (prefix[0] == 0xF2) {
302 opcode << "cvtsi2sd";
303 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
304 } else if (prefix[0] == 0xF3) {
305 opcode << "cvtsi2ss";
306 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
307 } else {
308 opcode << "cvtpi2ps";
309 }
310 load = true;
311 has_modrm = true;
312 dst_reg_file = SSE;
313 break;
314 case 0x2C:
315 if (prefix[2] == 0x66) {
316 opcode << "cvttpd2pi";
317 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
318 } else if (prefix[0] == 0xF2) {
319 opcode << "cvttsd2si";
320 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
321 } else if (prefix[0] == 0xF3) {
322 opcode << "cvttss2si";
323 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
324 } else {
325 opcode << "cvttps2pi";
326 }
327 load = true;
328 has_modrm = true;
329 src_reg_file = SSE;
330 break;
331 case 0x2D:
332 if (prefix[2] == 0x66) {
333 opcode << "cvtpd2pi";
334 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
335 } else if (prefix[0] == 0xF2) {
336 opcode << "cvtsd2si";
337 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
338 } else if (prefix[0] == 0xF3) {
339 opcode << "cvtss2si";
340 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
341 } else {
342 opcode << "cvtps2pi";
343 }
344 load = true;
345 has_modrm = true;
346 src_reg_file = SSE;
347 break;
348 case 0x2E:
349 opcode << "u";
350 // FALLTHROUGH
351 case 0x2F:
352 if (prefix[2] == 0x66) {
353 opcode << "comisd";
354 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
355 } else {
356 opcode << "comiss";
357 }
358 has_modrm = true;
359 load = true;
360 src_reg_file = dst_reg_file = SSE;
361 break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700362 case 0x38: // 3 byte extended opcode
363 opcode << StringPrintf("unknown opcode '0F 38 %02X'", *instr);
364 break;
365 case 0x3A: // 3 byte extended opcode
366 opcode << StringPrintf("unknown opcode '0F 3A %02X'", *instr);
367 break;
Razvan A Lupusorubd288c22013-12-20 17:27:23 -0800368 case 0x40: case 0x41: case 0x42: case 0x43: case 0x44: case 0x45: case 0x46: case 0x47:
369 case 0x48: case 0x49: case 0x4A: case 0x4B: case 0x4C: case 0x4D: case 0x4E: case 0x4F:
370 opcode << "cmov" << condition_codes[*instr & 0xF];
371 has_modrm = true;
372 load = true;
373 break;
Ian Rogersbf989802012-04-16 16:07:49 -0700374 case 0x50: case 0x51: case 0x52: case 0x53: case 0x54: case 0x55: case 0x56: case 0x57:
375 case 0x58: case 0x59: case 0x5C: case 0x5D: case 0x5E: case 0x5F: {
376 switch (*instr) {
377 case 0x50: opcode << "movmsk"; break;
378 case 0x51: opcode << "sqrt"; break;
379 case 0x52: opcode << "rsqrt"; break;
380 case 0x53: opcode << "rcp"; break;
381 case 0x54: opcode << "and"; break;
382 case 0x55: opcode << "andn"; break;
383 case 0x56: opcode << "or"; break;
384 case 0x57: opcode << "xor"; break;
385 case 0x58: opcode << "add"; break;
386 case 0x59: opcode << "mul"; break;
387 case 0x5C: opcode << "sub"; break;
388 case 0x5D: opcode << "min"; break;
389 case 0x5E: opcode << "div"; break;
390 case 0x5F: opcode << "max"; break;
391 default: LOG(FATAL) << "Unreachable";
392 }
393 if (prefix[2] == 0x66) {
394 opcode << "pd";
jeffhaofdffdf82012-07-11 16:08:43 -0700395 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700396 } else if (prefix[0] == 0xF2) {
397 opcode << "sd";
jeffhaofdffdf82012-07-11 16:08:43 -0700398 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700399 } else if (prefix[0] == 0xF3) {
400 opcode << "ss";
jeffhaofdffdf82012-07-11 16:08:43 -0700401 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700402 } else {
403 opcode << "ps";
404 }
405 load = true;
406 has_modrm = true;
407 src_reg_file = dst_reg_file = SSE;
408 break;
409 }
410 case 0x5A:
411 if (prefix[2] == 0x66) {
412 opcode << "cvtpd2ps";
jeffhaofdffdf82012-07-11 16:08:43 -0700413 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700414 } else if (prefix[0] == 0xF2) {
415 opcode << "cvtsd2ss";
jeffhaofdffdf82012-07-11 16:08:43 -0700416 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700417 } else if (prefix[0] == 0xF3) {
418 opcode << "cvtss2sd";
jeffhaofdffdf82012-07-11 16:08:43 -0700419 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700420 } else {
421 opcode << "cvtps2pd";
422 }
423 load = true;
424 has_modrm = true;
425 src_reg_file = dst_reg_file = SSE;
426 break;
427 case 0x5B:
428 if (prefix[2] == 0x66) {
429 opcode << "cvtps2dq";
jeffhaofdffdf82012-07-11 16:08:43 -0700430 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700431 } else if (prefix[0] == 0xF2) {
432 opcode << "bad opcode F2 0F 5B";
433 } else if (prefix[0] == 0xF3) {
434 opcode << "cvttps2dq";
jeffhaofdffdf82012-07-11 16:08:43 -0700435 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700436 } else {
437 opcode << "cvtdq2ps";
438 }
439 load = true;
440 has_modrm = true;
441 src_reg_file = dst_reg_file = SSE;
442 break;
Razvan A Lupusorud3266bc2014-01-24 12:55:31 -0800443 case 0x62:
444 if (prefix[2] == 0x66) {
445 src_reg_file = dst_reg_file = SSE;
446 prefix[2] = 0; // Clear prefix now. It has served its purpose as part of the opcode.
447 } else {
448 src_reg_file = dst_reg_file = MMX;
449 }
450 opcode << "punpckldq";
451 load = true;
452 has_modrm = true;
453 break;
Ian Rogersbf989802012-04-16 16:07:49 -0700454 case 0x6E:
455 if (prefix[2] == 0x66) {
456 dst_reg_file = SSE;
jeffhaofdffdf82012-07-11 16:08:43 -0700457 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700458 } else {
459 dst_reg_file = MMX;
Ian Rogersbf989802012-04-16 16:07:49 -0700460 }
jeffhaofdffdf82012-07-11 16:08:43 -0700461 opcode << "movd";
Ian Rogersbf989802012-04-16 16:07:49 -0700462 load = true;
463 has_modrm = true;
464 break;
465 case 0x6F:
466 if (prefix[2] == 0x66) {
467 dst_reg_file = SSE;
468 opcode << "movdqa";
jeffhaofdffdf82012-07-11 16:08:43 -0700469 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700470 } else if (prefix[0] == 0xF3) {
471 dst_reg_file = SSE;
472 opcode << "movdqu";
jeffhaofdffdf82012-07-11 16:08:43 -0700473 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
Ian Rogersbf989802012-04-16 16:07:49 -0700474 } else {
475 dst_reg_file = MMX;
476 opcode << "movq";
477 }
478 load = true;
479 has_modrm = true;
480 break;
jeffhaofdffdf82012-07-11 16:08:43 -0700481 case 0x71:
482 if (prefix[2] == 0x66) {
483 dst_reg_file = SSE;
484 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
485 } else {
486 dst_reg_file = MMX;
487 }
488 static const char* x71_opcodes[] = {"unknown-71", "unknown-71", "psrlw", "unknown-71", "psraw", "unknown-71", "psllw", "unknown-71"};
489 modrm_opcodes = x71_opcodes;
490 reg_is_opcode = true;
491 has_modrm = true;
492 store = true;
493 immediate_bytes = 1;
494 break;
495 case 0x72:
496 if (prefix[2] == 0x66) {
497 dst_reg_file = SSE;
498 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
499 } else {
500 dst_reg_file = MMX;
501 }
502 static const char* x72_opcodes[] = {"unknown-72", "unknown-72", "psrld", "unknown-72", "psrad", "unknown-72", "pslld", "unknown-72"};
503 modrm_opcodes = x72_opcodes;
504 reg_is_opcode = true;
505 has_modrm = true;
506 store = true;
507 immediate_bytes = 1;
508 break;
509 case 0x73:
510 if (prefix[2] == 0x66) {
511 dst_reg_file = SSE;
512 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
513 } else {
514 dst_reg_file = MMX;
515 }
516 static const char* x73_opcodes[] = {"unknown-73", "unknown-73", "psrlq", "unknown-73", "unknown-73", "unknown-73", "psllq", "unknown-73"};
517 modrm_opcodes = x73_opcodes;
518 reg_is_opcode = true;
519 has_modrm = true;
520 store = true;
521 immediate_bytes = 1;
522 break;
523 case 0x7E:
524 if (prefix[2] == 0x66) {
525 src_reg_file = SSE;
526 prefix[2] = 0; // clear prefix now it's served its purpose as part of the opcode
527 } else {
528 src_reg_file = MMX;
529 }
530 opcode << "movd";
531 has_modrm = true;
532 store = true;
533 break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700534 case 0x80: case 0x81: case 0x82: case 0x83: case 0x84: case 0x85: case 0x86: case 0x87:
535 case 0x88: case 0x89: case 0x8A: case 0x8B: case 0x8C: case 0x8D: case 0x8E: case 0x8F:
536 opcode << "j" << condition_codes[*instr & 0xF];
537 branch_bytes = 4;
538 break;
Ian Rogers7caad772012-03-30 01:07:54 -0700539 case 0x90: case 0x91: case 0x92: case 0x93: case 0x94: case 0x95: case 0x96: case 0x97:
540 case 0x98: case 0x99: case 0x9A: case 0x9B: case 0x9C: case 0x9D: case 0x9E: case 0x9F:
541 opcode << "set" << condition_codes[*instr & 0xF];
542 modrm_opcodes = NULL;
543 reg_is_opcode = true;
544 has_modrm = true;
545 store = true;
546 break;
Mark Mendell4708dcd2014-01-22 09:05:18 -0800547 case 0xA4:
548 opcode << "shld";
549 has_modrm = true;
550 load = true;
551 immediate_bytes = 1;
552 break;
553 case 0xAC:
554 opcode << "shrd";
555 has_modrm = true;
556 load = true;
557 immediate_bytes = 1;
558 break;
jeffhao703f2cd2012-07-13 17:25:52 -0700559 case 0xAE:
560 if (prefix[0] == 0xF3) {
Ian Rogers5e588b32013-02-21 15:05:09 -0800561 prefix[0] = 0; // clear prefix now it's served its purpose as part of the opcode
jeffhao703f2cd2012-07-13 17:25:52 -0700562 static const char* xAE_opcodes[] = {"rdfsbase", "rdgsbase", "wrfsbase", "wrgsbase", "unknown-AE", "unknown-AE", "unknown-AE", "unknown-AE"};
563 modrm_opcodes = xAE_opcodes;
564 reg_is_opcode = true;
565 has_modrm = true;
566 uint8_t reg_or_opcode = (instr[1] >> 3) & 7;
567 switch (reg_or_opcode) {
568 case 0:
569 prefix[1] = kFs;
570 load = true;
571 break;
572 case 1:
573 prefix[1] = kGs;
574 load = true;
575 break;
576 case 2:
577 prefix[1] = kFs;
578 store = true;
579 break;
580 case 3:
581 prefix[1] = kGs;
582 store = true;
583 break;
584 default:
585 load = true;
586 break;
587 }
588 } else {
589 static const char* xAE_opcodes[] = {"unknown-AE", "unknown-AE", "unknown-AE", "unknown-AE", "unknown-AE", "lfence", "mfence", "sfence"};
590 modrm_opcodes = xAE_opcodes;
591 reg_is_opcode = true;
592 has_modrm = true;
593 load = true;
594 no_ops = true;
595 }
596 break;
Mark Mendellf723f0c2013-12-11 17:50:58 -0800597 case 0xAF: opcode << "imul"; has_modrm = true; load = true; break;
jeffhao83025762012-08-02 11:08:56 -0700598 case 0xB1: opcode << "cmpxchg"; has_modrm = true; store = true; break;
Ian Rogers7caad772012-03-30 01:07:54 -0700599 case 0xB6: opcode << "movzxb"; has_modrm = true; load = true; break;
600 case 0xB7: opcode << "movzxw"; has_modrm = true; load = true; break;
jeffhao854029c2012-07-23 17:31:30 -0700601 case 0xBE: opcode << "movsxb"; has_modrm = true; load = true; break;
602 case 0xBF: opcode << "movsxw"; has_modrm = true; load = true; break;
Vladimir Marko70b797d2013-12-03 15:25:24 +0000603 case 0xC7:
604 static const char* x0FxC7_opcodes[] = { "unknown-0f-c7", "cmpxchg8b", "unknown-0f-c7", "unknown-0f-c7", "unknown-0f-c7", "unknown-0f-c7", "unknown-0f-c7", "unknown-0f-c7" };
605 modrm_opcodes = x0FxC7_opcodes;
606 has_modrm = true;
607 reg_is_opcode = true;
608 store = true;
609 break;
Vladimir Markoa8b4caf2013-10-24 15:08:57 +0100610 case 0xC8: case 0xC9: case 0xCA: case 0xCB: case 0xCC: case 0xCD: case 0xCE: case 0xCF:
611 opcode << "bswap";
612 reg_in_opcode = true;
613 break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700614 default:
615 opcode << StringPrintf("unknown opcode '0F %02X'", *instr);
616 break;
617 }
618 break;
619 case 0x80: case 0x81: case 0x82: case 0x83:
620 static const char* x80_opcodes[] = {"add", "or", "adc", "sbb", "and", "sub", "xor", "cmp"};
621 modrm_opcodes = x80_opcodes;
622 has_modrm = true;
623 reg_is_opcode = true;
624 store = true;
625 byte_operand = (*instr & 1) == 0;
626 immediate_bytes = *instr == 0x81 ? 4 : 1;
627 break;
jeffhao703f2cd2012-07-13 17:25:52 -0700628 case 0x84: case 0x85:
629 opcode << "test";
630 has_modrm = true;
631 load = true;
632 byte_operand = (*instr & 1) == 0;
633 break;
Ian Rogers7caad772012-03-30 01:07:54 -0700634 case 0x8D:
635 opcode << "lea";
636 has_modrm = true;
637 load = true;
638 break;
jeffhao703f2cd2012-07-13 17:25:52 -0700639 case 0x8F:
640 opcode << "pop";
641 has_modrm = true;
642 reg_is_opcode = true;
643 store = true;
644 break;
Mark Mendell2bf31e62014-01-23 12:13:40 -0800645 case 0x99:
646 opcode << "cdq";
647 break;
Mark Mendell4028a6c2014-02-19 20:06:20 -0800648 case 0xAF:
649 opcode << (prefix[2] == 0x66 ? "scasw" : "scasl");
650 break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700651 case 0xB0: case 0xB1: case 0xB2: case 0xB3: case 0xB4: case 0xB5: case 0xB6: case 0xB7:
652 opcode << "mov";
653 immediate_bytes = 1;
654 reg_in_opcode = true;
655 break;
656 case 0xB8: case 0xB9: case 0xBA: case 0xBB: case 0xBC: case 0xBD: case 0xBE: case 0xBF:
657 opcode << "mov";
658 immediate_bytes = 4;
659 reg_in_opcode = true;
660 break;
Ian Rogers7caad772012-03-30 01:07:54 -0700661 case 0xC0: case 0xC1:
jeffhaoe2962482012-06-28 11:29:57 -0700662 case 0xD0: case 0xD1: case 0xD2: case 0xD3:
Ian Rogers7caad772012-03-30 01:07:54 -0700663 static const char* shift_opcodes[] =
664 {"rol", "ror", "rcl", "rcr", "shl", "shr", "unknown-shift", "sar"};
665 modrm_opcodes = shift_opcodes;
666 has_modrm = true;
667 reg_is_opcode = true;
668 store = true;
Elliott Hughes16b5c292012-04-16 20:37:16 -0700669 immediate_bytes = ((*instr & 0xf0) == 0xc0) ? 1 : 0;
jeffhaoe2962482012-06-28 11:29:57 -0700670 cx = (*instr == 0xD2) || (*instr == 0xD3);
671 byte_operand = (*instr == 0xC0);
Ian Rogers7caad772012-03-30 01:07:54 -0700672 break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700673 case 0xC3: opcode << "ret"; break;
Elliott Hughes0589ca92012-04-09 18:26:20 -0700674 case 0xC7:
675 static const char* c7_opcodes[] = {"mov", "unknown-c7", "unknown-c7", "unknown-c7", "unknown-c7", "unknown-c7", "unknown-c7", "unknown-c7"};
676 modrm_opcodes = c7_opcodes;
677 store = true;
678 immediate_bytes = 4;
679 has_modrm = true;
680 reg_is_opcode = true;
681 break;
Ian Rogers7caad772012-03-30 01:07:54 -0700682 case 0xCC: opcode << "int 3"; break;
Mark Mendelld19b55a2013-12-12 09:55:34 -0800683 case 0xD9:
684 static const char* d9_opcodes[] = {"flds", "unknown-d9", "fsts", "fstps", "fldenv", "fldcw", "fnstenv", "fnstcw"};
685 modrm_opcodes = d9_opcodes;
686 store = true;
687 has_modrm = true;
688 reg_is_opcode = true;
689 break;
Razvan A Lupusoru614c2b42014-01-28 17:05:21 -0800690 case 0xDB:
691 static const char* db_opcodes[] = {"fildl", "unknown-db", "unknown-db", "unknown-db", "unknown-db", "unknown-db", "unknown-db", "unknown-db"};
692 modrm_opcodes = db_opcodes;
693 load = true;
694 has_modrm = true;
695 reg_is_opcode = true;
696 break;
Mark Mendelld19b55a2013-12-12 09:55:34 -0800697 case 0xDD:
698 static const char* dd_opcodes[] = {"fldl", "fisttp", "fstl", "fstpl", "frstor", "unknown-dd", "fnsave", "fnstsw"};
699 modrm_opcodes = dd_opcodes;
700 store = true;
701 has_modrm = true;
702 reg_is_opcode = true;
703 break;
Razvan A Lupusoru614c2b42014-01-28 17:05:21 -0800704 case 0xDF:
705 static const char* df_opcodes[] = {"fild", "unknown-df", "unknown-df", "unknown-df", "unknown-df", "fildll", "unknown-df", "unknown-df"};
706 modrm_opcodes = df_opcodes;
707 load = true;
708 has_modrm = true;
709 reg_is_opcode = true;
710 break;
Mark Mendell4028a6c2014-02-19 20:06:20 -0800711 case 0xE3: opcode << "jecxz"; branch_bytes = 1; break;
Ian Rogers7caad772012-03-30 01:07:54 -0700712 case 0xE8: opcode << "call"; branch_bytes = 4; break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700713 case 0xE9: opcode << "jmp"; branch_bytes = 4; break;
714 case 0xEB: opcode << "jmp"; branch_bytes = 1; break;
jeffhao77ae36b2012-08-07 14:18:16 -0700715 case 0xF5: opcode << "cmc"; break;
jeffhao174651d2012-04-19 15:27:22 -0700716 case 0xF6: case 0xF7:
717 static const char* f7_opcodes[] = {"test", "unknown-f7", "not", "neg", "mul edx:eax, eax *", "imul edx:eax, eax *", "div edx:eax, edx:eax /", "idiv edx:eax, edx:eax /"};
718 modrm_opcodes = f7_opcodes;
719 has_modrm = true;
720 reg_is_opcode = true;
721 store = true;
722 immediate_bytes = ((instr[1] & 0x38) == 0) ? 1 : 0;
723 break;
Ian Rogers706a10e2012-03-23 17:00:55 -0700724 case 0xFF:
725 static const char* ff_opcodes[] = {"inc", "dec", "call", "call", "jmp", "jmp", "push", "unknown-ff"};
726 modrm_opcodes = ff_opcodes;
727 has_modrm = true;
728 reg_is_opcode = true;
729 load = true;
730 break;
731 default:
732 opcode << StringPrintf("unknown opcode '%02X'", *instr);
733 break;
734 }
735 std::ostringstream args;
736 if (reg_in_opcode) {
737 DCHECK(!has_modrm);
Ian Rogersbf989802012-04-16 16:07:49 -0700738 DumpReg(args, rex, *instr & 0x7, false, prefix[2], GPR);
Ian Rogers706a10e2012-03-23 17:00:55 -0700739 }
740 instr++;
Elliott Hughes92301d92012-04-10 15:57:52 -0700741 uint32_t address_bits = 0;
Ian Rogers706a10e2012-03-23 17:00:55 -0700742 if (has_modrm) {
743 uint8_t modrm = *instr;
744 instr++;
745 uint8_t mod = modrm >> 6;
746 uint8_t reg_or_opcode = (modrm >> 3) & 7;
747 uint8_t rm = modrm & 7;
748 std::ostringstream address;
749 if (mod == 0 && rm == 5) { // fixed address
Elliott Hughes92301d92012-04-10 15:57:52 -0700750 address_bits = *reinterpret_cast<const uint32_t*>(instr);
751 address << StringPrintf("[0x%x]", address_bits);
Ian Rogers706a10e2012-03-23 17:00:55 -0700752 instr += 4;
753 } else if (rm == 4 && mod != 3) { // SIB
754 uint8_t sib = *instr;
755 instr++;
756 uint8_t ss = (sib >> 6) & 3;
757 uint8_t index = (sib >> 3) & 7;
758 uint8_t base = sib & 7;
759 address << "[";
760 if (base != 5 || mod != 0) {
Ian Rogers7caad772012-03-30 01:07:54 -0700761 DumpBaseReg(address, rex, base);
Ian Rogers706a10e2012-03-23 17:00:55 -0700762 if (index != 4) {
763 address << " + ";
764 }
765 }
766 if (index != 4) {
Ian Rogers7caad772012-03-30 01:07:54 -0700767 DumpIndexReg(address, rex, index);
Ian Rogers706a10e2012-03-23 17:00:55 -0700768 if (ss != 0) {
769 address << StringPrintf(" * %d", 1 << ss);
770 }
771 }
772 if (mod == 1) {
773 address << StringPrintf(" + %d", *reinterpret_cast<const int8_t*>(instr));
774 instr++;
775 } else if (mod == 2) {
776 address << StringPrintf(" + %d", *reinterpret_cast<const int32_t*>(instr));
777 instr += 4;
778 }
779 address << "]";
780 } else {
Ian Rogersbf989802012-04-16 16:07:49 -0700781 if (mod == 3) {
jeffhao703f2cd2012-07-13 17:25:52 -0700782 if (!no_ops) {
783 DumpReg(address, rex, rm, byte_operand, prefix[2], load ? src_reg_file : dst_reg_file);
784 }
Ian Rogersbf989802012-04-16 16:07:49 -0700785 } else {
Ian Rogers706a10e2012-03-23 17:00:55 -0700786 address << "[";
Ian Rogersbf989802012-04-16 16:07:49 -0700787 DumpBaseReg(address, rex, rm);
788 if (mod == 1) {
789 address << StringPrintf(" + %d", *reinterpret_cast<const int8_t*>(instr));
790 instr++;
791 } else if (mod == 2) {
792 address << StringPrintf(" + %d", *reinterpret_cast<const int32_t*>(instr));
793 instr += 4;
794 }
Ian Rogers706a10e2012-03-23 17:00:55 -0700795 address << "]";
796 }
797 }
798
Ian Rogers7caad772012-03-30 01:07:54 -0700799 if (reg_is_opcode && modrm_opcodes != NULL) {
Ian Rogers706a10e2012-03-23 17:00:55 -0700800 opcode << modrm_opcodes[reg_or_opcode];
801 }
802 if (load) {
803 if (!reg_is_opcode) {
Ian Rogersbf989802012-04-16 16:07:49 -0700804 DumpReg(args, rex, reg_or_opcode, byte_operand, prefix[2], dst_reg_file);
Ian Rogers706a10e2012-03-23 17:00:55 -0700805 args << ", ";
806 }
807 DumpSegmentOverride(args, prefix[1]);
808 args << address.str();
809 } else {
810 DCHECK(store);
811 DumpSegmentOverride(args, prefix[1]);
812 args << address.str();
813 if (!reg_is_opcode) {
814 args << ", ";
Ian Rogersbf989802012-04-16 16:07:49 -0700815 DumpReg(args, rex, reg_or_opcode, byte_operand, prefix[2], src_reg_file);
Ian Rogers706a10e2012-03-23 17:00:55 -0700816 }
817 }
818 }
819 if (ax) {
jeffhaofdffdf82012-07-11 16:08:43 -0700820 // If this opcode implicitly uses ax, ax is always the first arg.
Ian Rogersbf989802012-04-16 16:07:49 -0700821 DumpReg(args, rex, 0 /* EAX */, byte_operand, prefix[2], GPR);
Ian Rogers706a10e2012-03-23 17:00:55 -0700822 }
jeffhaoe2962482012-06-28 11:29:57 -0700823 if (cx) {
824 args << ", ";
825 DumpReg(args, rex, 1 /* ECX */, true, prefix[2], GPR);
826 }
Ian Rogers706a10e2012-03-23 17:00:55 -0700827 if (immediate_bytes > 0) {
jeffhaoe2962482012-06-28 11:29:57 -0700828 if (has_modrm || reg_in_opcode || ax || cx) {
Ian Rogers706a10e2012-03-23 17:00:55 -0700829 args << ", ";
830 }
831 if (immediate_bytes == 1) {
832 args << StringPrintf("%d", *reinterpret_cast<const int8_t*>(instr));
833 instr++;
834 } else {
835 CHECK_EQ(immediate_bytes, 4u);
836 args << StringPrintf("%d", *reinterpret_cast<const int32_t*>(instr));
837 instr += 4;
838 }
839 } else if (branch_bytes > 0) {
840 DCHECK(!has_modrm);
841 int32_t displacement;
842 if (branch_bytes == 1) {
843 displacement = *reinterpret_cast<const int8_t*>(instr);
844 instr++;
845 } else {
846 CHECK_EQ(branch_bytes, 4u);
847 displacement = *reinterpret_cast<const int32_t*>(instr);
848 instr += 4;
849 }
Elliott Hughes14178a92012-04-16 17:24:51 -0700850 args << StringPrintf("%+d (%p)", displacement, instr + displacement);
Ian Rogers706a10e2012-03-23 17:00:55 -0700851 }
Elliott Hughes92301d92012-04-10 15:57:52 -0700852 if (prefix[1] == kFs) {
853 args << " ; ";
854 Thread::DumpThreadOffset(args, address_bits, 4);
855 }
Elliott Hughes28fa76d2012-04-09 17:31:46 -0700856 std::stringstream hex;
Ian Rogers706a10e2012-03-23 17:00:55 -0700857 for (size_t i = 0; begin_instr + i < instr; ++i) {
Elliott Hughes28fa76d2012-04-09 17:31:46 -0700858 hex << StringPrintf("%02X", begin_instr[i]);
Ian Rogers706a10e2012-03-23 17:00:55 -0700859 }
Ian Rogers5e588b32013-02-21 15:05:09 -0800860 std::stringstream prefixed_opcode;
861 switch (prefix[0]) {
862 case 0xF0: prefixed_opcode << "lock "; break;
863 case 0xF2: prefixed_opcode << "repne "; break;
864 case 0xF3: prefixed_opcode << "repe "; break;
865 case 0: break;
866 default: LOG(FATAL) << "Unreachable";
867 }
868 prefixed_opcode << opcode.str();
869 os << StringPrintf("%p: %22s \t%-7s ", begin_instr, hex.str().c_str(),
870 prefixed_opcode.str().c_str())
871 << args.str() << '\n';
Ian Rogers706a10e2012-03-23 17:00:55 -0700872 return instr - begin_instr;
Brian Carlstrom7934ac22013-07-26 10:54:15 -0700873} // NOLINT(readability/fn_size)
Ian Rogers706a10e2012-03-23 17:00:55 -0700874
875} // namespace x86
876} // namespace art