blob: f73f94845ab0840ec8a1ce70f778e6cbccf6a766 [file] [log] [blame]
// Copyright 2009 the V8 project authors. All rights reserved.
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
//       notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
//       copyright notice, this list of conditions and the following
//       disclaimer in the documentation and/or other materials provided
//       with the distribution.
//     * Neither the name of Google Inc. nor the names of its
//       contributors may be used to endorse or promote products derived
//       from this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27
28#include <assert.h>
29#include <stdio.h>
30#include <stdarg.h>
31
32#include "v8.h"
Leon Clarkef7060e22010-06-03 12:02:55 +010033
34#if defined(V8_TARGET_ARCH_X64)
35
Steve Blocka7e24c12009-10-30 11:49:00 +000036#include "disasm.h"
37
38namespace disasm {
39
// Operand ordering of a two-operand instruction, optionally combined with a
// flag marking the operation as fixed 8-bit. The two ordering values and the
// byte flag occupy distinct bits so they can be OR-ed together and separated
// again with a mask.
enum OperandType {
  UNSET_OP_ORDER = 0,
  // Operand size decides between 16, 32 and 64 bit operands.
  REG_OPER_OP_ORDER = 1 << 0,  // Register destination, operand source.
  OPER_REG_OP_ORDER = 1 << 1,  // Operand destination, register source.
  // Fixed 8-bit operands.
  BYTE_SIZE_OPERAND_FLAG = 1 << 2,
  BYTE_REG_OPER_OP_ORDER = BYTE_SIZE_OPERAND_FLAG | REG_OPER_OP_ORDER,
  BYTE_OPER_REG_OP_ORDER = BYTE_SIZE_OPERAND_FLAG | OPER_REG_OP_ORDER
};
50
51//------------------------------------------------------------------
52// Tables
53//------------------------------------------------------------------
54struct ByteMnemonic {
55 int b; // -1 terminates, otherwise must be in range (0..255)
56 OperandType op_order_;
57 const char* mnem;
58};
59
60
61static ByteMnemonic two_operands_instr[] = {
62 { 0x00, BYTE_OPER_REG_OP_ORDER, "add" },
63 { 0x01, OPER_REG_OP_ORDER, "add" },
64 { 0x02, BYTE_REG_OPER_OP_ORDER, "add" },
65 { 0x03, REG_OPER_OP_ORDER, "add" },
66 { 0x08, BYTE_OPER_REG_OP_ORDER, "or" },
67 { 0x09, OPER_REG_OP_ORDER, "or" },
68 { 0x0A, BYTE_REG_OPER_OP_ORDER, "or" },
69 { 0x0B, REG_OPER_OP_ORDER, "or" },
70 { 0x10, BYTE_OPER_REG_OP_ORDER, "adc" },
71 { 0x11, OPER_REG_OP_ORDER, "adc" },
72 { 0x12, BYTE_REG_OPER_OP_ORDER, "adc" },
73 { 0x13, REG_OPER_OP_ORDER, "adc" },
74 { 0x18, BYTE_OPER_REG_OP_ORDER, "sbb" },
75 { 0x19, OPER_REG_OP_ORDER, "sbb" },
76 { 0x1A, BYTE_REG_OPER_OP_ORDER, "sbb" },
77 { 0x1B, REG_OPER_OP_ORDER, "sbb" },
78 { 0x20, BYTE_OPER_REG_OP_ORDER, "and" },
79 { 0x21, OPER_REG_OP_ORDER, "and" },
80 { 0x22, BYTE_REG_OPER_OP_ORDER, "and" },
81 { 0x23, REG_OPER_OP_ORDER, "and" },
82 { 0x28, BYTE_OPER_REG_OP_ORDER, "sub" },
83 { 0x29, OPER_REG_OP_ORDER, "sub" },
84 { 0x2A, BYTE_REG_OPER_OP_ORDER, "sub" },
85 { 0x2B, REG_OPER_OP_ORDER, "sub" },
86 { 0x30, BYTE_OPER_REG_OP_ORDER, "xor" },
87 { 0x31, OPER_REG_OP_ORDER, "xor" },
88 { 0x32, BYTE_REG_OPER_OP_ORDER, "xor" },
89 { 0x33, REG_OPER_OP_ORDER, "xor" },
90 { 0x38, BYTE_OPER_REG_OP_ORDER, "cmp" },
91 { 0x39, OPER_REG_OP_ORDER, "cmp" },
92 { 0x3A, BYTE_REG_OPER_OP_ORDER, "cmp" },
93 { 0x3B, REG_OPER_OP_ORDER, "cmp" },
94 { 0x63, REG_OPER_OP_ORDER, "movsxlq" },
95 { 0x84, BYTE_REG_OPER_OP_ORDER, "test" },
96 { 0x85, REG_OPER_OP_ORDER, "test" },
97 { 0x86, BYTE_REG_OPER_OP_ORDER, "xchg" },
98 { 0x87, REG_OPER_OP_ORDER, "xchg" },
99 { 0x88, BYTE_OPER_REG_OP_ORDER, "mov" },
100 { 0x89, OPER_REG_OP_ORDER, "mov" },
101 { 0x8A, BYTE_REG_OPER_OP_ORDER, "mov" },
102 { 0x8B, REG_OPER_OP_ORDER, "mov" },
103 { 0x8D, REG_OPER_OP_ORDER, "lea" },
104 { -1, UNSET_OP_ORDER, "" }
105};
106
107
108static ByteMnemonic zero_operands_instr[] = {
109 { 0xC3, UNSET_OP_ORDER, "ret" },
110 { 0xC9, UNSET_OP_ORDER, "leave" },
111 { 0xF4, UNSET_OP_ORDER, "hlt" },
112 { 0xCC, UNSET_OP_ORDER, "int3" },
113 { 0x60, UNSET_OP_ORDER, "pushad" },
114 { 0x61, UNSET_OP_ORDER, "popad" },
115 { 0x9C, UNSET_OP_ORDER, "pushfd" },
116 { 0x9D, UNSET_OP_ORDER, "popfd" },
117 { 0x9E, UNSET_OP_ORDER, "sahf" },
118 { 0x99, UNSET_OP_ORDER, "cdq" },
119 { 0x9B, UNSET_OP_ORDER, "fwait" },
Leon Clarked91b9f72010-01-27 17:25:45 +0000120 { 0xA4, UNSET_OP_ORDER, "movs" },
121 { 0xA5, UNSET_OP_ORDER, "movs" },
122 { 0xA6, UNSET_OP_ORDER, "cmps" },
123 { 0xA7, UNSET_OP_ORDER, "cmps" },
Steve Blocka7e24c12009-10-30 11:49:00 +0000124 { -1, UNSET_OP_ORDER, "" }
125};
126
127
128static ByteMnemonic call_jump_instr[] = {
129 { 0xE8, UNSET_OP_ORDER, "call" },
130 { 0xE9, UNSET_OP_ORDER, "jmp" },
131 { -1, UNSET_OP_ORDER, "" }
132};
133
134
135static ByteMnemonic short_immediate_instr[] = {
136 { 0x05, UNSET_OP_ORDER, "add" },
137 { 0x0D, UNSET_OP_ORDER, "or" },
138 { 0x15, UNSET_OP_ORDER, "adc" },
139 { 0x1D, UNSET_OP_ORDER, "sbb" },
140 { 0x25, UNSET_OP_ORDER, "and" },
141 { 0x2D, UNSET_OP_ORDER, "sub" },
142 { 0x35, UNSET_OP_ORDER, "xor" },
143 { 0x3D, UNSET_OP_ORDER, "cmp" },
144 { -1, UNSET_OP_ORDER, "" }
145};
146
147
// Mnemonic suffixes indexed by the low four bits of a conditional opcode
// (used to build "j<suffix>" and "set<suffix>").
static const char* conditional_code_suffix[] = {
  "o",   // 0x0
  "no",  // 0x1
  "c",   // 0x2
  "nc",  // 0x3
  "z",   // 0x4
  "nz",  // 0x5
  "na",  // 0x6
  "a",   // 0x7
  "s",   // 0x8
  "ns",  // 0x9
  "pe",  // 0xA
  "po",  // 0xB
  "l",   // 0xC
  "ge",  // 0xD
  "le",  // 0xE
  "g"    // 0xF
};
152
153
// Decoding category assigned to each one-byte opcode in the instruction
// table. NO_INSTR marks an opcode for which nothing has been registered.
enum InstructionType {
  NO_INSTR = 0,
  ZERO_OPERANDS_INSTR = 1,
  TWO_OPERANDS_INSTR = 2,
  JUMP_CONDITIONAL_SHORT_INSTR = 3,
  REGISTER_INSTR = 4,
  PUSHPOP_INSTR = 5,  // Has implicit 64-bit operand size.
  MOVE_REG_INSTR = 6,
  CALL_JUMP_INSTR = 7,
  SHORT_IMMEDIATE_INSTR = 8
};
165
166
// Byte values of the instruction prefixes the disassembler recognizes.
enum Prefixes {
  ESCAPE_PREFIX = 0x0F,                 // Introduces a two-byte opcode.
  OPERAND_SIZE_OVERRIDE_PREFIX = 0x66,
  ADDRESS_SIZE_OVERRIDE_PREFIX = 0x67,
  REPNE_PREFIX = 0xF2,
  REP_PREFIX = 0xF3,
  REPEQ_PREFIX = REP_PREFIX             // Same byte as REP_PREFIX.
};
175
176
Steve Blocka7e24c12009-10-30 11:49:00 +0000177struct InstructionDesc {
178 const char* mnem;
179 InstructionType type;
180 OperandType op_order_;
181 bool byte_size_operation; // Fixed 8-bit operation.
182};
183
184
185class InstructionTable {
186 public:
187 InstructionTable();
188 const InstructionDesc& Get(byte x) const {
189 return instructions_[x];
190 }
191
192 private:
193 InstructionDesc instructions_[256];
194 void Clear();
195 void Init();
196 void CopyTable(ByteMnemonic bm[], InstructionType type);
197 void SetTableRange(InstructionType type, byte start, byte end, bool byte_size,
198 const char* mnem);
199 void AddJumpConditionalShort();
200};
201
202
203InstructionTable::InstructionTable() {
204 Clear();
205 Init();
206}
207
208
209void InstructionTable::Clear() {
210 for (int i = 0; i < 256; i++) {
211 instructions_[i].mnem = "(bad)";
212 instructions_[i].type = NO_INSTR;
213 instructions_[i].op_order_ = UNSET_OP_ORDER;
214 instructions_[i].byte_size_operation = false;
215 }
216}
217
218
219void InstructionTable::Init() {
220 CopyTable(two_operands_instr, TWO_OPERANDS_INSTR);
221 CopyTable(zero_operands_instr, ZERO_OPERANDS_INSTR);
222 CopyTable(call_jump_instr, CALL_JUMP_INSTR);
223 CopyTable(short_immediate_instr, SHORT_IMMEDIATE_INSTR);
224 AddJumpConditionalShort();
225 SetTableRange(PUSHPOP_INSTR, 0x50, 0x57, false, "push");
226 SetTableRange(PUSHPOP_INSTR, 0x58, 0x5F, false, "pop");
227 SetTableRange(MOVE_REG_INSTR, 0xB8, 0xBF, false, "mov");
228}
229
230
231void InstructionTable::CopyTable(ByteMnemonic bm[], InstructionType type) {
232 for (int i = 0; bm[i].b >= 0; i++) {
233 InstructionDesc* id = &instructions_[bm[i].b];
234 id->mnem = bm[i].mnem;
235 OperandType op_order = bm[i].op_order_;
236 id->op_order_ =
237 static_cast<OperandType>(op_order & ~BYTE_SIZE_OPERAND_FLAG);
Steve Blockd0582a62009-12-15 09:54:21 +0000238 ASSERT_EQ(NO_INSTR, id->type); // Information not already entered
Steve Blocka7e24c12009-10-30 11:49:00 +0000239 id->type = type;
240 id->byte_size_operation = ((op_order & BYTE_SIZE_OPERAND_FLAG) != 0);
241 }
242}
243
244
245void InstructionTable::SetTableRange(InstructionType type,
246 byte start,
247 byte end,
248 bool byte_size,
249 const char* mnem) {
250 for (byte b = start; b <= end; b++) {
251 InstructionDesc* id = &instructions_[b];
Steve Blockd0582a62009-12-15 09:54:21 +0000252 ASSERT_EQ(NO_INSTR, id->type); // Information not already entered
Steve Blocka7e24c12009-10-30 11:49:00 +0000253 id->mnem = mnem;
254 id->type = type;
255 id->byte_size_operation = byte_size;
256 }
257}
258
259
260void InstructionTable::AddJumpConditionalShort() {
261 for (byte b = 0x70; b <= 0x7F; b++) {
262 InstructionDesc* id = &instructions_[b];
Steve Blockd0582a62009-12-15 09:54:21 +0000263 ASSERT_EQ(NO_INSTR, id->type); // Information not already entered
Steve Blocka7e24c12009-10-30 11:49:00 +0000264 id->mnem = NULL; // Computed depending on condition code.
265 id->type = JUMP_CONDITIONAL_SHORT_INSTR;
266 }
267}
268
269
270static InstructionTable instruction_table;
271
272static InstructionDesc cmov_instructions[16] = {
273 {"cmovo", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
274 {"cmovno", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
275 {"cmovc", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
276 {"cmovnc", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
277 {"cmovz", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
278 {"cmovnz", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
279 {"cmovna", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
280 {"cmova", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
281 {"cmovs", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
282 {"cmovns", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
283 {"cmovpe", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
284 {"cmovpo", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
285 {"cmovl", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
286 {"cmovge", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
287 {"cmovle", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false},
288 {"cmovg", TWO_OPERANDS_INSTR, REG_OPER_OP_ORDER, false}
289};
290
291//------------------------------------------------------------------------------
292// DisassemblerX64 implementation.
293
// What the disassembler does when it meets an opcode it cannot decode:
// either keep going (printing a placeholder) or abort.
enum UnimplementedOpcodeAction {
  CONTINUE_ON_UNIMPLEMENTED_OPCODE = 0,
  ABORT_ON_UNIMPLEMENTED_OPCODE = 1
};
298
299// A new DisassemblerX64 object is created to disassemble each instruction.
300// The object can only disassemble a single instruction.
301class DisassemblerX64 {
302 public:
303 DisassemblerX64(const NameConverter& converter,
304 UnimplementedOpcodeAction unimplemented_action =
305 ABORT_ON_UNIMPLEMENTED_OPCODE)
306 : converter_(converter),
307 tmp_buffer_pos_(0),
308 abort_on_unimplemented_(
309 unimplemented_action == ABORT_ON_UNIMPLEMENTED_OPCODE),
310 rex_(0),
311 operand_size_(0),
312 group_1_prefix_(0),
313 byte_size_operand_(false) {
314 tmp_buffer_[0] = '\0';
315 }
316
317 virtual ~DisassemblerX64() {
318 }
319
320 // Writes one disassembled instruction into 'buffer' (0-terminated).
321 // Returns the length of the disassembled machine instruction in bytes.
322 int InstructionDecode(v8::internal::Vector<char> buffer, byte* instruction);
323
324 private:
325 enum OperandSize {
326 BYTE_SIZE = 0,
327 WORD_SIZE = 1,
328 DOUBLEWORD_SIZE = 2,
329 QUADWORD_SIZE = 3
330 };
331
332 const NameConverter& converter_;
333 v8::internal::EmbeddedVector<char, 128> tmp_buffer_;
334 unsigned int tmp_buffer_pos_;
335 bool abort_on_unimplemented_;
336 // Prefixes parsed
337 byte rex_;
338 byte operand_size_; // 0x66 or (if no group 3 prefix is present) 0x0.
339 byte group_1_prefix_; // 0xF2, 0xF3, or (if no group 1 prefix is present) 0.
340 // Byte size operand override.
341 bool byte_size_operand_;
342
343 void setRex(byte rex) {
344 ASSERT_EQ(0x40, rex & 0xF0);
345 rex_ = rex;
346 }
347
348 bool rex() { return rex_ != 0; }
349
350 bool rex_b() { return (rex_ & 0x01) != 0; }
351
352 // Actual number of base register given the low bits and the rex.b state.
353 int base_reg(int low_bits) { return low_bits | ((rex_ & 0x01) << 3); }
354
355 bool rex_x() { return (rex_ & 0x02) != 0; }
356
357 bool rex_r() { return (rex_ & 0x04) != 0; }
358
359 bool rex_w() { return (rex_ & 0x08) != 0; }
360
361 OperandSize operand_size() {
362 if (byte_size_operand_) return BYTE_SIZE;
363 if (rex_w()) return QUADWORD_SIZE;
364 if (operand_size_ != 0) return WORD_SIZE;
365 return DOUBLEWORD_SIZE;
366 }
367
368 char operand_size_code() {
369 return "bwlq"[operand_size()];
370 }
371
372 const char* NameOfCPURegister(int reg) const {
373 return converter_.NameOfCPURegister(reg);
374 }
375
376 const char* NameOfByteCPURegister(int reg) const {
377 return converter_.NameOfByteCPURegister(reg);
378 }
379
380 const char* NameOfXMMRegister(int reg) const {
381 return converter_.NameOfXMMRegister(reg);
382 }
383
384 const char* NameOfAddress(byte* addr) const {
385 return converter_.NameOfAddress(addr);
386 }
387
388 // Disassembler helper functions.
389 void get_modrm(byte data,
390 int* mod,
391 int* regop,
392 int* rm) {
393 *mod = (data >> 6) & 3;
394 *regop = ((data & 0x38) >> 3) | (rex_r() ? 8 : 0);
395 *rm = (data & 7) | (rex_b() ? 8 : 0);
396 }
397
398 void get_sib(byte data,
399 int* scale,
400 int* index,
401 int* base) {
402 *scale = (data >> 6) & 3;
403 *index = ((data >> 3) & 7) | (rex_x() ? 8 : 0);
404 *base = (data & 7) | (rex_b() ? 8 : 0);
405 }
406
407 typedef const char* (DisassemblerX64::*RegisterNameMapping)(int reg) const;
408
409 int PrintRightOperandHelper(byte* modrmp,
410 RegisterNameMapping register_name);
411 int PrintRightOperand(byte* modrmp);
412 int PrintRightByteOperand(byte* modrmp);
Steve Blockd0582a62009-12-15 09:54:21 +0000413 int PrintRightXMMOperand(byte* modrmp);
Steve Blocka7e24c12009-10-30 11:49:00 +0000414 int PrintOperands(const char* mnem,
415 OperandType op_order,
416 byte* data);
417 int PrintImmediate(byte* data, OperandSize size);
418 int PrintImmediateOp(byte* data);
419 const char* TwoByteMnemonic(byte opcode);
420 int TwoByteOpcodeInstruction(byte* data);
Steve Blockd0582a62009-12-15 09:54:21 +0000421 int F6F7Instruction(byte* data);
Steve Blocka7e24c12009-10-30 11:49:00 +0000422 int ShiftInstruction(byte* data);
423 int JumpShort(byte* data);
424 int JumpConditional(byte* data);
425 int JumpConditionalShort(byte* data);
426 int SetCC(byte* data);
427 int FPUInstruction(byte* data);
Steve Blockd0582a62009-12-15 09:54:21 +0000428 int MemoryFPUInstruction(int escape_opcode, int regop, byte* modrm_start);
429 int RegisterFPUInstruction(int escape_opcode, byte modrm_byte);
Steve Blocka7e24c12009-10-30 11:49:00 +0000430 void AppendToBuffer(const char* format, ...);
431
432 void UnimplementedInstruction() {
433 if (abort_on_unimplemented_) {
434 CHECK(false);
435 } else {
436 AppendToBuffer("'Unimplemented Instruction'");
437 }
438 }
439};
440
441
442void DisassemblerX64::AppendToBuffer(const char* format, ...) {
443 v8::internal::Vector<char> buf = tmp_buffer_ + tmp_buffer_pos_;
444 va_list args;
445 va_start(args, format);
446 int result = v8::internal::OS::VSNPrintF(buf, format, args);
447 va_end(args);
448 tmp_buffer_pos_ += result;
449}
450
451
452int DisassemblerX64::PrintRightOperandHelper(
453 byte* modrmp,
454 RegisterNameMapping register_name) {
455 int mod, regop, rm;
456 get_modrm(*modrmp, &mod, &regop, &rm);
457 switch (mod) {
458 case 0:
459 if ((rm & 7) == 5) {
460 int32_t disp = *reinterpret_cast<int32_t*>(modrmp + 1);
461 AppendToBuffer("[0x%x]", disp);
462 return 5;
463 } else if ((rm & 7) == 4) {
464 // Codes for SIB byte.
465 byte sib = *(modrmp + 1);
466 int scale, index, base;
467 get_sib(sib, &scale, &index, &base);
468 if (index == 4 && (base & 7) == 4 && scale == 0 /*times_1*/) {
469 // index == rsp means no index. Only use sib byte with no index for
470 // rsp and r12 base.
Steve Block8defd9f2010-07-08 12:39:36 +0100471 AppendToBuffer("[%s]", NameOfCPURegister(base));
Steve Blocka7e24c12009-10-30 11:49:00 +0000472 return 2;
473 } else if (base == 5) {
474 // base == rbp means no base register (when mod == 0).
475 int32_t disp = *reinterpret_cast<int32_t*>(modrmp + 2);
476 AppendToBuffer("[%s*%d+0x%x]",
Steve Block8defd9f2010-07-08 12:39:36 +0100477 NameOfCPURegister(index),
Steve Blocka7e24c12009-10-30 11:49:00 +0000478 1 << scale, disp);
479 return 6;
480 } else if (index != 4 && base != 5) {
481 // [base+index*scale]
482 AppendToBuffer("[%s+%s*%d]",
Steve Block8defd9f2010-07-08 12:39:36 +0100483 NameOfCPURegister(base),
484 NameOfCPURegister(index),
Steve Blocka7e24c12009-10-30 11:49:00 +0000485 1 << scale);
486 return 2;
487 } else {
488 UnimplementedInstruction();
489 return 1;
490 }
491 } else {
Steve Block8defd9f2010-07-08 12:39:36 +0100492 AppendToBuffer("[%s]", NameOfCPURegister(rm));
Steve Blocka7e24c12009-10-30 11:49:00 +0000493 return 1;
494 }
495 break;
496 case 1: // fall through
497 case 2:
498 if ((rm & 7) == 4) {
499 byte sib = *(modrmp + 1);
500 int scale, index, base;
501 get_sib(sib, &scale, &index, &base);
502 int disp = (mod == 2) ? *reinterpret_cast<int32_t*>(modrmp + 2)
503 : *reinterpret_cast<char*>(modrmp + 2);
504 if (index == 4 && (base & 7) == 4 && scale == 0 /*times_1*/) {
505 if (-disp > 0) {
Steve Block8defd9f2010-07-08 12:39:36 +0100506 AppendToBuffer("[%s-0x%x]", NameOfCPURegister(base), -disp);
Steve Blocka7e24c12009-10-30 11:49:00 +0000507 } else {
Steve Block8defd9f2010-07-08 12:39:36 +0100508 AppendToBuffer("[%s+0x%x]", NameOfCPURegister(base), disp);
Steve Blocka7e24c12009-10-30 11:49:00 +0000509 }
510 } else {
511 if (-disp > 0) {
512 AppendToBuffer("[%s+%s*%d-0x%x]",
Steve Block8defd9f2010-07-08 12:39:36 +0100513 NameOfCPURegister(base),
514 NameOfCPURegister(index),
Steve Blocka7e24c12009-10-30 11:49:00 +0000515 1 << scale,
516 -disp);
517 } else {
518 AppendToBuffer("[%s+%s*%d+0x%x]",
Steve Block8defd9f2010-07-08 12:39:36 +0100519 NameOfCPURegister(base),
520 NameOfCPURegister(index),
Steve Blocka7e24c12009-10-30 11:49:00 +0000521 1 << scale,
522 disp);
523 }
524 }
525 return mod == 2 ? 6 : 3;
526 } else {
527 // No sib.
528 int disp = (mod == 2) ? *reinterpret_cast<int32_t*>(modrmp + 1)
529 : *reinterpret_cast<char*>(modrmp + 1);
530 if (-disp > 0) {
Steve Block8defd9f2010-07-08 12:39:36 +0100531 AppendToBuffer("[%s-0x%x]", NameOfCPURegister(rm), -disp);
Steve Blocka7e24c12009-10-30 11:49:00 +0000532 } else {
Steve Block8defd9f2010-07-08 12:39:36 +0100533 AppendToBuffer("[%s+0x%x]", NameOfCPURegister(rm), disp);
Steve Blocka7e24c12009-10-30 11:49:00 +0000534 }
535 return (mod == 2) ? 5 : 2;
536 }
537 break;
538 case 3:
539 AppendToBuffer("%s", (this->*register_name)(rm));
540 return 1;
541 default:
542 UnimplementedInstruction();
543 return 1;
544 }
545 UNREACHABLE();
546}
547
548
549int DisassemblerX64::PrintImmediate(byte* data, OperandSize size) {
550 int64_t value;
551 int count;
552 switch (size) {
553 case BYTE_SIZE:
554 value = *data;
555 count = 1;
556 break;
557 case WORD_SIZE:
558 value = *reinterpret_cast<int16_t*>(data);
559 count = 2;
560 break;
561 case DOUBLEWORD_SIZE:
562 value = *reinterpret_cast<uint32_t*>(data);
563 count = 4;
564 break;
565 case QUADWORD_SIZE:
566 value = *reinterpret_cast<int32_t*>(data);
567 count = 4;
568 break;
569 default:
570 UNREACHABLE();
571 value = 0; // Initialize variables on all paths to satisfy the compiler.
572 count = 0;
573 }
574 AppendToBuffer("%" V8_PTR_PREFIX "x", value);
575 return count;
576}
577
578
579int DisassemblerX64::PrintRightOperand(byte* modrmp) {
580 return PrintRightOperandHelper(modrmp,
581 &DisassemblerX64::NameOfCPURegister);
582}
583
584
585int DisassemblerX64::PrintRightByteOperand(byte* modrmp) {
586 return PrintRightOperandHelper(modrmp,
587 &DisassemblerX64::NameOfByteCPURegister);
588}
589
590
Steve Blockd0582a62009-12-15 09:54:21 +0000591int DisassemblerX64::PrintRightXMMOperand(byte* modrmp) {
592 return PrintRightOperandHelper(modrmp,
593 &DisassemblerX64::NameOfXMMRegister);
594}
595
596
Steve Blocka7e24c12009-10-30 11:49:00 +0000597// Returns number of bytes used including the current *data.
598// Writes instruction's mnemonic, left and right operands to 'tmp_buffer_'.
599int DisassemblerX64::PrintOperands(const char* mnem,
600 OperandType op_order,
601 byte* data) {
602 byte modrm = *data;
603 int mod, regop, rm;
604 get_modrm(modrm, &mod, &regop, &rm);
605 int advance = 0;
606 const char* register_name =
607 byte_size_operand_ ? NameOfByteCPURegister(regop)
608 : NameOfCPURegister(regop);
609 switch (op_order) {
610 case REG_OPER_OP_ORDER: {
611 AppendToBuffer("%s%c %s,",
612 mnem,
613 operand_size_code(),
614 register_name);
615 advance = byte_size_operand_ ? PrintRightByteOperand(data)
616 : PrintRightOperand(data);
617 break;
618 }
619 case OPER_REG_OP_ORDER: {
620 AppendToBuffer("%s%c ", mnem, operand_size_code());
621 advance = byte_size_operand_ ? PrintRightByteOperand(data)
622 : PrintRightOperand(data);
623 AppendToBuffer(",%s", register_name);
624 break;
625 }
626 default:
627 UNREACHABLE();
628 break;
629 }
630 return advance;
631}
632
633
634// Returns number of bytes used by machine instruction, including *data byte.
635// Writes immediate instructions to 'tmp_buffer_'.
636int DisassemblerX64::PrintImmediateOp(byte* data) {
637 bool byte_size_immediate = (*data & 0x02) != 0;
638 byte modrm = *(data + 1);
639 int mod, regop, rm;
640 get_modrm(modrm, &mod, &regop, &rm);
641 const char* mnem = "Imm???";
642 switch (regop) {
643 case 0:
644 mnem = "add";
645 break;
646 case 1:
647 mnem = "or";
648 break;
649 case 2:
650 mnem = "adc";
651 break;
652 case 4:
653 mnem = "and";
654 break;
655 case 5:
656 mnem = "sub";
657 break;
658 case 6:
659 mnem = "xor";
660 break;
661 case 7:
662 mnem = "cmp";
663 break;
664 default:
665 UnimplementedInstruction();
666 }
667 AppendToBuffer("%s%c ", mnem, operand_size_code());
668 int count = PrintRightOperand(data + 1);
669 AppendToBuffer(",0x");
670 OperandSize immediate_size = byte_size_immediate ? BYTE_SIZE : operand_size();
671 count += PrintImmediate(data + 1 + count, immediate_size);
672 return 1 + count;
673}
674
675
676// Returns number of bytes used, including *data.
Steve Blockd0582a62009-12-15 09:54:21 +0000677int DisassemblerX64::F6F7Instruction(byte* data) {
678 ASSERT(*data == 0xF7 || *data == 0xF6);
Steve Blocka7e24c12009-10-30 11:49:00 +0000679 byte modrm = *(data + 1);
680 int mod, regop, rm;
681 get_modrm(modrm, &mod, &regop, &rm);
682 if (mod == 3 && regop != 0) {
683 const char* mnem = NULL;
684 switch (regop) {
685 case 2:
686 mnem = "not";
687 break;
688 case 3:
689 mnem = "neg";
690 break;
691 case 4:
692 mnem = "mul";
693 break;
694 case 7:
695 mnem = "idiv";
696 break;
697 default:
698 UnimplementedInstruction();
699 }
700 AppendToBuffer("%s%c %s",
701 mnem,
702 operand_size_code(),
703 NameOfCPURegister(rm));
704 return 2;
Steve Blocka7e24c12009-10-30 11:49:00 +0000705 } else if (regop == 0) {
706 AppendToBuffer("test%c ", operand_size_code());
Steve Blockd0582a62009-12-15 09:54:21 +0000707 int count = PrintRightOperand(data + 1); // Use name of 64-bit register.
708 AppendToBuffer(",0x");
709 count += PrintImmediate(data + 1 + count, operand_size());
710 return 1 + count;
Steve Blocka7e24c12009-10-30 11:49:00 +0000711 } else {
712 UnimplementedInstruction();
713 return 2;
714 }
715}
716
717
718int DisassemblerX64::ShiftInstruction(byte* data) {
719 byte op = *data & (~1);
720 if (op != 0xD0 && op != 0xD2 && op != 0xC0) {
721 UnimplementedInstruction();
722 return 1;
723 }
724 byte modrm = *(data + 1);
725 int mod, regop, rm;
726 get_modrm(modrm, &mod, &regop, &rm);
727 regop &= 0x7; // The REX.R bit does not affect the operation.
728 int imm8 = -1;
729 int num_bytes = 2;
730 if (mod != 3) {
731 UnimplementedInstruction();
732 return num_bytes;
733 }
734 const char* mnem = NULL;
735 switch (regop) {
736 case 0:
737 mnem = "rol";
738 break;
739 case 1:
740 mnem = "ror";
741 break;
742 case 2:
743 mnem = "rcl";
744 break;
745 case 3:
746 mnem = "rcr";
747 break;
748 case 4:
749 mnem = "shl";
750 break;
751 case 5:
752 mnem = "shr";
753 break;
754 case 7:
755 mnem = "sar";
756 break;
757 default:
758 UnimplementedInstruction();
759 return num_bytes;
760 }
Steve Blockd0582a62009-12-15 09:54:21 +0000761 ASSERT_NE(NULL, mnem);
Steve Blocka7e24c12009-10-30 11:49:00 +0000762 if (op == 0xD0) {
763 imm8 = 1;
764 } else if (op == 0xC0) {
765 imm8 = *(data + 2);
766 num_bytes = 3;
767 }
768 AppendToBuffer("%s%c %s,",
769 mnem,
770 operand_size_code(),
771 byte_size_operand_ ? NameOfByteCPURegister(rm)
772 : NameOfCPURegister(rm));
773 if (op == 0xD2) {
774 AppendToBuffer("cl");
775 } else {
776 AppendToBuffer("%d", imm8);
777 }
778 return num_bytes;
779}
780
781
782// Returns number of bytes used, including *data.
783int DisassemblerX64::JumpShort(byte* data) {
Steve Blockd0582a62009-12-15 09:54:21 +0000784 ASSERT_EQ(0xEB, *data);
Steve Blocka7e24c12009-10-30 11:49:00 +0000785 byte b = *(data + 1);
786 byte* dest = data + static_cast<int8_t>(b) + 2;
787 AppendToBuffer("jmp %s", NameOfAddress(dest));
788 return 2;
789}
790
791
792// Returns number of bytes used, including *data.
793int DisassemblerX64::JumpConditional(byte* data) {
Steve Blockd0582a62009-12-15 09:54:21 +0000794 ASSERT_EQ(0x0F, *data);
Steve Blocka7e24c12009-10-30 11:49:00 +0000795 byte cond = *(data + 1) & 0x0F;
796 byte* dest = data + *reinterpret_cast<int32_t*>(data + 2) + 6;
797 const char* mnem = conditional_code_suffix[cond];
798 AppendToBuffer("j%s %s", mnem, NameOfAddress(dest));
799 return 6; // includes 0x0F
800}
801
802
803// Returns number of bytes used, including *data.
804int DisassemblerX64::JumpConditionalShort(byte* data) {
805 byte cond = *data & 0x0F;
806 byte b = *(data + 1);
807 byte* dest = data + static_cast<int8_t>(b) + 2;
808 const char* mnem = conditional_code_suffix[cond];
809 AppendToBuffer("j%s %s", mnem, NameOfAddress(dest));
810 return 2;
811}
812
813
814// Returns number of bytes used, including *data.
815int DisassemblerX64::SetCC(byte* data) {
Steve Blockd0582a62009-12-15 09:54:21 +0000816 ASSERT_EQ(0x0F, *data);
Steve Blocka7e24c12009-10-30 11:49:00 +0000817 byte cond = *(data + 1) & 0x0F;
818 const char* mnem = conditional_code_suffix[cond];
819 AppendToBuffer("set%s%c ", mnem, operand_size_code());
820 PrintRightByteOperand(data + 2);
821 return 3; // includes 0x0F
822}
823
824
825// Returns number of bytes used, including *data.
826int DisassemblerX64::FPUInstruction(byte* data) {
Steve Blockd0582a62009-12-15 09:54:21 +0000827 byte escape_opcode = *data;
828 ASSERT_EQ(0xD8, escape_opcode & 0xF8);
829 byte modrm_byte = *(data+1);
830
831 if (modrm_byte >= 0xC0) {
832 return RegisterFPUInstruction(escape_opcode, modrm_byte);
833 } else {
834 return MemoryFPUInstruction(escape_opcode, modrm_byte, data+1);
Steve Blocka7e24c12009-10-30 11:49:00 +0000835 }
Steve Blockd0582a62009-12-15 09:54:21 +0000836}
837
838int DisassemblerX64::MemoryFPUInstruction(int escape_opcode,
839 int modrm_byte,
840 byte* modrm_start) {
841 const char* mnem = "?";
842 int regop = (modrm_byte >> 3) & 0x7; // reg/op field of modrm byte.
843 switch (escape_opcode) {
844 case 0xD9: switch (regop) {
845 case 0: mnem = "fld_s"; break;
846 case 3: mnem = "fstp_s"; break;
847 case 7: mnem = "fstcw"; break;
848 default: UnimplementedInstruction();
849 }
850 break;
851
852 case 0xDB: switch (regop) {
853 case 0: mnem = "fild_s"; break;
854 case 1: mnem = "fisttp_s"; break;
855 case 2: mnem = "fist_s"; break;
856 case 3: mnem = "fistp_s"; break;
857 default: UnimplementedInstruction();
858 }
859 break;
860
861 case 0xDD: switch (regop) {
862 case 0: mnem = "fld_d"; break;
863 case 3: mnem = "fstp_d"; break;
864 default: UnimplementedInstruction();
865 }
866 break;
867
868 case 0xDF: switch (regop) {
869 case 5: mnem = "fild_d"; break;
870 case 7: mnem = "fistp_d"; break;
871 default: UnimplementedInstruction();
872 }
873 break;
874
875 default: UnimplementedInstruction();
876 }
877 AppendToBuffer("%s ", mnem);
878 int count = PrintRightOperand(modrm_start);
879 return count + 1;
880}
881
882int DisassemblerX64::RegisterFPUInstruction(int escape_opcode,
883 byte modrm_byte) {
884 bool has_register = false; // Is the FPU register encoded in modrm_byte?
885 const char* mnem = "?";
886
887 switch (escape_opcode) {
888 case 0xD8:
889 UnimplementedInstruction();
890 break;
891
892 case 0xD9:
893 switch (modrm_byte & 0xF8) {
Kristian Monsen0d5e1162010-09-30 15:31:59 +0100894 case 0xC0:
895 mnem = "fld";
896 has_register = true;
897 break;
Steve Blockd0582a62009-12-15 09:54:21 +0000898 case 0xC8:
899 mnem = "fxch";
900 has_register = true;
901 break;
902 default:
903 switch (modrm_byte) {
904 case 0xE0: mnem = "fchs"; break;
905 case 0xE1: mnem = "fabs"; break;
906 case 0xE4: mnem = "ftst"; break;
907 case 0xE8: mnem = "fld1"; break;
Kristian Monsen0d5e1162010-09-30 15:31:59 +0100908 case 0xEB: mnem = "fldpi"; break;
Ben Murdochb0fe1622011-05-05 13:52:32 +0100909 case 0xED: mnem = "fldln2"; break;
Steve Blockd0582a62009-12-15 09:54:21 +0000910 case 0xEE: mnem = "fldz"; break;
Ben Murdochb0fe1622011-05-05 13:52:32 +0100911 case 0xF1: mnem = "fyl2x"; break;
Steve Blockd0582a62009-12-15 09:54:21 +0000912 case 0xF5: mnem = "fprem1"; break;
913 case 0xF7: mnem = "fincstp"; break;
914 case 0xF8: mnem = "fprem"; break;
915 case 0xFE: mnem = "fsin"; break;
916 case 0xFF: mnem = "fcos"; break;
917 default: UnimplementedInstruction();
918 }
919 }
920 break;
921
922 case 0xDA:
923 if (modrm_byte == 0xE9) {
924 mnem = "fucompp";
925 } else {
926 UnimplementedInstruction();
927 }
928 break;
929
930 case 0xDB:
931 if ((modrm_byte & 0xF8) == 0xE8) {
932 mnem = "fucomi";
933 has_register = true;
934 } else if (modrm_byte == 0xE2) {
935 mnem = "fclex";
936 } else {
937 UnimplementedInstruction();
938 }
939 break;
940
941 case 0xDC:
942 has_register = true;
943 switch (modrm_byte & 0xF8) {
944 case 0xC0: mnem = "fadd"; break;
945 case 0xE8: mnem = "fsub"; break;
946 case 0xC8: mnem = "fmul"; break;
947 case 0xF8: mnem = "fdiv"; break;
948 default: UnimplementedInstruction();
949 }
950 break;
951
952 case 0xDD:
953 has_register = true;
954 switch (modrm_byte & 0xF8) {
955 case 0xC0: mnem = "ffree"; break;
956 case 0xD8: mnem = "fstp"; break;
957 default: UnimplementedInstruction();
958 }
959 break;
960
961 case 0xDE:
962 if (modrm_byte == 0xD9) {
963 mnem = "fcompp";
964 } else {
965 has_register = true;
966 switch (modrm_byte & 0xF8) {
967 case 0xC0: mnem = "faddp"; break;
968 case 0xE8: mnem = "fsubp"; break;
969 case 0xC8: mnem = "fmulp"; break;
970 case 0xF8: mnem = "fdivp"; break;
971 default: UnimplementedInstruction();
972 }
973 }
974 break;
975
976 case 0xDF:
977 if (modrm_byte == 0xE0) {
978 mnem = "fnstsw_ax";
979 } else if ((modrm_byte & 0xF8) == 0xE8) {
980 mnem = "fucomip";
981 has_register = true;
982 }
983 break;
984
985 default: UnimplementedInstruction();
986 }
987
988 if (has_register) {
989 AppendToBuffer("%s st%d", mnem, modrm_byte & 0x7);
990 } else {
991 AppendToBuffer("%s", mnem);
992 }
Steve Blocka7e24c12009-10-30 11:49:00 +0000993 return 2;
994}
995
996
Steve Blockd0582a62009-12-15 09:54:21 +0000997
Steve Blocka7e24c12009-10-30 11:49:00 +0000998// Handle all two-byte opcodes, which start with 0x0F.
999// These instructions may be affected by an 0x66, 0xF2, or 0xF3 prefix.
1000// We do not use any three-byte opcodes, which start with 0x0F38 or 0x0F3A.
1001int DisassemblerX64::TwoByteOpcodeInstruction(byte* data) {
1002 byte opcode = *(data + 1);
1003 byte* current = data + 2;
1004 // At return, "current" points to the start of the next instruction.
1005 const char* mnemonic = TwoByteMnemonic(opcode);
Andrei Popescu402d9372010-02-26 13:31:12 +00001006 if (operand_size_ == 0x66) {
1007 // 0x66 0x0F prefix.
Steve Blocka7e24c12009-10-30 11:49:00 +00001008 int mod, regop, rm;
Steve Block6ded16b2010-05-10 14:33:55 +01001009 if (opcode == 0x3A) {
1010 byte third_byte = *current;
1011 current = data + 3;
1012 if (third_byte == 0x17) {
1013 get_modrm(*current, &mod, &regop, &rm);
1014 AppendToBuffer("extractps "); // reg/m32, xmm, imm8
1015 current += PrintRightOperand(current);
1016 AppendToBuffer(", %s, %d", NameOfCPURegister(regop), (*current) & 3);
1017 current += 1;
1018 } else {
1019 UnimplementedInstruction();
1020 }
Steve Blocka7e24c12009-10-30 11:49:00 +00001021 } else {
Steve Block6ded16b2010-05-10 14:33:55 +01001022 get_modrm(*current, &mod, &regop, &rm);
1023 if (opcode == 0x6E) {
1024 AppendToBuffer("mov%c %s,",
1025 rex_w() ? 'q' : 'd',
1026 NameOfXMMRegister(regop));
1027 current += PrintRightOperand(current);
Steve Block1e0659c2011-05-24 12:43:12 +01001028 } else if (opcode == 0x6F) {
1029 AppendToBuffer("movdqa %s,",
1030 NameOfXMMRegister(regop));
1031 current += PrintRightOperand(current);
Steve Block6ded16b2010-05-10 14:33:55 +01001032 } else if (opcode == 0x7E) {
Ben Murdochbb769b22010-08-11 14:56:33 +01001033 AppendToBuffer("mov%c ",
1034 rex_w() ? 'q' : 'd');
1035 current += PrintRightOperand(current);
1036 AppendToBuffer(", %s", NameOfXMMRegister(regop));
Steve Block1e0659c2011-05-24 12:43:12 +01001037 } else if (opcode == 0x7F) {
1038 AppendToBuffer("movdqa ");
1039 current += PrintRightOperand(current);
1040 AppendToBuffer(", %s", NameOfXMMRegister(regop));
Steve Block6ded16b2010-05-10 14:33:55 +01001041 } else {
1042 const char* mnemonic = "?";
1043 if (opcode == 0x57) {
1044 mnemonic = "xorpd";
1045 } else if (opcode == 0x2E) {
Steve Block6ded16b2010-05-10 14:33:55 +01001046 mnemonic = "ucomisd";
Steve Block8defd9f2010-07-08 12:39:36 +01001047 } else if (opcode == 0x2F) {
1048 mnemonic = "comisd";
Steve Block1e0659c2011-05-24 12:43:12 +01001049 } else if (opcode == 0x50) {
1050 mnemonic = "movmskpd";
Steve Block6ded16b2010-05-10 14:33:55 +01001051 } else {
1052 UnimplementedInstruction();
1053 }
1054 AppendToBuffer("%s %s,", mnemonic, NameOfXMMRegister(regop));
1055 current += PrintRightXMMOperand(current);
1056 }
Steve Blocka7e24c12009-10-30 11:49:00 +00001057 }
1058 } else if (group_1_prefix_ == 0xF2) {
1059 // Beginning of instructions with prefix 0xF2.
1060
1061 if (opcode == 0x11 || opcode == 0x10) {
1062 // MOVSD: Move scalar double-precision fp to/from/between XMM registers.
1063 AppendToBuffer("movsd ");
1064 int mod, regop, rm;
1065 get_modrm(*current, &mod, &regop, &rm);
1066 if (opcode == 0x11) {
1067 current += PrintRightOperand(current);
1068 AppendToBuffer(",%s", NameOfXMMRegister(regop));
1069 } else {
1070 AppendToBuffer("%s,", NameOfXMMRegister(regop));
1071 current += PrintRightOperand(current);
1072 }
1073 } else if (opcode == 0x2A) {
1074 // CVTSI2SD: integer to XMM double conversion.
1075 int mod, regop, rm;
1076 get_modrm(*current, &mod, &regop, &rm);
Steve Block8defd9f2010-07-08 12:39:36 +01001077 AppendToBuffer("%sd %s,", mnemonic, NameOfXMMRegister(regop));
Steve Blockd0582a62009-12-15 09:54:21 +00001078 current += PrintRightOperand(current);
Kristian Monsen0d5e1162010-09-30 15:31:59 +01001079 } else if (opcode == 0x2C) {
1080 // CVTTSD2SI:
1081 // Convert with truncation scalar double-precision FP to integer.
1082 int mod, regop, rm;
1083 get_modrm(*current, &mod, &regop, &rm);
1084 AppendToBuffer("cvttsd2si%c %s,",
1085 operand_size_code(), NameOfCPURegister(regop));
1086 current += PrintRightXMMOperand(current);
1087 } else if (opcode == 0x2D) {
1088 // CVTSD2SI: Convert scalar double-precision FP to integer.
1089 int mod, regop, rm;
1090 get_modrm(*current, &mod, &regop, &rm);
1091 AppendToBuffer("cvtsd2si%c %s,",
1092 operand_size_code(), NameOfCPURegister(regop));
1093 current += PrintRightXMMOperand(current);
Steve Block6ded16b2010-05-10 14:33:55 +01001094 } else if ((opcode & 0xF8) == 0x58 || opcode == 0x51) {
Steve Blocka7e24c12009-10-30 11:49:00 +00001095 // XMM arithmetic. Mnemonic was retrieved at the start of this function.
1096 int mod, regop, rm;
1097 get_modrm(*current, &mod, &regop, &rm);
Steve Blockd0582a62009-12-15 09:54:21 +00001098 AppendToBuffer("%s %s,", mnemonic, NameOfXMMRegister(regop));
1099 current += PrintRightXMMOperand(current);
Steve Blocka7e24c12009-10-30 11:49:00 +00001100 } else {
1101 UnimplementedInstruction();
1102 }
Steve Block6ded16b2010-05-10 14:33:55 +01001103 } else if (group_1_prefix_ == 0xF3) {
1104 // Instructions with prefix 0xF3.
Steve Block8defd9f2010-07-08 12:39:36 +01001105 if (opcode == 0x11 || opcode == 0x10) {
1106 // MOVSS: Move scalar double-precision fp to/from/between XMM registers.
1107 AppendToBuffer("movss ");
1108 int mod, regop, rm;
1109 get_modrm(*current, &mod, &regop, &rm);
1110 if (opcode == 0x11) {
1111 current += PrintRightOperand(current);
1112 AppendToBuffer(",%s", NameOfXMMRegister(regop));
1113 } else {
1114 AppendToBuffer("%s,", NameOfXMMRegister(regop));
1115 current += PrintRightOperand(current);
1116 }
1117 } else if (opcode == 0x2A) {
1118 // CVTSI2SS: integer to XMM single conversion.
1119 int mod, regop, rm;
1120 get_modrm(*current, &mod, &regop, &rm);
1121 AppendToBuffer("%ss %s,", mnemonic, NameOfXMMRegister(regop));
1122 current += PrintRightOperand(current);
1123 } else if (opcode == 0x2C) {
Kristian Monsen0d5e1162010-09-30 15:31:59 +01001124 // CVTTSS2SI:
1125 // Convert with truncation scalar single-precision FP to dword integer.
Steve Block1e0659c2011-05-24 12:43:12 +01001126 int mod, regop, rm;
1127 get_modrm(*current, &mod, &regop, &rm);
1128 AppendToBuffer("cvttss2si%c %s,",
1129 operand_size_code(), NameOfCPURegister(regop));
1130 current += PrintRightXMMOperand(current);
Steve Block6ded16b2010-05-10 14:33:55 +01001131 } else if (opcode == 0x5A) {
Kristian Monsen0d5e1162010-09-30 15:31:59 +01001132 // CVTSS2SD:
1133 // Convert scalar single-precision FP to scalar double-precision FP.
Steve Block6ded16b2010-05-10 14:33:55 +01001134 int mod, regop, rm;
1135 get_modrm(*current, &mod, &regop, &rm);
1136 AppendToBuffer("cvtss2sd %s,", NameOfXMMRegister(regop));
1137 current += PrintRightXMMOperand(current);
1138 } else {
1139 UnimplementedInstruction();
1140 }
Andrei Popescu402d9372010-02-26 13:31:12 +00001141 } else if (opcode == 0x1F) {
1142 // NOP
1143 int mod, regop, rm;
1144 get_modrm(*current, &mod, &regop, &rm);
1145 current++;
1146 if (regop == 4) { // SIB byte present.
1147 current++;
1148 }
1149 if (mod == 1) { // Byte displacement.
1150 current += 1;
1151 } else if (mod == 2) { // 32-bit displacement.
1152 current += 4;
1153 } // else no immediate displacement.
1154 AppendToBuffer("nop");
1155 } else if (opcode == 0xA2 || opcode == 0x31) {
1156 // RDTSC or CPUID
1157 AppendToBuffer("%s", mnemonic);
1158
1159 } else if ((opcode & 0xF0) == 0x40) {
1160 // CMOVcc: conditional move.
1161 int condition = opcode & 0x0F;
1162 const InstructionDesc& idesc = cmov_instructions[condition];
1163 byte_size_operand_ = idesc.byte_size_operation;
1164 current += PrintOperands(idesc.mnem, idesc.op_order_, current);
1165
1166 } else if ((opcode & 0xF0) == 0x80) {
1167 // Jcc: Conditional jump (branch).
1168 current = data + JumpConditional(data);
1169
1170 } else if (opcode == 0xBE || opcode == 0xBF || opcode == 0xB6 ||
1171 opcode == 0xB7 || opcode == 0xAF) {
1172 // Size-extending moves, IMUL.
1173 current += PrintOperands(mnemonic, REG_OPER_OP_ORDER, current);
1174
1175 } else if ((opcode & 0xF0) == 0x90) {
1176 // SETcc: Set byte on condition. Needs pointer to beginning of instruction.
1177 current = data + SetCC(data);
1178
1179 } else if (opcode == 0xAB || opcode == 0xA5 || opcode == 0xAD) {
1180 // SHLD, SHRD (double-precision shift), BTS (bit set).
1181 AppendToBuffer("%s ", mnemonic);
1182 int mod, regop, rm;
1183 get_modrm(*current, &mod, &regop, &rm);
1184 current += PrintRightOperand(current);
1185 if (opcode == 0xAB) {
1186 AppendToBuffer(",%s", NameOfCPURegister(regop));
1187 } else {
1188 AppendToBuffer(",%s,cl", NameOfCPURegister(regop));
1189 }
Steve Blocka7e24c12009-10-30 11:49:00 +00001190 } else {
1191 UnimplementedInstruction();
1192 }
Steve Blockd0582a62009-12-15 09:54:21 +00001193 return static_cast<int>(current - data);
Steve Blocka7e24c12009-10-30 11:49:00 +00001194}
1195
1196
1197// Mnemonics for two-byte opcode instructions starting with 0x0F.
1198// The argument is the second byte of the two-byte opcode.
1199// Returns NULL if the instruction is not handled here.
1200const char* DisassemblerX64::TwoByteMnemonic(byte opcode) {
1201 switch (opcode) {
1202 case 0x1F:
1203 return "nop";
Steve Block8defd9f2010-07-08 12:39:36 +01001204 case 0x2A: // F2/F3 prefix.
1205 return "cvtsi2s";
Steve Blocka7e24c12009-10-30 11:49:00 +00001206 case 0x31:
1207 return "rdtsc";
Steve Block6ded16b2010-05-10 14:33:55 +01001208 case 0x51: // F2 prefix.
1209 return "sqrtsd";
Steve Blocka7e24c12009-10-30 11:49:00 +00001210 case 0x58: // F2 prefix.
1211 return "addsd";
1212 case 0x59: // F2 prefix.
1213 return "mulsd";
1214 case 0x5C: // F2 prefix.
1215 return "subsd";
1216 case 0x5E: // F2 prefix.
1217 return "divsd";
1218 case 0xA2:
1219 return "cpuid";
1220 case 0xA5:
1221 return "shld";
1222 case 0xAB:
1223 return "bts";
1224 case 0xAD:
1225 return "shrd";
1226 case 0xAF:
1227 return "imul";
1228 case 0xB6:
1229 return "movzxb";
1230 case 0xB7:
1231 return "movzxw";
1232 case 0xBE:
1233 return "movsxb";
1234 case 0xBF:
1235 return "movsxw";
1236 default:
1237 return NULL;
1238 }
1239}
1240
1241
1242// Disassembles the instruction at instr, and writes it into out_buffer.
1243int DisassemblerX64::InstructionDecode(v8::internal::Vector<char> out_buffer,
1244 byte* instr) {
1245 tmp_buffer_pos_ = 0; // starting to write as position 0
1246 byte* data = instr;
1247 bool processed = true; // Will be set to false if the current instruction
1248 // is not in 'instructions' table.
1249 byte current;
1250
1251 // Scan for prefixes.
1252 while (true) {
1253 current = *data;
Leon Clarked91b9f72010-01-27 17:25:45 +00001254 if (current == OPERAND_SIZE_OVERRIDE_PREFIX) { // Group 3 prefix.
Steve Blocka7e24c12009-10-30 11:49:00 +00001255 operand_size_ = current;
1256 } else if ((current & 0xF0) == 0x40) { // REX prefix.
1257 setRex(current);
1258 if (rex_w()) AppendToBuffer("REX.W ");
Leon Clarked91b9f72010-01-27 17:25:45 +00001259 } else if ((current & 0xFE) == 0xF2) { // Group 1 prefix (0xF2 or 0xF3).
Steve Blocka7e24c12009-10-30 11:49:00 +00001260 group_1_prefix_ = current;
1261 } else { // Not a prefix - an opcode.
1262 break;
1263 }
1264 data++;
1265 }
1266
1267 const InstructionDesc& idesc = instruction_table.Get(current);
1268 byte_size_operand_ = idesc.byte_size_operation;
1269 switch (idesc.type) {
1270 case ZERO_OPERANDS_INSTR:
Leon Clarked91b9f72010-01-27 17:25:45 +00001271 if (current >= 0xA4 && current <= 0xA7) {
1272 // String move or compare operations.
1273 if (group_1_prefix_ == REP_PREFIX) {
1274 // REP.
1275 AppendToBuffer("rep ");
1276 }
1277 if (rex_w()) AppendToBuffer("REX.W ");
1278 AppendToBuffer("%s%c", idesc.mnem, operand_size_code());
1279 } else {
1280 AppendToBuffer("%s", idesc.mnem, operand_size_code());
1281 }
Steve Blocka7e24c12009-10-30 11:49:00 +00001282 data++;
1283 break;
1284
1285 case TWO_OPERANDS_INSTR:
1286 data++;
1287 data += PrintOperands(idesc.mnem, idesc.op_order_, data);
1288 break;
1289
1290 case JUMP_CONDITIONAL_SHORT_INSTR:
1291 data += JumpConditionalShort(data);
1292 break;
1293
1294 case REGISTER_INSTR:
1295 AppendToBuffer("%s%c %s",
1296 idesc.mnem,
1297 operand_size_code(),
1298 NameOfCPURegister(base_reg(current & 0x07)));
1299 data++;
1300 break;
1301 case PUSHPOP_INSTR:
1302 AppendToBuffer("%s %s",
1303 idesc.mnem,
1304 NameOfCPURegister(base_reg(current & 0x07)));
1305 data++;
1306 break;
1307 case MOVE_REG_INSTR: {
1308 byte* addr = NULL;
1309 switch (operand_size()) {
1310 case WORD_SIZE:
1311 addr = reinterpret_cast<byte*>(*reinterpret_cast<int16_t*>(data + 1));
1312 data += 3;
1313 break;
1314 case DOUBLEWORD_SIZE:
1315 addr = reinterpret_cast<byte*>(*reinterpret_cast<int32_t*>(data + 1));
1316 data += 5;
1317 break;
1318 case QUADWORD_SIZE:
1319 addr = reinterpret_cast<byte*>(*reinterpret_cast<int64_t*>(data + 1));
1320 data += 9;
1321 break;
1322 default:
1323 UNREACHABLE();
1324 }
1325 AppendToBuffer("mov%c %s,%s",
1326 operand_size_code(),
1327 NameOfCPURegister(base_reg(current & 0x07)),
1328 NameOfAddress(addr));
1329 break;
1330 }
1331
1332 case CALL_JUMP_INSTR: {
1333 byte* addr = data + *reinterpret_cast<int32_t*>(data + 1) + 5;
1334 AppendToBuffer("%s %s", idesc.mnem, NameOfAddress(addr));
1335 data += 5;
1336 break;
1337 }
1338
1339 case SHORT_IMMEDIATE_INSTR: {
1340 byte* addr =
1341 reinterpret_cast<byte*>(*reinterpret_cast<int32_t*>(data + 1));
1342 AppendToBuffer("%s rax, %s", idesc.mnem, NameOfAddress(addr));
1343 data += 5;
1344 break;
1345 }
1346
1347 case NO_INSTR:
1348 processed = false;
1349 break;
1350
1351 default:
1352 UNIMPLEMENTED(); // This type is not implemented.
1353 }
1354
1355 // The first byte didn't match any of the simple opcodes, so we
1356 // need to do special processing on it.
1357 if (!processed) {
1358 switch (*data) {
1359 case 0xC2:
1360 AppendToBuffer("ret 0x%x", *reinterpret_cast<uint16_t*>(data + 1));
1361 data += 3;
1362 break;
1363
1364 case 0x69: // fall through
1365 case 0x6B: {
1366 int mod, regop, rm;
1367 get_modrm(*(data + 1), &mod, &regop, &rm);
1368 int32_t imm = *data == 0x6B ? *(data + 2)
1369 : *reinterpret_cast<int32_t*>(data + 2);
Steve Block6ded16b2010-05-10 14:33:55 +01001370 AppendToBuffer("imul%c %s,%s,0x%x",
1371 operand_size_code(),
1372 NameOfCPURegister(regop),
Steve Blocka7e24c12009-10-30 11:49:00 +00001373 NameOfCPURegister(rm), imm);
1374 data += 2 + (*data == 0x6B ? 1 : 4);
1375 break;
1376 }
1377
Steve Blocka7e24c12009-10-30 11:49:00 +00001378 case 0x81: // fall through
1379 case 0x83: // 0x81 with sign extension bit set
1380 data += PrintImmediateOp(data);
1381 break;
1382
1383 case 0x0F:
1384 data += TwoByteOpcodeInstruction(data);
1385 break;
1386
1387 case 0x8F: {
1388 data++;
1389 int mod, regop, rm;
1390 get_modrm(*data, &mod, &regop, &rm);
1391 if (regop == 0) {
1392 AppendToBuffer("pop ");
1393 data += PrintRightOperand(data);
1394 }
1395 }
1396 break;
1397
1398 case 0xFF: {
1399 data++;
1400 int mod, regop, rm;
1401 get_modrm(*data, &mod, &regop, &rm);
1402 const char* mnem = NULL;
1403 switch (regop) {
1404 case 0:
1405 mnem = "inc";
1406 break;
1407 case 1:
1408 mnem = "dec";
1409 break;
1410 case 2:
1411 mnem = "call";
1412 break;
1413 case 4:
1414 mnem = "jmp";
1415 break;
1416 case 6:
1417 mnem = "push";
1418 break;
1419 default:
1420 mnem = "???";
1421 }
1422 AppendToBuffer(((regop <= 1) ? "%s%c " : "%s "),
1423 mnem,
1424 operand_size_code());
1425 data += PrintRightOperand(data);
1426 }
1427 break;
1428
1429 case 0xC7: // imm32, fall through
1430 case 0xC6: // imm8
1431 {
1432 bool is_byte = *data == 0xC6;
1433 data++;
1434
1435 AppendToBuffer("mov%c ", is_byte ? 'b' : operand_size_code());
1436 data += PrintRightOperand(data);
1437 int32_t imm = is_byte ? *data : *reinterpret_cast<int32_t*>(data);
1438 AppendToBuffer(",0x%x", imm);
1439 data += is_byte ? 1 : 4;
1440 }
1441 break;
1442
1443 case 0x80: {
1444 data++;
1445 AppendToBuffer("cmpb ");
1446 data += PrintRightOperand(data);
1447 int32_t imm = *data;
1448 AppendToBuffer(",0x%x", imm);
1449 data++;
1450 }
1451 break;
1452
1453 case 0x88: // 8bit, fall through
1454 case 0x89: // 32bit
1455 {
1456 bool is_byte = *data == 0x88;
1457 int mod, regop, rm;
1458 data++;
1459 get_modrm(*data, &mod, &regop, &rm);
1460 AppendToBuffer("mov%c ", is_byte ? 'b' : operand_size_code());
1461 data += PrintRightOperand(data);
1462 AppendToBuffer(",%s", NameOfCPURegister(regop));
1463 }
1464 break;
1465
1466 case 0x90:
1467 case 0x91:
1468 case 0x92:
1469 case 0x93:
1470 case 0x94:
1471 case 0x95:
1472 case 0x96:
1473 case 0x97: {
Steve Blockd0582a62009-12-15 09:54:21 +00001474 int reg = (*data & 0x7) | (rex_b() ? 8 : 0);
Steve Blocka7e24c12009-10-30 11:49:00 +00001475 if (reg == 0) {
1476 AppendToBuffer("nop"); // Common name for xchg rax,rax.
1477 } else {
1478 AppendToBuffer("xchg%c rax, %s",
1479 operand_size_code(),
1480 NameOfCPURegister(reg));
1481 }
Steve Blockd0582a62009-12-15 09:54:21 +00001482 data++;
Steve Blocka7e24c12009-10-30 11:49:00 +00001483 }
Steve Blockd0582a62009-12-15 09:54:21 +00001484 break;
Steve Blocka7e24c12009-10-30 11:49:00 +00001485
1486 case 0xFE: {
1487 data++;
1488 int mod, regop, rm;
1489 get_modrm(*data, &mod, &regop, &rm);
Kristian Monsen0d5e1162010-09-30 15:31:59 +01001490 if (regop == 1) {
1491 AppendToBuffer("decb ");
1492 data += PrintRightOperand(data);
Steve Blocka7e24c12009-10-30 11:49:00 +00001493 } else {
1494 UnimplementedInstruction();
1495 }
Steve Blocka7e24c12009-10-30 11:49:00 +00001496 }
1497 break;
1498
1499 case 0x68:
1500 AppendToBuffer("push 0x%x", *reinterpret_cast<int32_t*>(data + 1));
1501 data += 5;
1502 break;
1503
1504 case 0x6A:
1505 AppendToBuffer("push 0x%x", *reinterpret_cast<int8_t*>(data + 1));
1506 data += 2;
1507 break;
1508
1509 case 0xA1: // Fall through.
1510 case 0xA3:
1511 switch (operand_size()) {
1512 case DOUBLEWORD_SIZE: {
1513 const char* memory_location = NameOfAddress(
1514 reinterpret_cast<byte*>(
1515 *reinterpret_cast<int32_t*>(data + 1)));
1516 if (*data == 0xA1) { // Opcode 0xA1
1517 AppendToBuffer("movzxlq rax,(%s)", memory_location);
1518 } else { // Opcode 0xA3
1519 AppendToBuffer("movzxlq (%s),rax", memory_location);
1520 }
1521 data += 5;
1522 break;
1523 }
1524 case QUADWORD_SIZE: {
1525 // New x64 instruction mov rax,(imm_64).
1526 const char* memory_location = NameOfAddress(
1527 *reinterpret_cast<byte**>(data + 1));
1528 if (*data == 0xA1) { // Opcode 0xA1
1529 AppendToBuffer("movq rax,(%s)", memory_location);
1530 } else { // Opcode 0xA3
1531 AppendToBuffer("movq (%s),rax", memory_location);
1532 }
1533 data += 9;
1534 break;
1535 }
1536 default:
1537 UnimplementedInstruction();
1538 data += 2;
1539 }
1540 break;
1541
1542 case 0xA8:
1543 AppendToBuffer("test al,0x%x", *reinterpret_cast<uint8_t*>(data + 1));
1544 data += 2;
1545 break;
1546
1547 case 0xA9: {
1548 int64_t value = 0;
1549 switch (operand_size()) {
1550 case WORD_SIZE:
1551 value = *reinterpret_cast<uint16_t*>(data + 1);
1552 data += 3;
1553 break;
1554 case DOUBLEWORD_SIZE:
1555 value = *reinterpret_cast<uint32_t*>(data + 1);
1556 data += 5;
1557 break;
1558 case QUADWORD_SIZE:
1559 value = *reinterpret_cast<int32_t*>(data + 1);
1560 data += 5;
1561 break;
1562 default:
1563 UNREACHABLE();
1564 }
1565 AppendToBuffer("test%c rax,0x%"V8_PTR_PREFIX"x",
1566 operand_size_code(),
1567 value);
1568 break;
1569 }
1570 case 0xD1: // fall through
1571 case 0xD3: // fall through
1572 case 0xC1:
1573 data += ShiftInstruction(data);
1574 break;
1575 case 0xD0: // fall through
1576 case 0xD2: // fall through
1577 case 0xC0:
1578 byte_size_operand_ = true;
1579 data += ShiftInstruction(data);
1580 break;
1581
1582 case 0xD9: // fall through
1583 case 0xDA: // fall through
1584 case 0xDB: // fall through
1585 case 0xDC: // fall through
1586 case 0xDD: // fall through
1587 case 0xDE: // fall through
1588 case 0xDF:
1589 data += FPUInstruction(data);
1590 break;
1591
1592 case 0xEB:
1593 data += JumpShort(data);
1594 break;
1595
Steve Blockd0582a62009-12-15 09:54:21 +00001596 case 0xF6:
1597 byte_size_operand_ = true; // fall through
Steve Blocka7e24c12009-10-30 11:49:00 +00001598 case 0xF7:
Steve Blockd0582a62009-12-15 09:54:21 +00001599 data += F6F7Instruction(data);
Steve Blocka7e24c12009-10-30 11:49:00 +00001600 break;
1601
1602 default:
1603 UnimplementedInstruction();
1604 data += 1;
1605 }
1606 } // !processed
1607
1608 if (tmp_buffer_pos_ < sizeof tmp_buffer_) {
1609 tmp_buffer_[tmp_buffer_pos_] = '\0';
1610 }
1611
Steve Blockd0582a62009-12-15 09:54:21 +00001612 int instr_len = static_cast<int>(data - instr);
Steve Blocka7e24c12009-10-30 11:49:00 +00001613 ASSERT(instr_len > 0); // Ensure progress.
1614
1615 int outp = 0;
1616 // Instruction bytes.
1617 for (byte* bp = instr; bp < data; bp++) {
1618 outp += v8::internal::OS::SNPrintF(out_buffer + outp, "%02x", *bp);
1619 }
1620 for (int i = 6 - instr_len; i >= 0; i--) {
1621 outp += v8::internal::OS::SNPrintF(out_buffer + outp, " ");
1622 }
1623
1624 outp += v8::internal::OS::SNPrintF(out_buffer + outp, " %s",
1625 tmp_buffer_.start());
1626 return instr_len;
1627}
1628
1629//------------------------------------------------------------------------------
1630
1631
// Names of the sixteen 64-bit general-purpose registers, indexed by
// register number. Both the strings and the table itself are read-only.
static const char* const cpu_regs[16] = {
  "rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi",
  "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"
};
1636
1637
// Names of the sixteen byte-sized general-purpose registers, indexed by
// register number. Both the strings and the table itself are read-only.
static const char* const byte_cpu_regs[16] = {
  "al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil",
  "r8l", "r9l", "r10l", "r11l", "r12l", "r13l", "r14l", "r15l"
};
1642
1643
// Names of the sixteen XMM registers, indexed by register number.
// Both the strings and the table itself are read-only.
static const char* const xmm_regs[16] = {
  "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7",
  "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15"
};
1648
1649
1650const char* NameConverter::NameOfAddress(byte* addr) const {
1651 static v8::internal::EmbeddedVector<char, 32> tmp_buffer;
1652 v8::internal::OS::SNPrintF(tmp_buffer, "%p", addr);
1653 return tmp_buffer.start();
1654}
1655
1656
1657const char* NameConverter::NameOfConstant(byte* addr) const {
1658 return NameOfAddress(addr);
1659}
1660
1661
1662const char* NameConverter::NameOfCPURegister(int reg) const {
1663 if (0 <= reg && reg < 16)
1664 return cpu_regs[reg];
1665 return "noreg";
1666}
1667
1668
1669const char* NameConverter::NameOfByteCPURegister(int reg) const {
1670 if (0 <= reg && reg < 16)
1671 return byte_cpu_regs[reg];
1672 return "noreg";
1673}
1674
1675
1676const char* NameConverter::NameOfXMMRegister(int reg) const {
1677 if (0 <= reg && reg < 16)
1678 return xmm_regs[reg];
1679 return "noxmmreg";
1680}
1681
1682
1683const char* NameConverter::NameInCode(byte* addr) const {
1684 // X64 does not embed debug strings at the moment.
1685 UNREACHABLE();
1686 return "";
1687}
1688
1689//------------------------------------------------------------------------------
1690
1691Disassembler::Disassembler(const NameConverter& converter)
1692 : converter_(converter) { }
1693
1694Disassembler::~Disassembler() { }
1695
1696
1697int Disassembler::InstructionDecode(v8::internal::Vector<char> buffer,
1698 byte* instruction) {
1699 DisassemblerX64 d(converter_, CONTINUE_ON_UNIMPLEMENTED_OPCODE);
1700 return d.InstructionDecode(buffer, instruction);
1701}
1702
1703
1704// The X64 assembler does not use constant pools.
1705int Disassembler::ConstantPoolSizeAt(byte* instruction) {
1706 return -1;
1707}
1708
1709
1710void Disassembler::Disassemble(FILE* f, byte* begin, byte* end) {
1711 NameConverter converter;
1712 Disassembler d(converter);
1713 for (byte* pc = begin; pc < end;) {
1714 v8::internal::EmbeddedVector<char, 128> buffer;
1715 buffer[0] = '\0';
1716 byte* prev_pc = pc;
1717 pc += d.InstructionDecode(buffer, pc);
1718 fprintf(f, "%p", prev_pc);
1719 fprintf(f, " ");
1720
1721 for (byte* bp = prev_pc; bp < pc; bp++) {
1722 fprintf(f, "%02x", *bp);
1723 }
Steve Blockd0582a62009-12-15 09:54:21 +00001724 for (int i = 6 - static_cast<int>(pc - prev_pc); i >= 0; i--) {
Steve Blocka7e24c12009-10-30 11:49:00 +00001725 fprintf(f, " ");
1726 }
1727 fprintf(f, " %s\n", buffer.start());
1728 }
1729}
1730
1731} // namespace disasm
Leon Clarkef7060e22010-06-03 12:02:55 +01001732
1733#endif // V8_TARGET_ARCH_X64