blob: c2e0ef288f4aa421e45963253b8f0d75f174ed37 [file] [log] [blame]
Chris Lattner24943d22010-06-08 16:52:24 +00001//===-- DisassemblerLLVM.cpp ------------------------------------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10#include "DisassemblerLLVM.h"
11
12#include "llvm-c/EnhancedDisassembly.h"
13
14#include "lldb/Core/Address.h"
15#include "lldb/Core/DataExtractor.h"
16#include "lldb/Core/Disassembler.h"
17#include "lldb/Core/Module.h"
18#include "lldb/Core/PluginManager.h"
19#include "lldb/Core/Stream.h"
20#include "lldb/Core/StreamString.h"
21#include "lldb/Symbol/SymbolContext.h"
22
23#include "lldb/Target/ExecutionContext.h"
24#include "lldb/Target/Process.h"
25#include "lldb/Target/RegisterContext.h"
26#include "lldb/Target/Target.h"
27
Greg Claytonb01000f2011-01-17 03:46:26 +000028#include <assert.h>
Chris Lattner24943d22010-06-08 16:52:24 +000029
30using namespace lldb;
31using namespace lldb_private;
32
33
Greg Claytonb1888f22011-03-19 01:12:21 +000034static int
Greg Clayton7bc39082011-03-24 23:53:38 +000035DataExtractorByteReader (uint8_t *byte, uint64_t address, void *arg)
Chris Lattner24943d22010-06-08 16:52:24 +000036{
37 DataExtractor &extractor = *((DataExtractor *)arg);
38
39 if (extractor.ValidOffset(address))
40 {
41 *byte = *(extractor.GetDataStart() + address);
42 return 0;
43 }
44 else
45 {
46 return -1;
47 }
48}
49
50namespace {
51 struct RegisterReaderArg {
52 const lldb::addr_t instructionPointer;
53 const EDDisassemblerRef disassembler;
54
55 RegisterReaderArg(lldb::addr_t ip,
56 EDDisassemblerRef dis) :
57 instructionPointer(ip),
58 disassembler(dis)
59 {
60 }
61 };
62}
63
64static int IPRegisterReader(uint64_t *value, unsigned regID, void* arg)
65{
66 uint64_t instructionPointer = ((RegisterReaderArg*)arg)->instructionPointer;
67 EDDisassemblerRef disassembler = ((RegisterReaderArg*)arg)->disassembler;
68
Greg Claytonb1888f22011-03-19 01:12:21 +000069 if (EDRegisterIsProgramCounter(disassembler, regID)) {
Chris Lattner24943d22010-06-08 16:52:24 +000070 *value = instructionPointer;
71 return 0;
72 }
73
74 return -1;
75}
76
Caroline Ticeaf591802011-04-05 23:22:54 +000077InstructionLLVM::InstructionLLVM (const Address &addr,
78 AddressClass addr_class,
Greg Claytonabe0fed2011-04-18 08:33:37 +000079 EDDisassemblerRef disassembler,
Johnny Chen80ab18e2011-05-12 22:25:53 +000080 llvm::Triple::ArchType arch_type) :
Greg Clayton889fbd02011-03-26 19:14:58 +000081 Instruction (addr, addr_class),
Greg Claytonabe0fed2011-04-18 08:33:37 +000082 m_disassembler (disassembler),
Johnny Chen80ab18e2011-05-12 22:25:53 +000083 m_arch_type (arch_type)
Chris Lattner24943d22010-06-08 16:52:24 +000084{
85}
86
Caroline Ticeaf591802011-04-05 23:22:54 +000087InstructionLLVM::~InstructionLLVM()
Chris Lattner24943d22010-06-08 16:52:24 +000088{
89}
90
91static void
92PadString(Stream *s, const std::string &str, size_t width)
93{
94 int diff = width - str.length();
95
96 if (diff > 0)
97 s->Printf("%s%*.*s", str.c_str(), diff, diff, "");
98 else
99 s->Printf("%s ", str.c_str());
100}
101
Johnny Chen51ff2482011-05-19 01:05:37 +0000102#include "llvm/ADT/StringRef.h"
103static void
104StripSpaces(llvm::StringRef &Str)
105{
106 while (!Str.empty() && isspace(Str[0]))
107 Str = Str.substr(1);
108 while (!Str.empty() && isspace(Str.back()))
109 Str = Str.substr(0, Str.size()-1);
110}
111
Chris Lattner24943d22010-06-08 16:52:24 +0000112void
Caroline Ticeaf591802011-04-05 23:22:54 +0000113InstructionLLVM::Dump
Chris Lattner24943d22010-06-08 16:52:24 +0000114(
115 Stream *s,
Greg Clayton889fbd02011-03-26 19:14:58 +0000116 uint32_t max_opcode_byte_size,
Greg Clayton5c4c7462010-10-06 03:09:58 +0000117 bool show_address,
Greg Clayton149731c2011-03-25 18:03:16 +0000118 bool show_bytes,
Greg Clayton5c4c7462010-10-06 03:09:58 +0000119 const lldb_private::ExecutionContext* exe_ctx,
Chris Lattner24943d22010-06-08 16:52:24 +0000120 bool raw
121)
122{
123 const size_t opcodeColumnWidth = 7;
124 const size_t operandColumnWidth = 25;
125
Greg Clayton5c4c7462010-10-06 03:09:58 +0000126 ExecutionContextScope *exe_scope = NULL;
127 if (exe_ctx)
128 exe_scope = exe_ctx->GetBestExecutionContextScope();
129
Chris Lattner24943d22010-06-08 16:52:24 +0000130 // If we have an address, print it out
Sean Callanan91557b02010-11-10 01:38:28 +0000131 if (GetAddress().IsValid() && show_address)
Greg Clayton70436352010-06-30 23:03:03 +0000132 {
Greg Clayton5c4c7462010-10-06 03:09:58 +0000133 if (GetAddress().Dump (s,
134 exe_scope,
135 Address::DumpStyleLoadAddress,
136 Address::DumpStyleModuleWithFileAddress,
137 0))
Greg Clayton70436352010-06-30 23:03:03 +0000138 s->PutCString(": ");
139 }
Chris Lattner24943d22010-06-08 16:52:24 +0000140
141 // If we are supposed to show bytes, "bytes" will be non-NULL.
Greg Clayton149731c2011-03-25 18:03:16 +0000142 if (show_bytes)
Chris Lattner24943d22010-06-08 16:52:24 +0000143 {
Greg Clayton149731c2011-03-25 18:03:16 +0000144 if (m_opcode.GetType() == Opcode::eTypeBytes)
Chris Lattner24943d22010-06-08 16:52:24 +0000145 {
Greg Clayton149731c2011-03-25 18:03:16 +0000146 // x86_64 and i386 are the only ones that use bytes right now so
147 // pad out the byte dump to be able to always show 15 bytes (3 chars each)
148 // plus a space
Greg Clayton889fbd02011-03-26 19:14:58 +0000149 if (max_opcode_byte_size > 0)
150 m_opcode.Dump (s, max_opcode_byte_size * 3 + 1);
151 else
152 m_opcode.Dump (s, 15 * 3 + 1);
Greg Clayton149731c2011-03-25 18:03:16 +0000153 }
154 else
155 {
156 // Else, we have ARM which can show up to a uint32_t 0x00000000 (10 spaces)
157 // plus two for padding...
Greg Clayton889fbd02011-03-26 19:14:58 +0000158 if (max_opcode_byte_size > 0)
159 m_opcode.Dump (s, max_opcode_byte_size * 3 + 1);
160 else
161 m_opcode.Dump (s, 12);
Chris Lattner24943d22010-06-08 16:52:24 +0000162 }
163 }
164
Greg Claytonf15996e2011-04-07 22:46:35 +0000165 int numTokens = -1;
166
Johnny Chen80ab18e2011-05-12 22:25:53 +0000167 // FIXME!!!
168 /* Remove the following section of code related to force_raw .... */
169 bool force_raw = m_arch_type == llvm::Triple::arm ||
170 m_arch_type == llvm::Triple::thumb;
Greg Claytonf15996e2011-04-07 22:46:35 +0000171 if (!raw)
Johnny Chen80ab18e2011-05-12 22:25:53 +0000172 raw = force_raw;
173 /* .... when we fix the edis for arm/thumb. */
Greg Claytonabe0fed2011-04-18 08:33:37 +0000174
175 if (!raw)
Greg Claytonf15996e2011-04-07 22:46:35 +0000176 numTokens = EDNumTokens(m_inst);
Chris Lattner24943d22010-06-08 16:52:24 +0000177
178 int currentOpIndex = -1;
179
Greg Claytonf15996e2011-04-07 22:46:35 +0000180 bool printTokenized = false;
181
182 if (numTokens != -1 && !raw)
Sean Callanan8541f2f2010-07-23 02:19:15 +0000183 {
184 addr_t base_addr = LLDB_INVALID_ADDRESS;
Greg Claytonf15996e2011-04-07 22:46:35 +0000185
Greg Clayton5c4c7462010-10-06 03:09:58 +0000186 if (exe_ctx && exe_ctx->target && !exe_ctx->target->GetSectionLoadList().IsEmpty())
187 base_addr = GetAddress().GetLoadAddress (exe_ctx->target);
Sean Callanan8541f2f2010-07-23 02:19:15 +0000188 if (base_addr == LLDB_INVALID_ADDRESS)
Greg Clayton5c4c7462010-10-06 03:09:58 +0000189 base_addr = GetAddress().GetFileAddress ();
Greg Claytonf15996e2011-04-07 22:46:35 +0000190
Johnny Chen80ab18e2011-05-12 22:25:53 +0000191 lldb::addr_t PC = base_addr + EDInstByteSize(m_inst);
192
193 // When executing an ARM instruction, PC reads as the address of the
194 // current instruction plus 8. And for Thumb, it is plus 4.
195 if (m_arch_type == llvm::Triple::arm)
196 PC = base_addr + 8;
197 else if (m_arch_type == llvm::Triple::thumb)
198 PC = base_addr + 4;
199
200 RegisterReaderArg rra(PC, m_disassembler);
Johnny Chenc5272bf2011-05-12 18:48:11 +0000201
Chris Lattner24943d22010-06-08 16:52:24 +0000202 printTokenized = true;
203
204 // Handle the opcode column.
205
206 StreamString opcode;
207
208 int tokenIndex = 0;
209
210 EDTokenRef token;
211 const char *tokenStr;
212
Johnny Chenff8fea62011-05-18 22:48:41 +0000213 if (EDGetToken(&token, m_inst, tokenIndex)) // 0 on success
214 printTokenized = false;
215 else if (!EDTokenIsOpcode(token))
216 printTokenized = false;
217 else if (EDGetTokenString(&tokenStr, token)) // 0 on success
Chris Lattner24943d22010-06-08 16:52:24 +0000218 printTokenized = false;
219
Johnny Chenff8fea62011-05-18 22:48:41 +0000220 if (printTokenized)
Chris Lattner24943d22010-06-08 16:52:24 +0000221 {
Johnny Chenff8fea62011-05-18 22:48:41 +0000222 // Put the token string into our opcode string
223 opcode.PutCString(tokenStr);
Chris Lattner24943d22010-06-08 16:52:24 +0000224
Johnny Chenff8fea62011-05-18 22:48:41 +0000225 // If anything follows, it probably starts with some whitespace. Skip it.
226 if (++tokenIndex < numTokens)
227 {
228 if (EDGetToken(&token, m_inst, tokenIndex)) // 0 on success
229 printTokenized = false;
230 else if (!EDTokenIsWhitespace(token))
231 printTokenized = false;
232 }
233
234 ++tokenIndex;
Chris Lattner24943d22010-06-08 16:52:24 +0000235 }
236
Chris Lattner24943d22010-06-08 16:52:24 +0000237 // Handle the operands and the comment.
Chris Lattner24943d22010-06-08 16:52:24 +0000238 StreamString operands;
239 StreamString comment;
240
241 if (printTokenized)
242 {
Johnny Chen51ff2482011-05-19 01:05:37 +0000243 bool show_token = false;
Chris Lattner24943d22010-06-08 16:52:24 +0000244
245 for (; tokenIndex < numTokens; ++tokenIndex)
246 {
247 if (EDGetToken(&token, m_inst, tokenIndex))
248 return;
249
Johnny Chen6d61ebf2011-05-18 22:08:52 +0000250 int operandIndex = EDOperandIndexForToken(token);
Chris Lattner24943d22010-06-08 16:52:24 +0000251
Johnny Chen6d61ebf2011-05-18 22:08:52 +0000252 if (operandIndex >= 0)
253 {
254 if (operandIndex != currentOpIndex)
Chris Lattner24943d22010-06-08 16:52:24 +0000255 {
Johnny Chen6d61ebf2011-05-18 22:08:52 +0000256 show_token = true;
257
258 currentOpIndex = operandIndex;
259 EDOperandRef operand;
260
261 if (!EDGetOperand(&operand, m_inst, currentOpIndex))
Chris Lattner24943d22010-06-08 16:52:24 +0000262 {
Johnny Chen6d61ebf2011-05-18 22:08:52 +0000263 if (EDOperandIsMemory(operand))
Chris Lattner24943d22010-06-08 16:52:24 +0000264 {
Johnny Chen6d61ebf2011-05-18 22:08:52 +0000265 uint64_t operand_value;
266
267 if (!EDEvaluateOperand(&operand_value, operand, IPRegisterReader, &rra))
Chris Lattner24943d22010-06-08 16:52:24 +0000268 {
Johnny Chen6d61ebf2011-05-18 22:08:52 +0000269 if (EDInstIsBranch(m_inst))
Chris Lattner24943d22010-06-08 16:52:24 +0000270 {
Johnny Chen6d61ebf2011-05-18 22:08:52 +0000271 operands.Printf("0x%llx ", operand_value);
272 show_token = false;
273 }
274 else
275 {
276 // Put the address value into the comment
277 comment.Printf("0x%llx ", operand_value);
278 }
Chris Lattner24943d22010-06-08 16:52:24 +0000279
Johnny Chen6d61ebf2011-05-18 22:08:52 +0000280 lldb_private::Address so_addr;
281 if (exe_ctx && exe_ctx->target && !exe_ctx->target->GetSectionLoadList().IsEmpty())
282 {
283 if (exe_ctx->target->GetSectionLoadList().ResolveLoadAddress (operand_value, so_addr))
284 so_addr.Dump(&comment, exe_scope, Address::DumpStyleResolvedDescriptionNoModule, Address::DumpStyleSectionNameOffset);
285 }
286 else
287 {
288 Module *module = GetAddress().GetModule();
289 if (module)
Chris Lattner24943d22010-06-08 16:52:24 +0000290 {
Johnny Chen6d61ebf2011-05-18 22:08:52 +0000291 if (module->ResolveFileAddress (operand_value, so_addr))
Greg Claytoncf7f1ad2010-07-01 01:26:43 +0000292 so_addr.Dump(&comment, exe_scope, Address::DumpStyleResolvedDescriptionNoModule, Address::DumpStyleSectionNameOffset);
Greg Clayton70436352010-06-30 23:03:03 +0000293 }
Johnny Chen6d61ebf2011-05-18 22:08:52 +0000294 }
295 } // EDEvaluateOperand
296 } // EDOperandIsMemory
297 } // EDGetOperand
298 } // operandIndex != currentOpIndex
299 } // operandIndex >= 0
Chris Lattner24943d22010-06-08 16:52:24 +0000300
301 if (show_token)
302 {
303 if(EDGetTokenString(&tokenStr, token))
304 {
305 printTokenized = false;
306 break;
307 }
308
309 operands.PutCString(tokenStr);
310 }
311 } // for (tokenIndex)
312
Johnny Chende5cc8c2011-05-20 17:27:37 +0000313 // FIXME!!!
314 // Workaround for llvm::tB's operands not properly parsed by ARMAsmParser.
315 if (m_arch_type == llvm::Triple::thumb && opcode.GetString() == "b") {
316 const char *inst_str;
Peter Collingbourned77c0392011-05-20 22:42:59 +0000317 const char *pos = NULL;
Johnny Chende5cc8c2011-05-20 17:27:37 +0000318 if (EDGetInstString(&inst_str, m_inst) == 0 && (pos = strstr(inst_str, "#")) != NULL) {
319 uint64_t operand_value = PC + atoi(++pos);
320 operands.Printf("0x%llx ", operand_value);
321
322 lldb_private::Address so_addr;
323 if (exe_ctx && exe_ctx->target && !exe_ctx->target->GetSectionLoadList().IsEmpty()) {
324 if (exe_ctx->target->GetSectionLoadList().ResolveLoadAddress (operand_value, so_addr))
325 so_addr.Dump(&comment, exe_scope, Address::DumpStyleResolvedDescriptionNoModule, Address::DumpStyleSectionNameOffset);
326 } else {
327 Module *module = GetAddress().GetModule();
328 if (module) {
329 if (module->ResolveFileAddress (operand_value, so_addr))
330 so_addr.Dump(&comment, exe_scope, Address::DumpStyleResolvedDescriptionNoModule, Address::DumpStyleSectionNameOffset);
331 }
332 }
333 }
334 }
335 // END of workaround.
336
Johnny Chen51ff2482011-05-19 01:05:37 +0000337 // If both operands and comment are empty, we will just print out
338 // the raw disassembly.
339 if (operands.GetString().empty() && comment.GetString().empty())
Chris Lattner24943d22010-06-08 16:52:24 +0000340 {
Johnny Chen51ff2482011-05-19 01:05:37 +0000341 const char *str;
342
343 if (EDGetInstString(&str, m_inst))
344 return;
345 llvm::StringRef raw_disasm(str);
346 StripSpaces(raw_disasm);
347 s->PutCString(raw_disasm.str().c_str());
348 }
349 else
350 {
351 PadString(s, opcode.GetString(), opcodeColumnWidth);
352
353 if (comment.GetString().empty())
354 s->PutCString(operands.GetString().c_str());
Chris Lattner24943d22010-06-08 16:52:24 +0000355 else
356 {
Johnny Chen51ff2482011-05-19 01:05:37 +0000357 PadString(s, operands.GetString(), operandColumnWidth);
Chris Lattner24943d22010-06-08 16:52:24 +0000358
Johnny Chen51ff2482011-05-19 01:05:37 +0000359 s->PutCString("; ");
360 s->PutCString(comment.GetString().c_str());
361 } // else (comment.GetString().empty())
362 } // else (operands.GetString().empty() && comment.GetString().empty())
363 } // printTokenized
Chris Lattner24943d22010-06-08 16:52:24 +0000364 } // numTokens != -1
365
366 if (!printTokenized)
367 {
368 const char *str;
369
Johnny Chen51ff2482011-05-19 01:05:37 +0000370 if (EDGetInstString(&str, m_inst)) // 0 on success
Chris Lattner24943d22010-06-08 16:52:24 +0000371 return;
Johnny Chen08251ef2011-05-21 00:44:42 +0000372 if (raw)
373 s->Write(str, strlen(str) - 1);
374 else
375 {
376 // EDis fails to parse the tokens of this inst. Need to align this
377 // raw disassembly with the rest of output.
378 llvm::StringRef raw_disasm(str);
379 StripSpaces(raw_disasm);
380 s->PutCString(raw_disasm.str().c_str());
381 }
Chris Lattner24943d22010-06-08 16:52:24 +0000382 }
383}
384
385bool
Caroline Ticeaf591802011-04-05 23:22:54 +0000386InstructionLLVM::DoesBranch() const
Chris Lattner24943d22010-06-08 16:52:24 +0000387{
388 return EDInstIsBranch(m_inst);
389}
390
391size_t
Caroline Ticeaf591802011-04-05 23:22:54 +0000392InstructionLLVM::Decode (const Disassembler &disassembler,
393 const lldb_private::DataExtractor &data,
394 uint32_t data_offset)
Chris Lattner24943d22010-06-08 16:52:24 +0000395{
396 if (EDCreateInsts(&m_inst, 1, m_disassembler, DataExtractorByteReader, data_offset, (void*)(&data)))
Greg Clayton7bc39082011-03-24 23:53:38 +0000397 {
398 const int byte_size = EDInstByteSize(m_inst);
399 uint32_t offset = data_offset;
400 // Make a copy of the opcode in m_opcode
401 switch (disassembler.GetArchitecture().GetMachine())
402 {
403 case llvm::Triple::x86:
404 case llvm::Triple::x86_64:
405 m_opcode.SetOpcodeBytes (data.PeekData (data_offset, byte_size), byte_size);
406 break;
407
408 case llvm::Triple::arm:
Greg Clayton7bc39082011-03-24 23:53:38 +0000409 case llvm::Triple::thumb:
Greg Clayton149731c2011-03-25 18:03:16 +0000410 switch (byte_size)
411 {
412 case 2:
413 m_opcode.SetOpcode16 (data.GetU16 (&offset));
414 break;
415
416 case 4:
Caroline Tice6b8d3b52011-04-19 23:30:03 +0000417 {
418 if (GetAddressClass() == eAddressClassCodeAlternateISA)
419 {
420 // If it is a 32-bit THUMB instruction, we need to swap the upper & lower halves.
421 uint32_t orig_bytes = data.GetU32 (&offset);
422 uint16_t upper_bits = (orig_bytes >> 16) & ((1u << 16) - 1);
423 uint16_t lower_bits = orig_bytes & ((1u << 16) - 1);
424 uint32_t swapped = (lower_bits << 16) | upper_bits;
425 m_opcode.SetOpcode32 (swapped);
426 }
427 else
428 m_opcode.SetOpcode32 (data.GetU32 (&offset));
429 }
Greg Clayton149731c2011-03-25 18:03:16 +0000430 break;
431
432 default:
433 assert (!"Invalid ARM opcode size");
434 break;
435 }
Greg Clayton7bc39082011-03-24 23:53:38 +0000436 break;
437
438 default:
439 assert (!"This shouldn't happen since we control the architecture we allow DisassemblerLLVM to be created for");
440 break;
441 }
442 return byte_size;
443 }
Chris Lattner24943d22010-06-08 16:52:24 +0000444 else
445 return 0;
446}
447
Chris Lattner24943d22010-06-08 16:52:24 +0000448static inline EDAssemblySyntax_t
Greg Claytoncf015052010-06-11 03:25:34 +0000449SyntaxForArchSpec (const ArchSpec &arch)
Chris Lattner24943d22010-06-08 16:52:24 +0000450{
Greg Clayton940b1032011-02-23 00:35:02 +0000451 switch (arch.GetMachine ())
Greg Clayton5e4f4a22011-02-16 00:00:43 +0000452 {
Greg Clayton940b1032011-02-23 00:35:02 +0000453 case llvm::Triple::x86:
454 case llvm::Triple::x86_64:
Chris Lattner24943d22010-06-08 16:52:24 +0000455 return kEDAssemblySyntaxX86ATT;
Sean Callanand151c8a2011-03-09 01:02:51 +0000456 case llvm::Triple::arm:
Greg Clayton889fbd02011-03-26 19:14:58 +0000457 case llvm::Triple::thumb:
Sean Callanand151c8a2011-03-09 01:02:51 +0000458 return kEDAssemblySyntaxARMUAL;
Greg Clayton5e4f4a22011-02-16 00:00:43 +0000459 default:
460 break;
461 }
Greg Claytoncf015052010-06-11 03:25:34 +0000462 return (EDAssemblySyntax_t)0; // default
Chris Lattner24943d22010-06-08 16:52:24 +0000463}
464
465Disassembler *
466DisassemblerLLVM::CreateInstance(const ArchSpec &arch)
467{
Greg Clayton5e4f4a22011-02-16 00:00:43 +0000468 std::auto_ptr<DisassemblerLLVM> disasm_ap (new DisassemblerLLVM(arch));
469
Caroline Tice080bf612011-04-05 18:46:00 +0000470 if (disasm_ap.get() && disasm_ap->IsValid())
Greg Clayton5e4f4a22011-02-16 00:00:43 +0000471 return disasm_ap.release();
Chris Lattner24943d22010-06-08 16:52:24 +0000472
Greg Claytoncf015052010-06-11 03:25:34 +0000473 return NULL;
Chris Lattner24943d22010-06-08 16:52:24 +0000474}
475
476DisassemblerLLVM::DisassemblerLLVM(const ArchSpec &arch) :
Greg Claytonb01000f2011-01-17 03:46:26 +0000477 Disassembler (arch),
Greg Claytonb1888f22011-03-19 01:12:21 +0000478 m_disassembler (NULL),
479 m_disassembler_thumb (NULL) // For ARM only
Chris Lattner24943d22010-06-08 16:52:24 +0000480{
Greg Clayton5e4f4a22011-02-16 00:00:43 +0000481 const std::string &arch_triple = arch.GetTriple().str();
482 if (!arch_triple.empty())
Greg Claytoncf015052010-06-11 03:25:34 +0000483 {
Greg Clayton5e4f4a22011-02-16 00:00:43 +0000484 if (EDGetDisassembler(&m_disassembler, arch_triple.c_str(), SyntaxForArchSpec (arch)))
485 m_disassembler = NULL;
Greg Claytonb1888f22011-03-19 01:12:21 +0000486 llvm::Triple::ArchType llvm_arch = arch.GetTriple().getArch();
Greg Clayton889fbd02011-03-26 19:14:58 +0000487 // Don't have the lldb::Triple::thumb architecture here. If someone specifies
488 // "thumb" as the architecture, we want a thumb only disassembler. But if any
489 // architecture starting with "arm" if specified, we want to auto detect the
490 // arm/thumb code automatically using the AddressClass from section offset
491 // addresses.
Greg Claytonb1888f22011-03-19 01:12:21 +0000492 if (llvm_arch == llvm::Triple::arm)
493 {
494 if (EDGetDisassembler(&m_disassembler_thumb, "thumb-apple-darwin", kEDAssemblySyntaxARMUAL))
495 m_disassembler_thumb = NULL;
496 }
Greg Claytoncf015052010-06-11 03:25:34 +0000497 }
Chris Lattner24943d22010-06-08 16:52:24 +0000498}
499
500DisassemblerLLVM::~DisassemblerLLVM()
501{
502}
503
504size_t
Greg Clayton70436352010-06-30 23:03:03 +0000505DisassemblerLLVM::DecodeInstructions
Chris Lattner24943d22010-06-08 16:52:24 +0000506(
Greg Clayton5c4c7462010-10-06 03:09:58 +0000507 const Address &base_addr,
Chris Lattner24943d22010-06-08 16:52:24 +0000508 const DataExtractor& data,
509 uint32_t data_offset,
Jim Inghamaa3e3e12011-03-22 01:48:42 +0000510 uint32_t num_instructions,
511 bool append
Chris Lattner24943d22010-06-08 16:52:24 +0000512)
513{
Greg Claytonb01000f2011-01-17 03:46:26 +0000514 if (m_disassembler == NULL)
515 return 0;
516
Chris Lattner24943d22010-06-08 16:52:24 +0000517 size_t total_inst_byte_size = 0;
518
Jim Inghamaa3e3e12011-03-22 01:48:42 +0000519 if (!append)
520 m_instruction_list.Clear();
Chris Lattner24943d22010-06-08 16:52:24 +0000521
522 while (data.ValidOffset(data_offset) && num_instructions)
523 {
Greg Clayton5c4c7462010-10-06 03:09:58 +0000524 Address inst_addr (base_addr);
525 inst_addr.Slide(data_offset);
Greg Claytonb1888f22011-03-19 01:12:21 +0000526
527 bool use_thumb = false;
528 // If we have a thumb disassembler, then we have an ARM architecture
529 // so we need to check what the instruction address class is to make
530 // sure we shouldn't be disassembling as thumb...
Greg Clayton889fbd02011-03-26 19:14:58 +0000531 AddressClass inst_address_class = eAddressClassInvalid;
Greg Claytonb1888f22011-03-19 01:12:21 +0000532 if (m_disassembler_thumb)
533 {
Greg Clayton889fbd02011-03-26 19:14:58 +0000534 inst_address_class = inst_addr.GetAddressClass ();
535 if (inst_address_class == eAddressClassCodeAlternateISA)
Greg Claytonb1888f22011-03-19 01:12:21 +0000536 use_thumb = true;
537 }
Johnny Chen80ab18e2011-05-12 22:25:53 +0000538
Greg Clayton7bc39082011-03-24 23:53:38 +0000539 InstructionSP inst_sp (new InstructionLLVM (inst_addr,
Greg Clayton889fbd02011-03-26 19:14:58 +0000540 inst_address_class,
Greg Claytonabe0fed2011-04-18 08:33:37 +0000541 use_thumb ? m_disassembler_thumb : m_disassembler,
Johnny Chen1608c872011-05-18 18:22:16 +0000542 use_thumb ? llvm::Triple::thumb : m_arch.GetMachine()));
Chris Lattner24943d22010-06-08 16:52:24 +0000543
Greg Clayton889fbd02011-03-26 19:14:58 +0000544 size_t inst_byte_size = inst_sp->Decode (*this, data, data_offset);
Chris Lattner24943d22010-06-08 16:52:24 +0000545
546 if (inst_byte_size == 0)
547 break;
548
Greg Clayton5c4c7462010-10-06 03:09:58 +0000549 m_instruction_list.Append (inst_sp);
Chris Lattner24943d22010-06-08 16:52:24 +0000550
551 total_inst_byte_size += inst_byte_size;
552 data_offset += inst_byte_size;
553 num_instructions--;
554 }
555
556 return total_inst_byte_size;
557}
558
559void
560DisassemblerLLVM::Initialize()
561{
562 PluginManager::RegisterPlugin (GetPluginNameStatic(),
563 GetPluginDescriptionStatic(),
564 CreateInstance);
565}
566
567void
568DisassemblerLLVM::Terminate()
569{
570 PluginManager::UnregisterPlugin (CreateInstance);
571}
572
573
574const char *
575DisassemblerLLVM::GetPluginNameStatic()
576{
Greg Clayton149731c2011-03-25 18:03:16 +0000577 return "llvm";
Chris Lattner24943d22010-06-08 16:52:24 +0000578}
579
580const char *
581DisassemblerLLVM::GetPluginDescriptionStatic()
582{
Greg Clayton149731c2011-03-25 18:03:16 +0000583 return "Disassembler that uses LLVM opcode tables to disassemble i386, x86_64 and ARM.";
Chris Lattner24943d22010-06-08 16:52:24 +0000584}
585
586//------------------------------------------------------------------
587// PluginInterface protocol
588//------------------------------------------------------------------
589const char *
590DisassemblerLLVM::GetPluginName()
591{
592 return "DisassemblerLLVM";
593}
594
595const char *
596DisassemblerLLVM::GetShortPluginName()
597{
598 return GetPluginNameStatic();
599}
600
601uint32_t
602DisassemblerLLVM::GetPluginVersion()
603{
604 return 1;
605}
606