blob: 19d0ba2e1c41563c0593a3eca84dc8e5c45d9842 [file] [log] [blame]
Tim Northover3b0846e2014-05-24 12:50:23 +00001//===- AArch64ExternalSymbolizer.cpp - Symbolizer for AArch64 ---*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10#include "AArch64ExternalSymbolizer.h"
11#include "AArch64Subtarget.h"
12#include "MCTargetDesc/AArch64AddressingModes.h"
13#include "Utils/AArch64BaseInfo.h"
14#include "llvm/MC/MCContext.h"
15#include "llvm/MC/MCExpr.h"
16#include "llvm/MC/MCInst.h"
17#include "llvm/Support/Format.h"
18#include "llvm/Support/raw_ostream.h"
19
20using namespace llvm;
21
22#define DEBUG_TYPE "aarch64-disassembler"
23
24static MCSymbolRefExpr::VariantKind
25getVariant(uint64_t LLVMDisassembler_VariantKind) {
26 switch (LLVMDisassembler_VariantKind) {
27 case LLVMDisassembler_VariantKind_None:
28 return MCSymbolRefExpr::VK_None;
29 case LLVMDisassembler_VariantKind_ARM64_PAGE:
30 return MCSymbolRefExpr::VK_PAGE;
31 case LLVMDisassembler_VariantKind_ARM64_PAGEOFF:
32 return MCSymbolRefExpr::VK_PAGEOFF;
33 case LLVMDisassembler_VariantKind_ARM64_GOTPAGE:
34 return MCSymbolRefExpr::VK_GOTPAGE;
35 case LLVMDisassembler_VariantKind_ARM64_GOTPAGEOFF:
36 return MCSymbolRefExpr::VK_GOTPAGEOFF;
37 case LLVMDisassembler_VariantKind_ARM64_TLVP:
38 case LLVMDisassembler_VariantKind_ARM64_TLVOFF:
39 default:
Craig Topper35b2f752014-06-19 06:10:58 +000040 llvm_unreachable("bad LLVMDisassembler_VariantKind");
Tim Northover3b0846e2014-05-24 12:50:23 +000041 }
42}
43
44/// tryAddingSymbolicOperand - tryAddingSymbolicOperand trys to add a symbolic
45/// operand in place of the immediate Value in the MCInst. The immediate
46/// Value has not had any PC adjustment made by the caller. If the instruction
47/// is a branch that adds the PC to the immediate Value then isBranch is
48/// Success, else Fail. If GetOpInfo is non-null, then it is called to get any
49/// symbolic information at the Address for this instrution. If that returns
50/// non-zero then the symbolic information it returns is used to create an
51/// MCExpr and that is added as an operand to the MCInst. If GetOpInfo()
52/// returns zero and isBranch is Success then a symbol look up for
53/// Address + Value is done and if a symbol is found an MCExpr is created with
54/// that, else an MCExpr with Address + Value is created. If GetOpInfo()
Eric Christopher572e03a2015-06-19 01:53:21 +000055/// returns zero and isBranch is Fail then the Opcode of the MCInst is
Tim Northover3b0846e2014-05-24 12:50:23 +000056/// tested and for ADRP an other instructions that help to load of pointers
57/// a symbol look up is done to see it is returns a specific reference type
58/// to add to the comment stream. This function returns Success if it adds
59/// an operand to the MCInst and Fail otherwise.
60bool AArch64ExternalSymbolizer::tryAddingSymbolicOperand(
61 MCInst &MI, raw_ostream &CommentStream, int64_t Value, uint64_t Address,
62 bool IsBranch, uint64_t Offset, uint64_t InstSize) {
63 // FIXME: This method shares a lot of code with
64 // MCExternalSymbolizer::tryAddingSymbolicOperand. It may be possible
65 // refactor the MCExternalSymbolizer interface to allow more of this
66 // implementation to be shared.
67 //
68 struct LLVMOpInfo1 SymbolicOp;
69 memset(&SymbolicOp, '\0', sizeof(struct LLVMOpInfo1));
70 SymbolicOp.Value = Value;
71 uint64_t ReferenceType;
72 const char *ReferenceName;
73 if (!GetOpInfo ||
74 !GetOpInfo(DisInfo, Address, 0 /* Offset */, InstSize, 1, &SymbolicOp)) {
75 if (IsBranch) {
76 ReferenceType = LLVMDisassembler_ReferenceType_In_Branch;
77 const char *Name = SymbolLookUp(DisInfo, Address + Value, &ReferenceType,
78 Address, &ReferenceName);
79 if (Name) {
80 SymbolicOp.AddSymbol.Name = Name;
81 SymbolicOp.AddSymbol.Present = true;
82 SymbolicOp.Value = 0;
83 } else {
84 SymbolicOp.Value = Address + Value;
85 }
86 if (ReferenceType == LLVMDisassembler_ReferenceType_Out_SymbolStub)
87 CommentStream << "symbol stub for: " << ReferenceName;
88 else if (ReferenceType ==
89 LLVMDisassembler_ReferenceType_Out_Objc_Message)
90 CommentStream << "Objc message: " << ReferenceName;
91 } else if (MI.getOpcode() == AArch64::ADRP) {
92 ReferenceType = LLVMDisassembler_ReferenceType_In_ARM64_ADRP;
93 // otool expects the fully encoded ADRP instruction to be passed in as
94 // the value here, so reconstruct it:
95 const MCRegisterInfo &MCRI = *Ctx.getRegisterInfo();
96 uint32_t EncodedInst = 0x90000000;
97 EncodedInst |= (Value & 0x3) << 29; // immlo
98 EncodedInst |= ((Value >> 2) & 0x7FFFF) << 5; // immhi
99 EncodedInst |= MCRI.getEncodingValue(MI.getOperand(0).getReg()); // reg
100 SymbolLookUp(DisInfo, EncodedInst, &ReferenceType, Address,
101 &ReferenceName);
102 CommentStream << format("0x%llx",
103 0xfffffffffffff000LL & (Address + Value));
104 } else if (MI.getOpcode() == AArch64::ADDXri ||
105 MI.getOpcode() == AArch64::LDRXui ||
106 MI.getOpcode() == AArch64::LDRXl ||
107 MI.getOpcode() == AArch64::ADR) {
108 if (MI.getOpcode() == AArch64::ADDXri)
109 ReferenceType = LLVMDisassembler_ReferenceType_In_ARM64_ADDXri;
110 else if (MI.getOpcode() == AArch64::LDRXui)
111 ReferenceType = LLVMDisassembler_ReferenceType_In_ARM64_LDRXui;
112 if (MI.getOpcode() == AArch64::LDRXl) {
113 ReferenceType = LLVMDisassembler_ReferenceType_In_ARM64_LDRXl;
114 SymbolLookUp(DisInfo, Address + Value, &ReferenceType, Address,
115 &ReferenceName);
116 } else if (MI.getOpcode() == AArch64::ADR) {
117 ReferenceType = LLVMDisassembler_ReferenceType_In_ARM64_ADR;
118 SymbolLookUp(DisInfo, Address + Value, &ReferenceType, Address,
119 &ReferenceName);
120 } else {
121 const MCRegisterInfo &MCRI = *Ctx.getRegisterInfo();
122 // otool expects the fully encoded ADD/LDR instruction to be passed in
123 // as the value here, so reconstruct it:
124 unsigned EncodedInst =
125 MI.getOpcode() == AArch64::ADDXri ? 0x91000000: 0xF9400000;
126 EncodedInst |= Value << 10; // imm12 [+ shift:2 for ADD]
127 EncodedInst |=
128 MCRI.getEncodingValue(MI.getOperand(1).getReg()) << 5; // Rn
129 EncodedInst |= MCRI.getEncodingValue(MI.getOperand(0).getReg()); // Rd
130
131 SymbolLookUp(DisInfo, EncodedInst, &ReferenceType, Address,
132 &ReferenceName);
133 }
134 if (ReferenceType == LLVMDisassembler_ReferenceType_Out_LitPool_SymAddr)
135 CommentStream << "literal pool symbol address: " << ReferenceName;
136 else if (ReferenceType ==
Kevin Enderbyd2d2ce92016-06-13 21:08:57 +0000137 LLVMDisassembler_ReferenceType_Out_LitPool_CstrAddr) {
138 CommentStream << "literal pool for: \"";
NAKAMURA Takumife1202c2016-06-20 00:37:41 +0000139 CommentStream.write_escaped(ReferenceName);
Kevin Enderbyd2d2ce92016-06-13 21:08:57 +0000140 CommentStream << "\"";
141 } else if (ReferenceType ==
Tim Northover3b0846e2014-05-24 12:50:23 +0000142 LLVMDisassembler_ReferenceType_Out_Objc_CFString_Ref)
143 CommentStream << "Objc cfstring ref: @\"" << ReferenceName << "\"";
144 else if (ReferenceType ==
145 LLVMDisassembler_ReferenceType_Out_Objc_Message)
146 CommentStream << "Objc message: " << ReferenceName;
147 else if (ReferenceType ==
148 LLVMDisassembler_ReferenceType_Out_Objc_Message_Ref)
149 CommentStream << "Objc message ref: " << ReferenceName;
150 else if (ReferenceType ==
151 LLVMDisassembler_ReferenceType_Out_Objc_Selector_Ref)
152 CommentStream << "Objc selector ref: " << ReferenceName;
153 else if (ReferenceType ==
154 LLVMDisassembler_ReferenceType_Out_Objc_Class_Ref)
155 CommentStream << "Objc class ref: " << ReferenceName;
156 // For these instructions, the SymbolLookUp() above is just to get the
157 // ReferenceType and ReferenceName. We want to make sure not to
158 // fall through so we don't build an MCExpr to leave the disassembly
159 // of the immediate values of these instructions to the InstPrinter.
160 return false;
161 } else {
162 return false;
163 }
164 }
165
166 const MCExpr *Add = nullptr;
167 if (SymbolicOp.AddSymbol.Present) {
168 if (SymbolicOp.AddSymbol.Name) {
169 StringRef Name(SymbolicOp.AddSymbol.Name);
Jim Grosbach6f482002015-05-18 18:43:14 +0000170 MCSymbol *Sym = Ctx.getOrCreateSymbol(Name);
Tim Northover3b0846e2014-05-24 12:50:23 +0000171 MCSymbolRefExpr::VariantKind Variant = getVariant(SymbolicOp.VariantKind);
172 if (Variant != MCSymbolRefExpr::VK_None)
Jim Grosbach13760bd2015-05-30 01:25:56 +0000173 Add = MCSymbolRefExpr::create(Sym, Variant, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000174 else
Jim Grosbach13760bd2015-05-30 01:25:56 +0000175 Add = MCSymbolRefExpr::create(Sym, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000176 } else {
Jim Grosbach13760bd2015-05-30 01:25:56 +0000177 Add = MCConstantExpr::create(SymbolicOp.AddSymbol.Value, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000178 }
179 }
180
181 const MCExpr *Sub = nullptr;
182 if (SymbolicOp.SubtractSymbol.Present) {
183 if (SymbolicOp.SubtractSymbol.Name) {
184 StringRef Name(SymbolicOp.SubtractSymbol.Name);
Jim Grosbach6f482002015-05-18 18:43:14 +0000185 MCSymbol *Sym = Ctx.getOrCreateSymbol(Name);
Jim Grosbach13760bd2015-05-30 01:25:56 +0000186 Sub = MCSymbolRefExpr::create(Sym, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000187 } else {
Jim Grosbach13760bd2015-05-30 01:25:56 +0000188 Sub = MCConstantExpr::create(SymbolicOp.SubtractSymbol.Value, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000189 }
190 }
191
192 const MCExpr *Off = nullptr;
193 if (SymbolicOp.Value != 0)
Jim Grosbach13760bd2015-05-30 01:25:56 +0000194 Off = MCConstantExpr::create(SymbolicOp.Value, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000195
196 const MCExpr *Expr;
197 if (Sub) {
198 const MCExpr *LHS;
199 if (Add)
Jim Grosbach13760bd2015-05-30 01:25:56 +0000200 LHS = MCBinaryExpr::createSub(Add, Sub, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000201 else
Jim Grosbach13760bd2015-05-30 01:25:56 +0000202 LHS = MCUnaryExpr::createMinus(Sub, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000203 if (Off)
Jim Grosbach13760bd2015-05-30 01:25:56 +0000204 Expr = MCBinaryExpr::createAdd(LHS, Off, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000205 else
206 Expr = LHS;
207 } else if (Add) {
208 if (Off)
Jim Grosbach13760bd2015-05-30 01:25:56 +0000209 Expr = MCBinaryExpr::createAdd(Add, Off, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000210 else
211 Expr = Add;
212 } else {
213 if (Off)
214 Expr = Off;
215 else
Jim Grosbach13760bd2015-05-30 01:25:56 +0000216 Expr = MCConstantExpr::create(0, Ctx);
Tim Northover3b0846e2014-05-24 12:50:23 +0000217 }
218
Jim Grosbache9119e42015-05-13 18:37:00 +0000219 MI.addOperand(MCOperand::createExpr(Expr));
Tim Northover3b0846e2014-05-24 12:50:23 +0000220
221 return true;
222}