blob: 618e4d77db4cd5fe8e6ad3a0f08b2c67b5409186 [file] [log] [blame]
Clement Courbet44b4c542018-06-19 11:28:59 +00001//===-- Target.cpp ----------------------------------------------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9#include "../Target.h"
10
Clement Courbet4860b982018-06-26 08:49:30 +000011#include "../Latency.h"
12#include "../Uops.h"
Clement Courbet717c9762018-06-28 07:41:16 +000013#include "MCTargetDesc/X86BaseInfo.h"
Clement Courbeta51efc22018-06-25 13:12:02 +000014#include "MCTargetDesc/X86MCTargetDesc.h"
Clement Courbet6fd00e32018-06-20 11:54:35 +000015#include "X86.h"
Clement Courbeta51efc22018-06-25 13:12:02 +000016#include "X86RegisterInfo.h"
Clement Courbete7851692018-07-03 06:17:05 +000017#include "X86Subtarget.h"
Clement Courbeta51efc22018-06-25 13:12:02 +000018#include "llvm/MC/MCInstBuilder.h"
Clement Courbet6fd00e32018-06-20 11:54:35 +000019
Fangrui Song32401af2018-10-22 17:10:47 +000020namespace llvm {
Clement Courbet44b4c542018-06-19 11:28:59 +000021namespace exegesis {
22
23namespace {
24
Clement Courbetc5448382018-11-07 16:14:55 +000025// Returns an error if we cannot handle the memory references in this
26// instruction.
27Error isInvalidMemoryInstr(const Instruction &Instr) {
28 switch (Instr.Description->TSFlags & X86II::FormMask) {
29 default:
30 llvm_unreachable("Unknown FormMask value");
31 // These have no memory access.
32 case X86II::Pseudo:
33 case X86II::RawFrm:
34 case X86II::MRMDestReg:
35 case X86II::MRMSrcReg:
36 case X86II::MRMSrcReg4VOp3:
37 case X86II::MRMSrcRegOp4:
38 case X86II::MRMXr:
39 case X86II::MRM0r:
40 case X86II::MRM1r:
41 case X86II::MRM2r:
42 case X86II::MRM3r:
43 case X86II::MRM4r:
44 case X86II::MRM5r:
45 case X86II::MRM6r:
46 case X86II::MRM7r:
47 case X86II::MRM_C0:
48 case X86II::MRM_C1:
49 case X86II::MRM_C2:
50 case X86II::MRM_C3:
51 case X86II::MRM_C4:
52 case X86II::MRM_C5:
53 case X86II::MRM_C6:
54 case X86II::MRM_C7:
55 case X86II::MRM_C8:
56 case X86II::MRM_C9:
57 case X86II::MRM_CA:
58 case X86II::MRM_CB:
59 case X86II::MRM_CC:
60 case X86II::MRM_CD:
61 case X86II::MRM_CE:
62 case X86II::MRM_CF:
63 case X86II::MRM_D0:
64 case X86II::MRM_D1:
65 case X86II::MRM_D2:
66 case X86II::MRM_D3:
67 case X86II::MRM_D4:
68 case X86II::MRM_D5:
69 case X86II::MRM_D6:
70 case X86II::MRM_D7:
71 case X86II::MRM_D8:
72 case X86II::MRM_D9:
73 case X86II::MRM_DA:
74 case X86II::MRM_DB:
75 case X86II::MRM_DC:
76 case X86II::MRM_DD:
77 case X86II::MRM_DE:
78 case X86II::MRM_DF:
79 case X86II::MRM_E0:
80 case X86II::MRM_E1:
81 case X86II::MRM_E2:
82 case X86II::MRM_E3:
83 case X86II::MRM_E4:
84 case X86II::MRM_E5:
85 case X86II::MRM_E6:
86 case X86II::MRM_E7:
87 case X86II::MRM_E8:
88 case X86II::MRM_E9:
89 case X86II::MRM_EA:
90 case X86II::MRM_EB:
91 case X86II::MRM_EC:
92 case X86II::MRM_ED:
93 case X86II::MRM_EE:
94 case X86II::MRM_EF:
95 case X86II::MRM_F0:
96 case X86II::MRM_F1:
97 case X86II::MRM_F2:
98 case X86II::MRM_F3:
99 case X86II::MRM_F4:
100 case X86II::MRM_F5:
101 case X86II::MRM_F6:
102 case X86II::MRM_F7:
103 case X86II::MRM_F8:
104 case X86II::MRM_F9:
105 case X86II::MRM_FA:
106 case X86II::MRM_FB:
107 case X86II::MRM_FC:
108 case X86II::MRM_FD:
109 case X86II::MRM_FE:
110 case X86II::MRM_FF:
111 case X86II::RawFrmImm8:
112 return Error::success();
113 case X86II::AddRegFrm:
114 return (Instr.Description->Opcode == X86::POP16r || Instr.Description->Opcode == X86::POP32r ||
115 Instr.Description->Opcode == X86::PUSH16r || Instr.Description->Opcode == X86::PUSH32r)
116 ? make_error<BenchmarkFailure>(
117 "unsupported opcode: unsupported memory access")
118 : Error::success();
119 // These access memory and are handled.
120 case X86II::MRMDestMem:
121 case X86II::MRMSrcMem:
122 case X86II::MRMSrcMem4VOp3:
123 case X86II::MRMSrcMemOp4:
124 case X86II::MRMXm:
125 case X86II::MRM0m:
126 case X86II::MRM1m:
127 case X86II::MRM2m:
128 case X86II::MRM3m:
129 case X86II::MRM4m:
130 case X86II::MRM5m:
131 case X86II::MRM6m:
132 case X86II::MRM7m:
133 return Error::success();
134 // These access memory and are not handled yet.
135 case X86II::RawFrmImm16:
136 case X86II::RawFrmMemOffs:
137 case X86II::RawFrmSrc:
138 case X86II::RawFrmDst:
139 case X86II::RawFrmDstSrc:
140 return make_error<BenchmarkFailure>(
141 "unsupported opcode: non uniform memory access");
Guillaume Chatelet3c639f32018-10-22 14:46:08 +0000142 }
Guillaume Chatelet3c639f32018-10-22 14:46:08 +0000143}
144
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000145static llvm::Error IsInvalidOpcode(const Instruction &Instr) {
146 const auto OpcodeName = Instr.Name;
Clement Courbet003e08f2018-11-06 14:11:58 +0000147 if ((Instr.Description->TSFlags & X86II::FormMask) == X86II::Pseudo)
148 return llvm::make_error<BenchmarkFailure>(
149 "unsupported opcode: pseudo instruction");
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000150 if (OpcodeName.startswith("POPF") || OpcodeName.startswith("PUSHF") ||
151 OpcodeName.startswith("ADJCALLSTACK"))
152 return llvm::make_error<BenchmarkFailure>(
Clement Courbet8d0dd0b2018-10-19 12:24:49 +0000153 "unsupported opcode: Push/Pop/AdjCallStack");
Clement Courbetc5448382018-11-07 16:14:55 +0000154 if (llvm::Error Error = isInvalidMemoryInstr(Instr))
Clement Courbet5b0d7832018-11-07 16:52:50 +0000155 return Error;
Guillaume Chatelet3c639f32018-10-22 14:46:08 +0000156 // We do not handle instructions with OPERAND_PCREL.
157 for (const Operand &Op : Instr.Operands)
158 if (Op.isExplicit() &&
159 Op.getExplicitOperandInfo().OperandType == llvm::MCOI::OPERAND_PCREL)
160 return llvm::make_error<BenchmarkFailure>(
161 "unsupported opcode: PC relative operand");
Clement Courbet8d0dd0b2018-10-19 12:24:49 +0000162 // We do not handle second-form X87 instructions. We only handle first-form
163 // ones (_Fp), see comment in X86InstrFPStack.td.
164 for (const Operand &Op : Instr.Operands)
165 if (Op.isReg() && Op.isExplicit() &&
166 Op.getExplicitOperandInfo().RegClass == llvm::X86::RSTRegClassID)
167 return llvm::make_error<BenchmarkFailure>(
168 "unsupported second-form X87 instruction");
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000169 return llvm::Error::success();
170}
171
172static unsigned GetX86FPFlags(const Instruction &Instr) {
173 return Instr.Description->TSFlags & llvm::X86II::FPTypeMask;
174}
175
176class X86LatencySnippetGenerator : public LatencySnippetGenerator {
177public:
178 using LatencySnippetGenerator::LatencySnippetGenerator;
Clement Courbet4860b982018-06-26 08:49:30 +0000179
Guillaume Chatelet296a8622018-10-15 09:09:19 +0000180 llvm::Expected<std::vector<CodeTemplate>>
181 generateCodeTemplates(const Instruction &Instr) const override {
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000182 if (auto E = IsInvalidOpcode(Instr))
183 return std::move(E);
Clement Courbet717c9762018-06-28 07:41:16 +0000184
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000185 switch (GetX86FPFlags(Instr)) {
Clement Courbet717c9762018-06-28 07:41:16 +0000186 case llvm::X86II::NotFP:
Guillaume Chatelet296a8622018-10-15 09:09:19 +0000187 return LatencySnippetGenerator::generateCodeTemplates(Instr);
Clement Courbet717c9762018-06-28 07:41:16 +0000188 case llvm::X86II::ZeroArgFP:
Clement Courbet717c9762018-06-28 07:41:16 +0000189 case llvm::X86II::OneArgFP:
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000190 case llvm::X86II::SpecialFP:
191 case llvm::X86II::CompareFP:
192 case llvm::X86II::CondMovFP:
193 return llvm::make_error<BenchmarkFailure>("Unsupported x87 Instruction");
Clement Courbet717c9762018-06-28 07:41:16 +0000194 case llvm::X86II::OneArgFPRW:
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000195 case llvm::X86II::TwoArgFP:
196 // These are instructions like
197 // - `ST(0) = fsqrt(ST(0))` (OneArgFPRW)
198 // - `ST(0) = ST(0) + ST(i)` (TwoArgFP)
199 // They are intrinsically serial and do not modify the state of the stack.
Guillaume Chatelet296a8622018-10-15 09:09:19 +0000200 return generateSelfAliasingCodeTemplates(Instr);
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000201 default:
202 llvm_unreachable("Unknown FP Type!");
203 }
204 }
205};
206
207class X86UopsSnippetGenerator : public UopsSnippetGenerator {
208public:
209 using UopsSnippetGenerator::UopsSnippetGenerator;
210
Guillaume Chatelet296a8622018-10-15 09:09:19 +0000211 llvm::Expected<std::vector<CodeTemplate>>
212 generateCodeTemplates(const Instruction &Instr) const override {
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000213 if (auto E = IsInvalidOpcode(Instr))
214 return std::move(E);
215
216 switch (GetX86FPFlags(Instr)) {
217 case llvm::X86II::NotFP:
Guillaume Chatelet296a8622018-10-15 09:09:19 +0000218 return UopsSnippetGenerator::generateCodeTemplates(Instr);
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000219 case llvm::X86II::ZeroArgFP:
220 case llvm::X86II::OneArgFP:
221 case llvm::X86II::SpecialFP:
222 return llvm::make_error<BenchmarkFailure>("Unsupported x87 Instruction");
223 case llvm::X86II::OneArgFPRW:
224 case llvm::X86II::TwoArgFP:
Clement Courbet717c9762018-06-28 07:41:16 +0000225 // These are instructions like
226 // - `ST(0) = fsqrt(ST(0))` (OneArgFPRW)
227 // - `ST(0) = ST(0) + ST(i)` (TwoArgFP)
228 // They are intrinsically serial and do not modify the state of the stack.
229 // We generate the same code for latency and uops.
Guillaume Chatelet296a8622018-10-15 09:09:19 +0000230 return generateSelfAliasingCodeTemplates(Instr);
Clement Courbet717c9762018-06-28 07:41:16 +0000231 case llvm::X86II::CompareFP:
Clement Courbet717c9762018-06-28 07:41:16 +0000232 case llvm::X86II::CondMovFP:
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000233 // We can compute uops for any FP instruction that does not grow or shrink
234 // the stack (either do not touch the stack or push as much as they pop).
Guillaume Chatelet296a8622018-10-15 09:09:19 +0000235 return generateUnconstrainedCodeTemplates(
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000236 Instr, "instruction does not grow/shrink the FP stack");
Clement Courbet717c9762018-06-28 07:41:16 +0000237 default:
238 llvm_unreachable("Unknown FP Type!");
239 }
Clement Courbet4860b982018-06-26 08:49:30 +0000240 }
241};
242
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000243static unsigned GetLoadImmediateOpcode(unsigned RegBitWidth) {
244 switch (RegBitWidth) {
Guillaume Chatelet5ad29092018-09-18 11:26:27 +0000245 case 8:
246 return llvm::X86::MOV8ri;
247 case 16:
248 return llvm::X86::MOV16ri;
249 case 32:
250 return llvm::X86::MOV32ri;
251 case 64:
252 return llvm::X86::MOV64ri;
253 }
254 llvm_unreachable("Invalid Value Width");
255}
256
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000257// Generates instruction to load an immediate value into a register.
258static llvm::MCInst loadImmediate(unsigned Reg, unsigned RegBitWidth,
259 const llvm::APInt &Value) {
260 if (Value.getBitWidth() > RegBitWidth)
261 llvm_unreachable("Value must fit in the Register");
262 return llvm::MCInstBuilder(GetLoadImmediateOpcode(RegBitWidth))
Guillaume Chatelet5ad29092018-09-18 11:26:27 +0000263 .addReg(Reg)
264 .addImm(Value.getZExtValue());
265}
266
267// Allocates scratch memory on the stack.
268static llvm::MCInst allocateStackSpace(unsigned Bytes) {
269 return llvm::MCInstBuilder(llvm::X86::SUB64ri8)
270 .addReg(llvm::X86::RSP)
271 .addReg(llvm::X86::RSP)
272 .addImm(Bytes);
273}
274
275// Fills scratch memory at offset `OffsetBytes` with value `Imm`.
276static llvm::MCInst fillStackSpace(unsigned MovOpcode, unsigned OffsetBytes,
277 uint64_t Imm) {
278 return llvm::MCInstBuilder(MovOpcode)
279 // Address = ESP
280 .addReg(llvm::X86::RSP) // BaseReg
281 .addImm(1) // ScaleAmt
282 .addReg(0) // IndexReg
283 .addImm(OffsetBytes) // Disp
284 .addReg(0) // Segment
285 // Immediate.
286 .addImm(Imm);
287}
288
289// Loads scratch memory into register `Reg` using opcode `RMOpcode`.
290static llvm::MCInst loadToReg(unsigned Reg, unsigned RMOpcode) {
291 return llvm::MCInstBuilder(RMOpcode)
292 .addReg(Reg)
293 // Address = ESP
294 .addReg(llvm::X86::RSP) // BaseReg
295 .addImm(1) // ScaleAmt
296 .addReg(0) // IndexReg
297 .addImm(0) // Disp
298 .addReg(0); // Segment
299}
300
301// Releases scratch memory.
302static llvm::MCInst releaseStackSpace(unsigned Bytes) {
303 return llvm::MCInstBuilder(llvm::X86::ADD64ri8)
304 .addReg(llvm::X86::RSP)
305 .addReg(llvm::X86::RSP)
306 .addImm(Bytes);
307}
308
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000309// Reserves some space on the stack, fills it with the content of the provided
310// constant and provide methods to load the stack value into a register.
Guillaume Chatelet5ad29092018-09-18 11:26:27 +0000311struct ConstantInliner {
Clement Courbet78b2e732018-09-25 07:31:44 +0000312 explicit ConstantInliner(const llvm::APInt &Constant) : Constant_(Constant) {}
Guillaume Chatelet5ad29092018-09-18 11:26:27 +0000313
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000314 std::vector<llvm::MCInst> loadAndFinalize(unsigned Reg, unsigned RegBitWidth,
315 unsigned Opcode) {
Clement Courbet78b2e732018-09-25 07:31:44 +0000316 assert((RegBitWidth & 7) == 0 &&
317 "RegBitWidth must be a multiple of 8 bits");
318 initStack(RegBitWidth / 8);
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000319 add(loadToReg(Reg, Opcode));
Clement Courbet78b2e732018-09-25 07:31:44 +0000320 add(releaseStackSpace(RegBitWidth / 8));
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000321 return std::move(Instructions);
Guillaume Chatelet8721ad92018-09-18 11:26:35 +0000322 }
323
Clement Courbetc51f4522018-10-19 09:56:54 +0000324 std::vector<llvm::MCInst> loadX87STAndFinalize(unsigned Reg) {
325 initStack(kF80Bytes);
326 add(llvm::MCInstBuilder(llvm::X86::LD_F80m)
327 // Address = ESP
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000328 .addReg(llvm::X86::RSP) // BaseReg
329 .addImm(1) // ScaleAmt
330 .addReg(0) // IndexReg
331 .addImm(0) // Disp
332 .addReg(0)); // Segment
333 if (Reg != llvm::X86::ST0)
334 add(llvm::MCInstBuilder(llvm::X86::ST_Frr).addReg(Reg));
Clement Courbetc51f4522018-10-19 09:56:54 +0000335 add(releaseStackSpace(kF80Bytes));
336 return std::move(Instructions);
337 }
338
339 std::vector<llvm::MCInst> loadX87FPAndFinalize(unsigned Reg) {
340 initStack(kF80Bytes);
341 add(llvm::MCInstBuilder(llvm::X86::LD_Fp80m)
342 .addReg(Reg)
343 // Address = ESP
344 .addReg(llvm::X86::RSP) // BaseReg
345 .addImm(1) // ScaleAmt
346 .addReg(0) // IndexReg
347 .addImm(0) // Disp
348 .addReg(0)); // Segment
349 add(releaseStackSpace(kF80Bytes));
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000350 return std::move(Instructions);
351 }
352
353 std::vector<llvm::MCInst> popFlagAndFinalize() {
Clement Courbet78b2e732018-09-25 07:31:44 +0000354 initStack(8);
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000355 add(llvm::MCInstBuilder(llvm::X86::POPF64));
Simon Pilgrimf652ef32018-09-18 15:38:16 +0000356 return std::move(Instructions);
357 }
358
359private:
Clement Courbetc51f4522018-10-19 09:56:54 +0000360 static constexpr const unsigned kF80Bytes = 10; // 80 bits.
361
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000362 ConstantInliner &add(const llvm::MCInst &Inst) {
363 Instructions.push_back(Inst);
364 return *this;
365 }
366
Clement Courbet78b2e732018-09-25 07:31:44 +0000367 void initStack(unsigned Bytes) {
368 assert(Constant_.getBitWidth() <= Bytes * 8 &&
369 "Value does not have the correct size");
370 const llvm::APInt WideConstant = Constant_.getBitWidth() < Bytes * 8
371 ? Constant_.sext(Bytes * 8)
372 : Constant_;
373 add(allocateStackSpace(Bytes));
374 size_t ByteOffset = 0;
375 for (; Bytes - ByteOffset >= 4; ByteOffset += 4)
376 add(fillStackSpace(
377 llvm::X86::MOV32mi, ByteOffset,
378 WideConstant.extractBits(32, ByteOffset * 8).getZExtValue()));
379 if (Bytes - ByteOffset >= 2) {
380 add(fillStackSpace(
381 llvm::X86::MOV16mi, ByteOffset,
382 WideConstant.extractBits(16, ByteOffset * 8).getZExtValue()));
383 ByteOffset += 2;
384 }
385 if (Bytes - ByteOffset >= 1)
386 add(fillStackSpace(
387 llvm::X86::MOV8mi, ByteOffset,
388 WideConstant.extractBits(8, ByteOffset * 8).getZExtValue()));
389 }
390
391 llvm::APInt Constant_;
Guillaume Chatelet5ad29092018-09-18 11:26:27 +0000392 std::vector<llvm::MCInst> Instructions;
393};
394
Clement Courbet41c8af32018-10-25 07:44:01 +0000395#include "X86GenExegesis.inc"
396
Clement Courbet44b4c542018-06-19 11:28:59 +0000397class ExegesisX86Target : public ExegesisTarget {
Clement Courbet41c8af32018-10-25 07:44:01 +0000398public:
399 ExegesisX86Target() : ExegesisTarget(X86CpuPfmCounters) {}
400
401private:
Clement Courbet6fd00e32018-06-20 11:54:35 +0000402 void addTargetSpecificPasses(llvm::PassManagerBase &PM) const override {
403 // Lowers FP pseudo-instructions, e.g. ABS_Fp32 -> ABS_F.
Clement Courbet717c9762018-06-28 07:41:16 +0000404 PM.add(llvm::createX86FloatingPointStackifierPass());
Clement Courbet6fd00e32018-06-20 11:54:35 +0000405 }
406
Guillaume Chateletfb943542018-08-01 14:41:45 +0000407 unsigned getScratchMemoryRegister(const llvm::Triple &TT) const override {
408 if (!TT.isArch64Bit()) {
409 // FIXME: This would require popping from the stack, so we would have to
410 // add some additional setup code.
411 return 0;
412 }
413 return TT.isOSWindows() ? llvm::X86::RCX : llvm::X86::RDI;
414 }
415
416 unsigned getMaxMemoryAccessSize() const override { return 64; }
417
Guillaume Chatelet70ac0192018-09-27 09:23:04 +0000418 void fillMemoryOperands(InstructionTemplate &IT, unsigned Reg,
Guillaume Chateletfb943542018-08-01 14:41:45 +0000419 unsigned Offset) const override {
Clement Courbetc5448382018-11-07 16:14:55 +0000420 assert(!isInvalidMemoryInstr(IT.Instr) &&
421 "fillMemoryOperands requires a valid memory instruction");
422 int MemOpIdx = X86II::getMemoryOperandNo(IT.Instr.Description->TSFlags);
423 assert(MemOpIdx >= 0 && "invalid memory operand index");
424 // getMemoryOperandNo() ignores tied operands, so we have to add them back.
425 for (unsigned I = 0; I <= static_cast<unsigned>(MemOpIdx); ++I) {
426 const auto &Op = IT.Instr.Operands[I];
427 if (Op.isTied() && Op.getTiedToIndex() < I) {
428 ++MemOpIdx;
429 }
430 }
431 // Now fill in the memory operands.
432 const auto SetOp = [&IT](int OpIdx, const MCOperand &OpVal) {
433 const auto Op = IT.Instr.Operands[OpIdx];
434 assert(Op.isMemory() && Op.isExplicit() && "invalid memory pattern");
435 IT.getValueFor(Op) = OpVal;
436 };
437 SetOp(MemOpIdx + 0, MCOperand::createReg(Reg)); // BaseReg
438 SetOp(MemOpIdx + 1, MCOperand::createImm(1)); // ScaleAmt
439 SetOp(MemOpIdx + 2, MCOperand::createReg(0)); // IndexReg
440 SetOp(MemOpIdx + 3, MCOperand::createImm(Offset)); // Disp
441 SetOp(MemOpIdx + 4, MCOperand::createReg(0)); // Segment
Guillaume Chateletfb943542018-08-01 14:41:45 +0000442 }
443
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000444 std::vector<llvm::MCInst> setRegTo(const llvm::MCSubtargetInfo &STI,
445 unsigned Reg,
446 const llvm::APInt &Value) const override {
Guillaume Chatelet8721ad92018-09-18 11:26:35 +0000447 if (llvm::X86::GR8RegClass.contains(Reg))
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000448 return {loadImmediate(Reg, 8, Value)};
Guillaume Chatelet8721ad92018-09-18 11:26:35 +0000449 if (llvm::X86::GR16RegClass.contains(Reg))
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000450 return {loadImmediate(Reg, 16, Value)};
Guillaume Chatelet8721ad92018-09-18 11:26:35 +0000451 if (llvm::X86::GR32RegClass.contains(Reg))
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000452 return {loadImmediate(Reg, 32, Value)};
Guillaume Chatelet8721ad92018-09-18 11:26:35 +0000453 if (llvm::X86::GR64RegClass.contains(Reg))
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000454 return {loadImmediate(Reg, 64, Value)};
455 ConstantInliner CI(Value);
Guillaume Chatelet5ad29092018-09-18 11:26:27 +0000456 if (llvm::X86::VR64RegClass.contains(Reg))
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000457 return CI.loadAndFinalize(Reg, 64, llvm::X86::MMX_MOVQ64rm);
Guillaume Chatelet8721ad92018-09-18 11:26:35 +0000458 if (llvm::X86::VR128XRegClass.contains(Reg)) {
459 if (STI.getFeatureBits()[llvm::X86::FeatureAVX512])
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000460 return CI.loadAndFinalize(Reg, 128, llvm::X86::VMOVDQU32Z128rm);
Guillaume Chatelet8721ad92018-09-18 11:26:35 +0000461 if (STI.getFeatureBits()[llvm::X86::FeatureAVX])
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000462 return CI.loadAndFinalize(Reg, 128, llvm::X86::VMOVDQUrm);
463 return CI.loadAndFinalize(Reg, 128, llvm::X86::MOVDQUrm);
Guillaume Chatelet8721ad92018-09-18 11:26:35 +0000464 }
465 if (llvm::X86::VR256XRegClass.contains(Reg)) {
466 if (STI.getFeatureBits()[llvm::X86::FeatureAVX512])
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000467 return CI.loadAndFinalize(Reg, 256, llvm::X86::VMOVDQU32Z256rm);
468 if (STI.getFeatureBits()[llvm::X86::FeatureAVX])
469 return CI.loadAndFinalize(Reg, 256, llvm::X86::VMOVDQUYrm);
Guillaume Chatelet8721ad92018-09-18 11:26:35 +0000470 }
471 if (llvm::X86::VR512RegClass.contains(Reg))
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000472 if (STI.getFeatureBits()[llvm::X86::FeatureAVX512])
473 return CI.loadAndFinalize(Reg, 512, llvm::X86::VMOVDQU32Zrm);
474 if (llvm::X86::RSTRegClass.contains(Reg)) {
Clement Courbetc51f4522018-10-19 09:56:54 +0000475 return CI.loadX87STAndFinalize(Reg);
476 }
477 if (llvm::X86::RFP32RegClass.contains(Reg) ||
478 llvm::X86::RFP64RegClass.contains(Reg) ||
479 llvm::X86::RFP80RegClass.contains(Reg)) {
480 return CI.loadX87FPAndFinalize(Reg);
Guillaume Chatelet8721ad92018-09-18 11:26:35 +0000481 }
Guillaume Chateletc96a97b2018-09-20 12:22:18 +0000482 if (Reg == llvm::X86::EFLAGS)
483 return CI.popFlagAndFinalize();
484 return {}; // Not yet implemented.
Clement Courbeta51efc22018-06-25 13:12:02 +0000485 }
486
Clement Courbetd939f6d2018-09-13 07:40:53 +0000487 std::unique_ptr<SnippetGenerator>
488 createLatencySnippetGenerator(const LLVMState &State) const override {
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000489 return llvm::make_unique<X86LatencySnippetGenerator>(State);
Clement Courbet4860b982018-06-26 08:49:30 +0000490 }
491
Clement Courbetd939f6d2018-09-13 07:40:53 +0000492 std::unique_ptr<SnippetGenerator>
493 createUopsSnippetGenerator(const LLVMState &State) const override {
Guillaume Chatelet946fb052018-10-12 15:12:22 +0000494 return llvm::make_unique<X86UopsSnippetGenerator>(State);
Clement Courbet4860b982018-06-26 08:49:30 +0000495 }
496
Clement Courbet44b4c542018-06-19 11:28:59 +0000497 bool matchesArch(llvm::Triple::ArchType Arch) const override {
498 return Arch == llvm::Triple::x86_64 || Arch == llvm::Triple::x86;
499 }
500};
501
502} // namespace
503
Clement Courbetcff2caa2018-06-25 11:22:23 +0000504static ExegesisTarget *getTheExegesisX86Target() {
Clement Courbet44b4c542018-06-19 11:28:59 +0000505 static ExegesisX86Target Target;
506 return &Target;
507}
508
509void InitializeX86ExegesisTarget() {
510 ExegesisTarget::registerTarget(getTheExegesisX86Target());
511}
512
Clement Courbetcff2caa2018-06-25 11:22:23 +0000513} // namespace exegesis
Fangrui Song32401af2018-10-22 17:10:47 +0000514} // namespace llvm