blob: c1d8086e9d9b0d12923094db0631236ab31e3247 [file] [log] [blame]
Eugene Zelenko60433b62017-10-05 00:33:50 +00001//===- X86EvexToVex.cpp ---------------------------------------------------===//
Gadi Haber19c4fc52016-12-28 10:12:48 +00002// Compress EVEX instructions to VEX encoding when possible to reduce code size
3//
4// The LLVM Compiler Infrastructure
5//
6// This file is distributed under the University of Illinois Open Source
7// License. See LICENSE.TXT for details.
8//
Eugene Zelenko60433b62017-10-05 00:33:50 +00009//===----------------------------------------------------------------------===//
10//
Gadi Haber19c4fc52016-12-28 10:12:48 +000011/// \file
12/// This file defines the pass that goes over all AVX-512 instructions which
13/// are encoded using the EVEX prefix and if possible replaces them by their
14/// corresponding VEX encoding which is usually shorter by 2 bytes.
15/// EVEX instructions may be encoded via the VEX prefix when the AVX-512
16/// instruction has a corresponding AVX/AVX2 opcode and when it does not
Craig Topperfbb19852017-10-17 04:17:54 +000017/// use the xmm or the mask registers or xmm/ymm registers with indexes
Gadi Haber19c4fc52016-12-28 10:12:48 +000018/// higher than 15.
19/// The pass applies code reduction on the generated code for AVX-512 instrs.
Eugene Zelenko60433b62017-10-05 00:33:50 +000020//
21//===----------------------------------------------------------------------===//
Gadi Haber19c4fc52016-12-28 10:12:48 +000022
23#include "InstPrinter/X86InstComments.h"
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000024#include "MCTargetDesc/X86BaseInfo.h"
Gadi Haber19c4fc52016-12-28 10:12:48 +000025#include "X86.h"
Gadi Haber19c4fc52016-12-28 10:12:48 +000026#include "X86InstrInfo.h"
Gadi Haber19c4fc52016-12-28 10:12:48 +000027#include "X86Subtarget.h"
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000028#include "llvm/ADT/DenseMap.h"
29#include "llvm/ADT/StringRef.h"
30#include "llvm/CodeGen/MachineFunction.h"
31#include "llvm/CodeGen/MachineFunctionPass.h"
32#include "llvm/CodeGen/MachineInstr.h"
33#include "llvm/CodeGen/MachineOperand.h"
34#include "llvm/MC/MCInstrDesc.h"
35#include "llvm/Pass.h"
36#include <cassert>
37#include <cstdint>
Gadi Haber19c4fc52016-12-28 10:12:48 +000038
39using namespace llvm;
40
Ayman Musa850fc972017-03-07 08:11:19 +000041// Including the generated EVEX2VEX tables.
42struct X86EvexToVexCompressTableEntry {
43 uint16_t EvexOpcode;
44 uint16_t VexOpcode;
45};
46#include "X86GenEVEX2VEXTables.inc"
47
Gadi Haber19c4fc52016-12-28 10:12:48 +000048#define EVEX2VEX_DESC "Compressing EVEX instrs to VEX encoding when possible"
49#define EVEX2VEX_NAME "x86-evex-to-vex-compress"
50
51#define DEBUG_TYPE EVEX2VEX_NAME
52
53namespace {
54
55class EvexToVexInstPass : public MachineFunctionPass {
56
57 /// X86EvexToVexCompressTable - Evex to Vex encoding opcode map.
Eugene Zelenko60433b62017-10-05 00:33:50 +000058 using EvexToVexTableType = DenseMap<unsigned, uint16_t>;
Gadi Haber19c4fc52016-12-28 10:12:48 +000059 EvexToVexTableType EvexToVex128Table;
60 EvexToVexTableType EvexToVex256Table;
61
62 /// For EVEX instructions that can be encoded using VEX encoding, replace
63 /// them by the VEX encoding in order to reduce size.
64 bool CompressEvexToVexImpl(MachineInstr &MI) const;
65
66 /// For initializing the hash map tables of all AVX-512 EVEX
67 /// corresponding to AVX/AVX2 opcodes.
68 void AddTableEntry(EvexToVexTableType &EvexToVexTable, uint16_t EvexOp,
69 uint16_t VexOp);
70
71public:
72 static char ID;
73
Gadi Haber19c4fc52016-12-28 10:12:48 +000074 EvexToVexInstPass() : MachineFunctionPass(ID) {
75 initializeEvexToVexInstPassPass(*PassRegistry::getPassRegistry());
76
77 // Initialize the EVEX to VEX 128 table map.
78 for (X86EvexToVexCompressTableEntry Entry : X86EvexToVex128CompressTable) {
79 AddTableEntry(EvexToVex128Table, Entry.EvexOpcode, Entry.VexOpcode);
80 }
81
82 // Initialize the EVEX to VEX 256 table map.
83 for (X86EvexToVexCompressTableEntry Entry : X86EvexToVex256CompressTable) {
84 AddTableEntry(EvexToVex256Table, Entry.EvexOpcode, Entry.VexOpcode);
85 }
86 }
87
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000088 StringRef getPassName() const override { return EVEX2VEX_DESC; }
89
Gadi Haber19c4fc52016-12-28 10:12:48 +000090 /// Loop over all of the basic blocks, replacing EVEX instructions
91 /// by equivalent VEX instructions when possible for reducing code size.
92 bool runOnMachineFunction(MachineFunction &MF) override;
93
94 // This pass runs after regalloc and doesn't support VReg operands.
95 MachineFunctionProperties getRequiredProperties() const override {
96 return MachineFunctionProperties().set(
97 MachineFunctionProperties::Property::NoVRegs);
98 }
99
100private:
101 /// Machine instruction info used throughout the class.
102 const X86InstrInfo *TII;
103};
104
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000105} // end anonymous namespace
Gadi Haber19c4fc52016-12-28 10:12:48 +0000106
Eugene Zelenko60433b62017-10-05 00:33:50 +0000107char EvexToVexInstPass::ID = 0;
108
Gadi Haber19c4fc52016-12-28 10:12:48 +0000109bool EvexToVexInstPass::runOnMachineFunction(MachineFunction &MF) {
110 TII = MF.getSubtarget<X86Subtarget>().getInstrInfo();
111
112 const X86Subtarget &ST = MF.getSubtarget<X86Subtarget>();
113 if (!ST.hasAVX512())
114 return false;
115
116 bool Changed = false;
117
118 /// Go over all basic blocks in function and replace
119 /// EVEX encoded instrs by VEX encoding when possible.
120 for (MachineBasicBlock &MBB : MF) {
121
Simon Pilgrim60ea09e2017-09-05 12:32:16 +0000122 // Traverse the basic block.
123 for (MachineInstr &MI : MBB)
Gadi Haber19c4fc52016-12-28 10:12:48 +0000124 Changed |= CompressEvexToVexImpl(MI);
125 }
126
127 return Changed;
128}
129
130void EvexToVexInstPass::AddTableEntry(EvexToVexTableType &EvexToVexTable,
131 uint16_t EvexOp, uint16_t VexOp) {
132 EvexToVexTable[EvexOp] = VexOp;
133}
134
Craig Topper730414b2017-10-30 03:35:43 +0000135static bool usesExtendedRegister(const MachineInstr &MI) {
136 auto isHiRegIdx = [](unsigned Reg) {
137 // Check for XMM register with indexes between 16 - 31.
138 if (Reg >= X86::XMM16 && Reg <= X86::XMM31)
139 return true;
140
141 // Check for YMM register with indexes between 16 - 31.
142 if (Reg >= X86::YMM16 && Reg <= X86::YMM31)
143 return true;
144
145 return false;
146 };
147
148 // Check that operands are not ZMM regs or
149 // XMM/YMM regs with hi indexes between 16 - 31.
150 for (const MachineOperand &MO : MI.explicit_operands()) {
151 if (!MO.isReg())
152 continue;
153
154 unsigned Reg = MO.getReg();
155
156 assert(!(Reg >= X86::ZMM0 && Reg <= X86::ZMM31) &&
157 "ZMM instructions should not be in the EVEX->VEX tables");
158
159 if (isHiRegIdx(Reg))
160 return true;
161 }
162
163 return false;
164}
165
Craig Topper4e56ba22017-11-01 21:00:59 +0000166// Do any custom cleanup needed to finalize the conversion.
Craig Topperdf99baa2018-02-13 04:19:26 +0000167static bool performCustomAdjustments(MachineInstr &MI, unsigned NewOpc) {
Craig Topper4e56ba22017-11-01 21:00:59 +0000168 (void)NewOpc;
169 unsigned Opc = MI.getOpcode();
170 switch (Opc) {
171 case X86::VALIGNDZ128rri:
172 case X86::VALIGNDZ128rmi:
173 case X86::VALIGNQZ128rri:
Craig Toppere5d44ce2017-11-04 18:10:03 +0000174 case X86::VALIGNQZ128rmi: {
Craig Topper4e56ba22017-11-01 21:00:59 +0000175 assert((NewOpc == X86::VPALIGNRrri || NewOpc == X86::VPALIGNRrmi) &&
176 "Unexpected new opcode!");
177 unsigned Scale = (Opc == X86::VALIGNQZ128rri ||
178 Opc == X86::VALIGNQZ128rmi) ? 8 : 4;
179 MachineOperand &Imm = MI.getOperand(MI.getNumExplicitOperands()-1);
180 Imm.setImm(Imm.getImm() * Scale);
181 break;
182 }
Craig Toppere5d44ce2017-11-04 18:10:03 +0000183 case X86::VSHUFF32X4Z256rmi:
184 case X86::VSHUFF32X4Z256rri:
185 case X86::VSHUFF64X2Z256rmi:
186 case X86::VSHUFF64X2Z256rri:
187 case X86::VSHUFI32X4Z256rmi:
188 case X86::VSHUFI32X4Z256rri:
189 case X86::VSHUFI64X2Z256rmi:
190 case X86::VSHUFI64X2Z256rri: {
191 assert((NewOpc == X86::VPERM2F128rr || NewOpc == X86::VPERM2I128rr ||
192 NewOpc == X86::VPERM2F128rm || NewOpc == X86::VPERM2I128rm) &&
193 "Unexpected new opcode!");
194 MachineOperand &Imm = MI.getOperand(MI.getNumExplicitOperands()-1);
195 int64_t ImmVal = Imm.getImm();
196 // Set bit 5, move bit 1 to bit 4, copy bit 0.
197 Imm.setImm(0x20 | ((ImmVal & 2) << 3) | (ImmVal & 1));
198 break;
199 }
Craig Topperdf99baa2018-02-13 04:19:26 +0000200 case X86::VRNDSCALEPDZ128rri:
201 case X86::VRNDSCALEPDZ128rmi:
202 case X86::VRNDSCALEPSZ128rri:
203 case X86::VRNDSCALEPSZ128rmi:
204 case X86::VRNDSCALEPDZ256rri:
205 case X86::VRNDSCALEPDZ256rmi:
206 case X86::VRNDSCALEPSZ256rri:
207 case X86::VRNDSCALEPSZ256rmi:
208 case X86::VRNDSCALESDr:
209 case X86::VRNDSCALESDm:
210 case X86::VRNDSCALESSr:
211 case X86::VRNDSCALESSm:
212 case X86::VRNDSCALESDr_Int:
213 case X86::VRNDSCALESDm_Int:
214 case X86::VRNDSCALESSr_Int:
215 case X86::VRNDSCALESSm_Int:
216 const MachineOperand &Imm = MI.getOperand(MI.getNumExplicitOperands()-1);
217 int64_t ImmVal = Imm.getImm();
218 // Ensure that only bits 3:0 of the immediate are used.
219 if ((ImmVal & 0xf) != ImmVal)
220 return false;
221 break;
Craig Toppere5d44ce2017-11-04 18:10:03 +0000222 }
Craig Topperdf99baa2018-02-13 04:19:26 +0000223
224 return true;
Craig Topper4e56ba22017-11-01 21:00:59 +0000225}
226
Craig Topper730414b2017-10-30 03:35:43 +0000227
Gadi Haber19c4fc52016-12-28 10:12:48 +0000228// For EVEX instructions that can be encoded using VEX encoding
229// replace them by the VEX encoding in order to reduce size.
230bool EvexToVexInstPass::CompressEvexToVexImpl(MachineInstr &MI) const {
Gadi Haber19c4fc52016-12-28 10:12:48 +0000231 // VEX format.
232 // # of bytes: 0,2,3 1 1 0,1 0,1,2,4 0,1
233 // [Prefixes] [VEX] OPCODE ModR/M [SIB] [DISP] [IMM]
234 //
235 // EVEX format.
236 // # of bytes: 4 1 1 1 4 / 1 1
237 // [Prefixes] EVEX Opcode ModR/M [SIB] [Disp32] / [Disp8*N] [Immediate]
238
239 const MCInstrDesc &Desc = MI.getDesc();
240
241 // Check for EVEX instructions only.
242 if ((Desc.TSFlags & X86II::EncodingMask) != X86II::EVEX)
243 return false;
Simon Pilgrim60ea09e2017-09-05 12:32:16 +0000244
245 // Check for EVEX instructions with mask or broadcast as in these cases
246 // the EVEX prefix is needed in order to carry this information
Gadi Haber19c4fc52016-12-28 10:12:48 +0000247 // thus preventing the transformation to VEX encoding.
248 if (Desc.TSFlags & (X86II::EVEX_K | X86II::EVEX_B))
249 return false;
Simon Pilgrim60ea09e2017-09-05 12:32:16 +0000250
Gadi Haber19c4fc52016-12-28 10:12:48 +0000251 // Check for non EVEX_V512 instrs only.
252 // EVEX_V512 instr: bit EVEX_L2 = 1; bit VEX_L = 0.
253 if ((Desc.TSFlags & X86II::EVEX_L2) && !(Desc.TSFlags & X86II::VEX_L))
Simon Pilgrim60ea09e2017-09-05 12:32:16 +0000254 return false;
255
Gadi Haber19c4fc52016-12-28 10:12:48 +0000256 // EVEX_V128 instr: bit EVEX_L2 = 0, bit VEX_L = 0.
257 bool IsEVEX_V128 =
258 (!(Desc.TSFlags & X86II::EVEX_L2) && !(Desc.TSFlags & X86II::VEX_L));
259
260 // EVEX_V256 instr: bit EVEX_L2 = 0, bit VEX_L = 1.
261 bool IsEVEX_V256 =
262 (!(Desc.TSFlags & X86II::EVEX_L2) && (Desc.TSFlags & X86II::VEX_L));
263
264 unsigned NewOpc = 0;
265
266 // Check for EVEX_V256 instructions.
267 if (IsEVEX_V256) {
268 // Search for opcode in the EvexToVex256 table.
269 auto It = EvexToVex256Table.find(MI.getOpcode());
270 if (It != EvexToVex256Table.end())
271 NewOpc = It->second;
272 }
Gadi Haber19c4fc52016-12-28 10:12:48 +0000273 // Check for EVEX_V128 or Scalar instructions.
274 else if (IsEVEX_V128) {
275 // Search for opcode in the EvexToVex128 table.
276 auto It = EvexToVex128Table.find(MI.getOpcode());
277 if (It != EvexToVex128Table.end())
278 NewOpc = It->second;
279 }
280
281 if (!NewOpc)
282 return false;
283
Craig Topper730414b2017-10-30 03:35:43 +0000284 if (usesExtendedRegister(MI))
Gadi Haber19c4fc52016-12-28 10:12:48 +0000285 return false;
Simon Pilgrim60ea09e2017-09-05 12:32:16 +0000286
Craig Topperdf99baa2018-02-13 04:19:26 +0000287 if (!performCustomAdjustments(MI, NewOpc))
288 return false;
Craig Topper4e56ba22017-11-01 21:00:59 +0000289
Craig Topperc84835532017-10-30 03:35:44 +0000290 MI.setDesc(TII->get(NewOpc));
Craig Topperf27016f2018-03-10 05:15:22 +0000291 MI.setAsmPrinterFlag(X86::AC_EVEX_2_VEX);
Simon Pilgrim60ea09e2017-09-05 12:32:16 +0000292 return true;
Gadi Haber19c4fc52016-12-28 10:12:48 +0000293}
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000294
295INITIALIZE_PASS(EvexToVexInstPass, EVEX2VEX_NAME, EVEX2VEX_DESC, false, false)
296
297FunctionPass *llvm::createX86EvexToVexInsts() {
298 return new EvexToVexInstPass();
299}