blob: 651925e616f9a98fab31c8d6eef8b67e989853fa [file] [log] [blame]
Tim Northover69fa84a2016-10-14 22:18:18 +00001//===- AArch64LegalizerInfo.cpp ----------------------------------*- C++ -*-==//
Tim Northover33b07d62016-07-22 20:03:43 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9/// \file
10/// This file implements the targeting of the Machinelegalizer class for
11/// AArch64.
12/// \todo This should be generated by TableGen.
13//===----------------------------------------------------------------------===//
14
Tim Northover69fa84a2016-10-14 22:18:18 +000015#include "AArch64LegalizerInfo.h"
Tim Northover91366172017-02-15 23:22:50 +000016#include "llvm/CodeGen/MachineInstr.h"
17#include "llvm/CodeGen/MachineRegisterInfo.h"
Tim Northover33b07d62016-07-22 20:03:43 +000018#include "llvm/CodeGen/ValueTypes.h"
Tim Northover91366172017-02-15 23:22:50 +000019#include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"
Tim Northover33b07d62016-07-22 20:03:43 +000020#include "llvm/IR/Type.h"
21#include "llvm/IR/DerivedTypes.h"
22#include "llvm/Target/TargetOpcodes.h"
23
24using namespace llvm;
25
26#ifndef LLVM_BUILD_GLOBAL_ISEL
27#error "You shouldn't build this"
28#endif
29
Tim Northover69fa84a2016-10-14 22:18:18 +000030AArch64LegalizerInfo::AArch64LegalizerInfo() {
Ahmed Bougachaad30db32016-08-02 15:10:28 +000031 using namespace TargetOpcode;
Tim Northover5ae83502016-09-15 09:20:34 +000032 const LLT p0 = LLT::pointer(0, 64);
Tim Northoverea904f92016-08-19 22:40:00 +000033 const LLT s1 = LLT::scalar(1);
Tim Northover9656f142016-08-04 20:54:13 +000034 const LLT s8 = LLT::scalar(8);
35 const LLT s16 = LLT::scalar(16);
Ahmed Bougachaad30db32016-08-02 15:10:28 +000036 const LLT s32 = LLT::scalar(32);
37 const LLT s64 = LLT::scalar(64);
38 const LLT v2s32 = LLT::vector(2, 32);
39 const LLT v4s32 = LLT::vector(4, 32);
40 const LLT v2s64 = LLT::vector(2, 64);
41
Quentin Colombet24203cf2017-01-27 01:13:30 +000042 for (unsigned BinOp : {G_ADD, G_SUB, G_MUL, G_AND, G_OR, G_XOR, G_SHL}) {
Tim Northoverfe880a82016-08-25 17:37:39 +000043 // These operations naturally get the right answer when used on
44 // GPR32, even if the actual type is narrower.
Ahmed Bougachacfb384d2017-01-23 21:10:05 +000045 for (auto Ty : {s32, s64, v2s32, v4s32, v2s64})
Quentin Colombete15e4602017-01-27 01:13:25 +000046 setAction({BinOp, Ty}, Legal);
Ahmed Bougachacfb384d2017-01-23 21:10:05 +000047
48 for (auto Ty : {s1, s8, s16})
Quentin Colombete15e4602017-01-27 01:13:25 +000049 setAction({BinOp, Ty}, WidenScalar);
Tim Northover9656f142016-08-04 20:54:13 +000050 }
51
Quentin Colombete15e4602017-01-27 01:13:25 +000052 setAction({G_GEP, p0}, Legal);
53 setAction({G_GEP, 1, s64}, Legal);
Tim Northover22d82cf2016-09-15 11:02:19 +000054
55 for (auto Ty : {s1, s8, s16, s32})
Quentin Colombete15e4602017-01-27 01:13:25 +000056 setAction({G_GEP, 1, Ty}, WidenScalar);
Tim Northover22d82cf2016-09-15 11:02:19 +000057
Tim Northover398c5f52017-02-14 20:56:29 +000058 setAction({G_PTR_MASK, p0}, Legal);
59
Quentin Colombet24203cf2017-01-27 01:13:30 +000060 for (unsigned BinOp : {G_LSHR, G_ASHR, G_SDIV, G_UDIV}) {
Ahmed Bougacha2ac5bf92016-08-16 14:02:47 +000061 for (auto Ty : {s32, s64})
Quentin Colombete15e4602017-01-27 01:13:25 +000062 setAction({BinOp, Ty}, Legal);
Ahmed Bougacha2ac5bf92016-08-16 14:02:47 +000063
Tim Northover7a753d92016-08-26 17:46:06 +000064 for (auto Ty : {s1, s8, s16})
Quentin Colombete15e4602017-01-27 01:13:25 +000065 setAction({BinOp, Ty}, WidenScalar);
Tim Northover7a753d92016-08-26 17:46:06 +000066 }
67
Quentin Colombet24203cf2017-01-27 01:13:30 +000068 for (unsigned BinOp : {G_SREM, G_UREM})
Tim Northovercecee562016-08-26 17:46:13 +000069 for (auto Ty : { s1, s8, s16, s32, s64 })
Quentin Colombete15e4602017-01-27 01:13:25 +000070 setAction({BinOp, Ty}, Lower);
Tim Northovercecee562016-08-26 17:46:13 +000071
Tim Northover0a9b2792017-02-08 21:22:15 +000072 for (unsigned Op : {G_SMULO, G_UMULO})
73 setAction({Op, s64}, Lower);
74
75 for (unsigned Op : {G_UADDE, G_USUBE, G_SADDO, G_SSUBO, G_SMULH, G_UMULH}) {
Tim Northover438c77c2016-08-25 17:37:32 +000076 for (auto Ty : { s32, s64 })
Quentin Colombete15e4602017-01-27 01:13:25 +000077 setAction({Op, Ty}, Legal);
Tim Northover438c77c2016-08-25 17:37:32 +000078
Quentin Colombete15e4602017-01-27 01:13:25 +000079 setAction({Op, 1, s1}, Legal);
Tim Northoverd8a6d7c2016-08-25 17:37:41 +000080 }
81
Quentin Colombet24203cf2017-01-27 01:13:30 +000082 for (unsigned BinOp : {G_FADD, G_FSUB, G_FMUL, G_FDIV})
Ahmed Bougacha33e19fe2016-08-18 16:05:11 +000083 for (auto Ty : {s32, s64})
Quentin Colombete15e4602017-01-27 01:13:25 +000084 setAction({BinOp, Ty}, Legal);
Ahmed Bougacha33e19fe2016-08-18 16:05:11 +000085
Tim Northovere0418412017-02-08 23:23:39 +000086 for (unsigned BinOp : {G_FREM, G_FPOW}) {
87 setAction({BinOp, s32}, Libcall);
88 setAction({BinOp, s64}, Libcall);
89 }
Tim Northoveredb3c8c2016-08-29 19:07:16 +000090
Tim Northover0e6afbd2017-02-06 21:56:47 +000091 // FIXME: what should we do about G_INSERTs with more than one source value?
92 // For now the default of not specifying means we'll fall back.
93 for (auto Ty : {s32, s64}) {
94 setAction({G_INSERT, Ty}, Legal);
95 setAction({G_INSERT, 1, Ty}, Legal);
96 }
97 for (auto Ty : {s1, s8, s16}) {
98 setAction({G_INSERT, Ty}, WidenScalar);
99 // FIXME: Can't widen the sources because that violates the constraints on
100 // G_INSERT (It seems entirely reasonable that inputs shouldn't overlap).
101 }
102
Quentin Colombet24203cf2017-01-27 01:13:30 +0000103 for (unsigned MemOp : {G_LOAD, G_STORE}) {
Quentin Colombetd3126d52016-10-11 00:21:08 +0000104 for (auto Ty : {s8, s16, s32, s64, p0, v2s32})
Quentin Colombete15e4602017-01-27 01:13:25 +0000105 setAction({MemOp, Ty}, Legal);
Ahmed Bougachaad30db32016-08-02 15:10:28 +0000106
Quentin Colombete15e4602017-01-27 01:13:25 +0000107 setAction({MemOp, s1}, WidenScalar);
Tim Northovera01bece2016-08-23 19:30:42 +0000108
109 // And everything's fine in addrspace 0.
Quentin Colombete15e4602017-01-27 01:13:25 +0000110 setAction({MemOp, 1, p0}, Legal);
Tim Northover3c73e362016-08-23 18:20:09 +0000111 }
112
Tim Northoverb3a0be42016-08-23 21:01:20 +0000113 // Constants
Tim Northoverea904f92016-08-19 22:40:00 +0000114 for (auto Ty : {s32, s64}) {
Quentin Colombete15e4602017-01-27 01:13:25 +0000115 setAction({TargetOpcode::G_CONSTANT, Ty}, Legal);
116 setAction({TargetOpcode::G_FCONSTANT, Ty}, Legal);
Tim Northoverea904f92016-08-19 22:40:00 +0000117 }
118
Quentin Colombete15e4602017-01-27 01:13:25 +0000119 setAction({G_CONSTANT, p0}, Legal);
Tim Northover7a1ec012016-08-25 17:37:35 +0000120
Tim Northoverea904f92016-08-19 22:40:00 +0000121 for (auto Ty : {s1, s8, s16})
Quentin Colombete15e4602017-01-27 01:13:25 +0000122 setAction({TargetOpcode::G_CONSTANT, Ty}, WidenScalar);
Tim Northoverea904f92016-08-19 22:40:00 +0000123
Quentin Colombete15e4602017-01-27 01:13:25 +0000124 setAction({TargetOpcode::G_FCONSTANT, s16}, WidenScalar);
Tim Northover9656f142016-08-04 20:54:13 +0000125
Quentin Colombete15e4602017-01-27 01:13:25 +0000126 setAction({G_ICMP, s1}, Legal);
127 setAction({G_ICMP, 1, s32}, Legal);
128 setAction({G_ICMP, 1, s64}, Legal);
129 setAction({G_ICMP, 1, p0}, Legal);
Tim Northover6cd4b232016-08-23 21:01:26 +0000130
Tim Northover051b8ad2016-08-26 17:46:17 +0000131 for (auto Ty : {s1, s8, s16}) {
Quentin Colombete15e4602017-01-27 01:13:25 +0000132 setAction({G_ICMP, 1, Ty}, WidenScalar);
Tim Northover6cd4b232016-08-23 21:01:26 +0000133 }
134
Quentin Colombete15e4602017-01-27 01:13:25 +0000135 setAction({G_FCMP, s1}, Legal);
136 setAction({G_FCMP, 1, s32}, Legal);
137 setAction({G_FCMP, 1, s64}, Legal);
Tim Northover30bd36e2016-08-26 17:46:19 +0000138
Tim Northover2c4a8382016-08-25 17:37:25 +0000139 // Extensions
140 for (auto Ty : { s1, s8, s16, s32, s64 }) {
Quentin Colombete15e4602017-01-27 01:13:25 +0000141 setAction({G_ZEXT, Ty}, Legal);
142 setAction({G_SEXT, Ty}, Legal);
143 setAction({G_ANYEXT, Ty}, Legal);
Tim Northover2c4a8382016-08-25 17:37:25 +0000144 }
145
146 for (auto Ty : { s1, s8, s16, s32 }) {
Quentin Colombete15e4602017-01-27 01:13:25 +0000147 setAction({G_ZEXT, 1, Ty}, Legal);
148 setAction({G_SEXT, 1, Ty}, Legal);
149 setAction({G_ANYEXT, 1, Ty}, Legal);
Tim Northover2c4a8382016-08-25 17:37:25 +0000150 }
151
Quentin Colombete15e4602017-01-27 01:13:25 +0000152 setAction({G_FPEXT, s64}, Legal);
153 setAction({G_FPEXT, 1, s32}, Legal);
Tim Northoverbc1701c2016-08-26 17:46:22 +0000154
Tim Northover438c77c2016-08-25 17:37:32 +0000155 // Truncations
156 for (auto Ty : { s16, s32 })
Quentin Colombete15e4602017-01-27 01:13:25 +0000157 setAction({G_FPTRUNC, Ty}, Legal);
Tim Northover438c77c2016-08-25 17:37:32 +0000158
159 for (auto Ty : { s32, s64 })
Quentin Colombete15e4602017-01-27 01:13:25 +0000160 setAction({G_FPTRUNC, 1, Ty}, Legal);
Tim Northover438c77c2016-08-25 17:37:32 +0000161
162 for (auto Ty : { s1, s8, s16, s32 })
Quentin Colombete15e4602017-01-27 01:13:25 +0000163 setAction({G_TRUNC, Ty}, Legal);
Tim Northover438c77c2016-08-25 17:37:32 +0000164
165 for (auto Ty : { s8, s16, s32, s64 })
Quentin Colombete15e4602017-01-27 01:13:25 +0000166 setAction({G_TRUNC, 1, Ty}, Legal);
Tim Northover438c77c2016-08-25 17:37:32 +0000167
Tim Northover5d0eaa42016-08-26 17:45:58 +0000168 // Conversions
Ahmed Bougachad2948232017-01-20 01:37:24 +0000169 for (auto Ty : { s32, s64 }) {
Quentin Colombete15e4602017-01-27 01:13:25 +0000170 setAction({G_FPTOSI, 0, Ty}, Legal);
171 setAction({G_FPTOUI, 0, Ty}, Legal);
172 setAction({G_SITOFP, 1, Ty}, Legal);
173 setAction({G_UITOFP, 1, Ty}, Legal);
Tim Northover5d0eaa42016-08-26 17:45:58 +0000174 }
Ahmed Bougachad2948232017-01-20 01:37:24 +0000175 for (auto Ty : { s1, s8, s16 }) {
Quentin Colombete15e4602017-01-27 01:13:25 +0000176 setAction({G_FPTOSI, 0, Ty}, WidenScalar);
177 setAction({G_FPTOUI, 0, Ty}, WidenScalar);
178 setAction({G_SITOFP, 1, Ty}, WidenScalar);
179 setAction({G_UITOFP, 1, Ty}, WidenScalar);
Ahmed Bougachad2948232017-01-20 01:37:24 +0000180 }
Tim Northover5d0eaa42016-08-26 17:45:58 +0000181
182 for (auto Ty : { s32, s64 }) {
Quentin Colombete15e4602017-01-27 01:13:25 +0000183 setAction({G_FPTOSI, 1, Ty}, Legal);
184 setAction({G_FPTOUI, 1, Ty}, Legal);
185 setAction({G_SITOFP, 0, Ty}, Legal);
186 setAction({G_UITOFP, 0, Ty}, Legal);
Tim Northover5d0eaa42016-08-26 17:45:58 +0000187 }
Tim Northover438c77c2016-08-25 17:37:32 +0000188
Tim Northoverb3a0be42016-08-23 21:01:20 +0000189 // Control-flow
Tim Northover6aacd272016-10-12 22:48:36 +0000190 for (auto Ty : {s1, s8, s16, s32})
Quentin Colombete15e4602017-01-27 01:13:25 +0000191 setAction({G_BRCOND, Ty}, Legal);
Kristof Beyls65a12c02017-01-30 09:13:18 +0000192 setAction({G_BRINDIRECT, p0}, Legal);
Ahmed Bougachaad30db32016-08-02 15:10:28 +0000193
Tim Northover1d18a992016-08-26 17:46:03 +0000194 // Select
Tim Northover868332d2017-02-06 23:41:27 +0000195 for (auto Ty : {s1, s8, s16})
196 setAction({G_SELECT, Ty}, WidenScalar);
197
198 for (auto Ty : {s32, s64, p0})
Quentin Colombete15e4602017-01-27 01:13:25 +0000199 setAction({G_SELECT, Ty}, Legal);
Tim Northover1d18a992016-08-26 17:46:03 +0000200
Quentin Colombete15e4602017-01-27 01:13:25 +0000201 setAction({G_SELECT, 1, s1}, Legal);
Tim Northover1d18a992016-08-26 17:46:03 +0000202
Tim Northoverb3a0be42016-08-23 21:01:20 +0000203 // Pointer-handling
Quentin Colombete15e4602017-01-27 01:13:25 +0000204 setAction({G_FRAME_INDEX, p0}, Legal);
205 setAction({G_GLOBAL_VALUE, p0}, Legal);
Ahmed Bougacha0306b5e2016-08-16 14:02:42 +0000206
Tim Northover037af52c2016-10-31 18:31:09 +0000207 for (auto Ty : {s1, s8, s16, s32, s64})
Quentin Colombete15e4602017-01-27 01:13:25 +0000208 setAction({G_PTRTOINT, 0, Ty}, Legal);
Tim Northover037af52c2016-10-31 18:31:09 +0000209
Quentin Colombete15e4602017-01-27 01:13:25 +0000210 setAction({G_PTRTOINT, 1, p0}, Legal);
Tim Northovera01bece2016-08-23 19:30:42 +0000211
Quentin Colombete15e4602017-01-27 01:13:25 +0000212 setAction({G_INTTOPTR, 0, p0}, Legal);
213 setAction({G_INTTOPTR, 1, s64}, Legal);
Tim Northover456a3c02016-08-23 19:30:38 +0000214
Quentin Colombet404e4352016-10-12 03:57:43 +0000215 // Casts for 32 and 64-bit width type are just copies.
Tim Northoverc1d8c2b2016-10-11 22:29:23 +0000216 for (auto Ty : {s1, s8, s16, s32, s64}) {
Quentin Colombete15e4602017-01-27 01:13:25 +0000217 setAction({G_BITCAST, 0, Ty}, Legal);
218 setAction({G_BITCAST, 1, Ty}, Legal);
Tim Northoverc1d8c2b2016-10-11 22:29:23 +0000219 }
220
Quentin Colombetdb643d92016-10-13 00:12:01 +0000221 // For the sake of copying bits around, the type does not really
222 // matter as long as it fits a register.
Tim Northoverc1d8c2b2016-10-11 22:29:23 +0000223 for (int EltSize = 8; EltSize <= 64; EltSize *= 2) {
Quentin Colombete15e4602017-01-27 01:13:25 +0000224 setAction({G_BITCAST, 0, LLT::vector(128/EltSize, EltSize)}, Legal);
225 setAction({G_BITCAST, 1, LLT::vector(128/EltSize, EltSize)}, Legal);
Quentin Colombetdb643d92016-10-13 00:12:01 +0000226 if (EltSize >= 64)
Tim Northoverc1d8c2b2016-10-11 22:29:23 +0000227 continue;
228
Quentin Colombete15e4602017-01-27 01:13:25 +0000229 setAction({G_BITCAST, 0, LLT::vector(64/EltSize, EltSize)}, Legal);
230 setAction({G_BITCAST, 1, LLT::vector(64/EltSize, EltSize)}, Legal);
Quentin Colombetdb643d92016-10-13 00:12:01 +0000231 if (EltSize >= 32)
232 continue;
233
Quentin Colombete15e4602017-01-27 01:13:25 +0000234 setAction({G_BITCAST, 0, LLT::vector(32/EltSize, EltSize)}, Legal);
235 setAction({G_BITCAST, 1, LLT::vector(32/EltSize, EltSize)}, Legal);
Tim Northoverc1d8c2b2016-10-11 22:29:23 +0000236 }
237
Tim Northovere9600d82017-02-08 17:57:27 +0000238 setAction({G_VASTART, p0}, Legal);
239
Tim Northover91366172017-02-15 23:22:50 +0000240 // va_list must be a pointer, but most sized types are pretty easy to handle
241 // as the destination.
242 setAction({G_VAARG, 1, p0}, Legal);
243
244 for (auto Ty : {s8, s16, s32, s64, p0})
245 setAction({G_VAARG, Ty}, Custom);
246
Tim Northover33b07d62016-07-22 20:03:43 +0000247 computeTables();
248}
Tim Northover91366172017-02-15 23:22:50 +0000249
250bool AArch64LegalizerInfo::legalizeCustom(MachineInstr &MI,
251 MachineRegisterInfo &MRI,
252 MachineIRBuilder &MIRBuilder) const {
253 switch (MI.getOpcode()) {
254 default:
255 // No idea what to do.
256 return false;
257 case TargetOpcode::G_VAARG:
258 return legalizeVaArg(MI, MRI, MIRBuilder);
259 }
260
261 llvm_unreachable("expected switch to return");
262}
263
264bool AArch64LegalizerInfo::legalizeVaArg(MachineInstr &MI,
265 MachineRegisterInfo &MRI,
266 MachineIRBuilder &MIRBuilder) const {
267 MIRBuilder.setInstr(MI);
268 MachineFunction &MF = MIRBuilder.getMF();
269 unsigned Align = MI.getOperand(2).getImm();
270 unsigned Dst = MI.getOperand(0).getReg();
271 unsigned ListPtr = MI.getOperand(1).getReg();
272
273 LLT PtrTy = MRI.getType(ListPtr);
274 LLT IntPtrTy = LLT::scalar(PtrTy.getSizeInBits());
275
276 const unsigned PtrSize = PtrTy.getSizeInBits() / 8;
277 unsigned List = MRI.createGenericVirtualRegister(PtrTy);
278 MIRBuilder.buildLoad(
279 List, ListPtr,
280 *MF.getMachineMemOperand(MachinePointerInfo(), MachineMemOperand::MOLoad,
281 PtrSize, /* Align = */ PtrSize));
282
283 unsigned DstPtr;
284 if (Align > PtrSize) {
285 // Realign the list to the actual required alignment.
286 unsigned AlignMinus1 = MRI.createGenericVirtualRegister(IntPtrTy);
287 MIRBuilder.buildConstant(AlignMinus1, Align - 1);
288
289 unsigned ListTmp = MRI.createGenericVirtualRegister(PtrTy);
290 MIRBuilder.buildGEP(ListTmp, List, AlignMinus1);
291
292 DstPtr = MRI.createGenericVirtualRegister(PtrTy);
293 MIRBuilder.buildPtrMask(DstPtr, ListTmp, Log2_64(Align));
294 } else
295 DstPtr = List;
296
297 uint64_t ValSize = MRI.getType(Dst).getSizeInBits() / 8;
298 MIRBuilder.buildLoad(
299 Dst, DstPtr,
300 *MF.getMachineMemOperand(MachinePointerInfo(), MachineMemOperand::MOLoad,
301 ValSize, std::max(Align, PtrSize)));
302
303 unsigned SizeReg = MRI.createGenericVirtualRegister(IntPtrTy);
304 MIRBuilder.buildConstant(SizeReg, alignTo(ValSize, PtrSize));
305
306 unsigned NewList = MRI.createGenericVirtualRegister(PtrTy);
307 MIRBuilder.buildGEP(NewList, DstPtr, SizeReg);
308
309 MIRBuilder.buildStore(
310 NewList, ListPtr,
311 *MF.getMachineMemOperand(MachinePointerInfo(), MachineMemOperand::MOStore,
312 PtrSize, /* Align = */ PtrSize));
313
314 MI.eraseFromParent();
315 return true;
316}