blob: 197bf25658458656401a6e5bd0bdfb1e0e87643a [file] [log] [blame]
Tim Northover69fa84a2016-10-14 22:18:18 +00001//===-- llvm/CodeGen/GlobalISel/LegalizerHelper.cpp -----------------------===//
Tim Northover33b07d62016-07-22 20:03:43 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Tim Northover69fa84a2016-10-14 22:18:18 +000010/// \file This file implements the LegalizerHelper class to legalize
Tim Northover33b07d62016-07-22 20:03:43 +000011/// individual instructions and the LegalizeMachineIR wrapper pass for the
12/// primary legalization.
13//
14//===----------------------------------------------------------------------===//
15
Tim Northover69fa84a2016-10-14 22:18:18 +000016#include "llvm/CodeGen/GlobalISel/LegalizerHelper.h"
Tim Northoveredb3c8c2016-08-29 19:07:16 +000017#include "llvm/CodeGen/GlobalISel/CallLowering.h"
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +000018#include "llvm/CodeGen/GlobalISel/GISelChangeObserver.h"
Tim Northover69fa84a2016-10-14 22:18:18 +000019#include "llvm/CodeGen/GlobalISel/LegalizerInfo.h"
Tim Northover33b07d62016-07-22 20:03:43 +000020#include "llvm/CodeGen/MachineRegisterInfo.h"
Aditya Nandakumarc0333f72018-08-21 17:30:31 +000021#include "llvm/CodeGen/TargetInstrInfo.h"
David Blaikieb3bde2e2017-11-17 01:07:10 +000022#include "llvm/CodeGen/TargetLowering.h"
23#include "llvm/CodeGen/TargetSubtargetInfo.h"
Tim Northover33b07d62016-07-22 20:03:43 +000024#include "llvm/Support/Debug.h"
Aditya Nandakumarc0333f72018-08-21 17:30:31 +000025#include "llvm/Support/MathExtras.h"
Tim Northover33b07d62016-07-22 20:03:43 +000026#include "llvm/Support/raw_ostream.h"
Tim Northover33b07d62016-07-22 20:03:43 +000027
Daniel Sanders5377fb32017-04-20 15:46:12 +000028#define DEBUG_TYPE "legalizer"
Tim Northover33b07d62016-07-22 20:03:43 +000029
30using namespace llvm;
Daniel Sanders9ade5592018-01-29 17:37:29 +000031using namespace LegalizeActions;
Tim Northover33b07d62016-07-22 20:03:43 +000032
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +000033LegalizerHelper::LegalizerHelper(MachineFunction &MF,
34 GISelChangeObserver &Observer)
35 : MRI(MF.getRegInfo()), LI(*MF.getSubtarget().getLegalizerInfo()),
36 Observer(Observer) {
Tim Northover33b07d62016-07-22 20:03:43 +000037 MIRBuilder.setMF(MF);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +000038 MIRBuilder.setChangeObserver(Observer);
Tim Northover33b07d62016-07-22 20:03:43 +000039}
40
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +000041LegalizerHelper::LegalizerHelper(MachineFunction &MF, const LegalizerInfo &LI,
42 GISelChangeObserver &Observer)
43 : MRI(MF.getRegInfo()), LI(LI), Observer(Observer) {
Aditya Nandakumarc0333f72018-08-21 17:30:31 +000044 MIRBuilder.setMF(MF);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +000045 MIRBuilder.setChangeObserver(Observer);
Aditya Nandakumarc0333f72018-08-21 17:30:31 +000046}
Tim Northover69fa84a2016-10-14 22:18:18 +000047LegalizerHelper::LegalizeResult
Volkan Keles685fbda2017-03-10 18:34:57 +000048LegalizerHelper::legalizeInstrStep(MachineInstr &MI) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +000049 LLVM_DEBUG(dbgs() << "Legalizing: "; MI.print(dbgs()));
Daniel Sanders5377fb32017-04-20 15:46:12 +000050
Daniel Sanders262ed0e2018-01-24 17:17:46 +000051 auto Step = LI.getAction(MI, MRI);
52 switch (Step.Action) {
Daniel Sanders9ade5592018-01-29 17:37:29 +000053 case Legal:
Nicola Zaghend34e60c2018-05-14 12:53:11 +000054 LLVM_DEBUG(dbgs() << ".. Already legal\n");
Tim Northover33b07d62016-07-22 20:03:43 +000055 return AlreadyLegal;
Daniel Sanders9ade5592018-01-29 17:37:29 +000056 case Libcall:
Nicola Zaghend34e60c2018-05-14 12:53:11 +000057 LLVM_DEBUG(dbgs() << ".. Convert to libcall\n");
Tim Northoveredb3c8c2016-08-29 19:07:16 +000058 return libcall(MI);
Daniel Sanders9ade5592018-01-29 17:37:29 +000059 case NarrowScalar:
Nicola Zaghend34e60c2018-05-14 12:53:11 +000060 LLVM_DEBUG(dbgs() << ".. Narrow scalar\n");
Daniel Sanders262ed0e2018-01-24 17:17:46 +000061 return narrowScalar(MI, Step.TypeIdx, Step.NewType);
Daniel Sanders9ade5592018-01-29 17:37:29 +000062 case WidenScalar:
Nicola Zaghend34e60c2018-05-14 12:53:11 +000063 LLVM_DEBUG(dbgs() << ".. Widen scalar\n");
Daniel Sanders262ed0e2018-01-24 17:17:46 +000064 return widenScalar(MI, Step.TypeIdx, Step.NewType);
Daniel Sanders9ade5592018-01-29 17:37:29 +000065 case Lower:
Nicola Zaghend34e60c2018-05-14 12:53:11 +000066 LLVM_DEBUG(dbgs() << ".. Lower\n");
Daniel Sanders262ed0e2018-01-24 17:17:46 +000067 return lower(MI, Step.TypeIdx, Step.NewType);
Daniel Sanders9ade5592018-01-29 17:37:29 +000068 case FewerElements:
Nicola Zaghend34e60c2018-05-14 12:53:11 +000069 LLVM_DEBUG(dbgs() << ".. Reduce number of elements\n");
Daniel Sanders262ed0e2018-01-24 17:17:46 +000070 return fewerElementsVector(MI, Step.TypeIdx, Step.NewType);
Daniel Sanders9ade5592018-01-29 17:37:29 +000071 case Custom:
Nicola Zaghend34e60c2018-05-14 12:53:11 +000072 LLVM_DEBUG(dbgs() << ".. Custom legalization\n");
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +000073 return LI.legalizeCustom(MI, MRI, MIRBuilder, Observer) ? Legalized
74 : UnableToLegalize;
Tim Northover33b07d62016-07-22 20:03:43 +000075 default:
Nicola Zaghend34e60c2018-05-14 12:53:11 +000076 LLVM_DEBUG(dbgs() << ".. Unable to legalize\n");
Tim Northover33b07d62016-07-22 20:03:43 +000077 return UnableToLegalize;
78 }
79}
80
Tim Northover69fa84a2016-10-14 22:18:18 +000081void LegalizerHelper::extractParts(unsigned Reg, LLT Ty, int NumParts,
82 SmallVectorImpl<unsigned> &VRegs) {
Tim Northoverbf017292017-03-03 22:46:09 +000083 for (int i = 0; i < NumParts; ++i)
Tim Northover0f140c72016-09-09 11:46:34 +000084 VRegs.push_back(MRI.createGenericVirtualRegister(Ty));
Tim Northoverbf017292017-03-03 22:46:09 +000085 MIRBuilder.buildUnmerge(VRegs, Reg);
Tim Northover33b07d62016-07-22 20:03:43 +000086}
87
Tim Northovere0418412017-02-08 23:23:39 +000088static RTLIB::Libcall getRTLibDesc(unsigned Opcode, unsigned Size) {
89 switch (Opcode) {
Diana Picuse97822e2017-04-24 07:22:31 +000090 case TargetOpcode::G_SDIV:
91 assert(Size == 32 && "Unsupported size");
92 return RTLIB::SDIV_I32;
93 case TargetOpcode::G_UDIV:
94 assert(Size == 32 && "Unsupported size");
95 return RTLIB::UDIV_I32;
Diana Picus02e11012017-06-15 10:53:31 +000096 case TargetOpcode::G_SREM:
97 assert(Size == 32 && "Unsupported size");
98 return RTLIB::SREM_I32;
99 case TargetOpcode::G_UREM:
100 assert(Size == 32 && "Unsupported size");
101 return RTLIB::UREM_I32;
Diana Picus0528e2c2018-11-26 11:07:02 +0000102 case TargetOpcode::G_CTLZ_ZERO_UNDEF:
103 assert(Size == 32 && "Unsupported size");
104 return RTLIB::CTLZ_I32;
Diana Picus1314a282017-04-11 10:52:34 +0000105 case TargetOpcode::G_FADD:
106 assert((Size == 32 || Size == 64) && "Unsupported size");
107 return Size == 64 ? RTLIB::ADD_F64 : RTLIB::ADD_F32;
Javed Absar5cde1cc2017-10-30 13:51:56 +0000108 case TargetOpcode::G_FSUB:
109 assert((Size == 32 || Size == 64) && "Unsupported size");
110 return Size == 64 ? RTLIB::SUB_F64 : RTLIB::SUB_F32;
Diana Picus9faa09b2017-11-23 12:44:20 +0000111 case TargetOpcode::G_FMUL:
112 assert((Size == 32 || Size == 64) && "Unsupported size");
113 return Size == 64 ? RTLIB::MUL_F64 : RTLIB::MUL_F32;
Diana Picusc01f7f12017-11-23 13:26:07 +0000114 case TargetOpcode::G_FDIV:
115 assert((Size == 32 || Size == 64) && "Unsupported size");
116 return Size == 64 ? RTLIB::DIV_F64 : RTLIB::DIV_F32;
Tim Northovere0418412017-02-08 23:23:39 +0000117 case TargetOpcode::G_FREM:
118 return Size == 64 ? RTLIB::REM_F64 : RTLIB::REM_F32;
119 case TargetOpcode::G_FPOW:
120 return Size == 64 ? RTLIB::POW_F64 : RTLIB::POW_F32;
Diana Picuse74243d2018-01-12 11:30:45 +0000121 case TargetOpcode::G_FMA:
122 assert((Size == 32 || Size == 64) && "Unsupported size");
123 return Size == 64 ? RTLIB::FMA_F64 : RTLIB::FMA_F32;
Tim Northovere0418412017-02-08 23:23:39 +0000124 }
125 llvm_unreachable("Unknown libcall function");
126}
127
Diana Picusfc1675e2017-07-05 12:57:24 +0000128LegalizerHelper::LegalizeResult
129llvm::createLibcall(MachineIRBuilder &MIRBuilder, RTLIB::Libcall Libcall,
130 const CallLowering::ArgInfo &Result,
131 ArrayRef<CallLowering::ArgInfo> Args) {
Diana Picuse97822e2017-04-24 07:22:31 +0000132 auto &CLI = *MIRBuilder.getMF().getSubtarget().getCallLowering();
133 auto &TLI = *MIRBuilder.getMF().getSubtarget().getTargetLowering();
Diana Picuse97822e2017-04-24 07:22:31 +0000134 const char *Name = TLI.getLibcallName(Libcall);
Diana Picusd0104ea2017-07-06 09:09:33 +0000135
Diana Picuse97822e2017-04-24 07:22:31 +0000136 MIRBuilder.getMF().getFrameInfo().setHasCalls(true);
Diana Picus02e11012017-06-15 10:53:31 +0000137 if (!CLI.lowerCall(MIRBuilder, TLI.getLibcallCallingConv(Libcall),
138 MachineOperand::CreateES(Name), Result, Args))
139 return LegalizerHelper::UnableToLegalize;
Diana Picusd0104ea2017-07-06 09:09:33 +0000140
Diana Picuse97822e2017-04-24 07:22:31 +0000141 return LegalizerHelper::Legalized;
142}
143
Diana Picus65ed3642018-01-17 13:34:10 +0000144// Useful for libcalls where all operands have the same type.
Diana Picus02e11012017-06-15 10:53:31 +0000145static LegalizerHelper::LegalizeResult
146simpleLibcall(MachineInstr &MI, MachineIRBuilder &MIRBuilder, unsigned Size,
147 Type *OpType) {
148 auto Libcall = getRTLibDesc(MI.getOpcode(), Size);
Diana Picuse74243d2018-01-12 11:30:45 +0000149
150 SmallVector<CallLowering::ArgInfo, 3> Args;
151 for (unsigned i = 1; i < MI.getNumOperands(); i++)
152 Args.push_back({MI.getOperand(i).getReg(), OpType});
Diana Picusfc1675e2017-07-05 12:57:24 +0000153 return createLibcall(MIRBuilder, Libcall, {MI.getOperand(0).getReg(), OpType},
Diana Picuse74243d2018-01-12 11:30:45 +0000154 Args);
Diana Picus02e11012017-06-15 10:53:31 +0000155}
156
Diana Picus65ed3642018-01-17 13:34:10 +0000157static RTLIB::Libcall getConvRTLibDesc(unsigned Opcode, Type *ToType,
158 Type *FromType) {
159 auto ToMVT = MVT::getVT(ToType);
160 auto FromMVT = MVT::getVT(FromType);
161
162 switch (Opcode) {
163 case TargetOpcode::G_FPEXT:
164 return RTLIB::getFPEXT(FromMVT, ToMVT);
165 case TargetOpcode::G_FPTRUNC:
166 return RTLIB::getFPROUND(FromMVT, ToMVT);
Diana Picus4ed0ee72018-01-30 07:54:52 +0000167 case TargetOpcode::G_FPTOSI:
168 return RTLIB::getFPTOSINT(FromMVT, ToMVT);
169 case TargetOpcode::G_FPTOUI:
170 return RTLIB::getFPTOUINT(FromMVT, ToMVT);
Diana Picus517531e2018-01-30 09:15:17 +0000171 case TargetOpcode::G_SITOFP:
172 return RTLIB::getSINTTOFP(FromMVT, ToMVT);
173 case TargetOpcode::G_UITOFP:
174 return RTLIB::getUINTTOFP(FromMVT, ToMVT);
Diana Picus65ed3642018-01-17 13:34:10 +0000175 }
176 llvm_unreachable("Unsupported libcall function");
177}
178
179static LegalizerHelper::LegalizeResult
180conversionLibcall(MachineInstr &MI, MachineIRBuilder &MIRBuilder, Type *ToType,
181 Type *FromType) {
182 RTLIB::Libcall Libcall = getConvRTLibDesc(MI.getOpcode(), ToType, FromType);
183 return createLibcall(MIRBuilder, Libcall, {MI.getOperand(0).getReg(), ToType},
184 {{MI.getOperand(1).getReg(), FromType}});
185}
186
Tim Northover69fa84a2016-10-14 22:18:18 +0000187LegalizerHelper::LegalizeResult
188LegalizerHelper::libcall(MachineInstr &MI) {
Diana Picus02e11012017-06-15 10:53:31 +0000189 LLT LLTy = MRI.getType(MI.getOperand(0).getReg());
190 unsigned Size = LLTy.getSizeInBits();
Matthias Braunf1caa282017-12-15 22:22:58 +0000191 auto &Ctx = MIRBuilder.getMF().getFunction().getContext();
Tim Northoveredb3c8c2016-08-29 19:07:16 +0000192
Diana Picusfc1675e2017-07-05 12:57:24 +0000193 MIRBuilder.setInstr(MI);
194
Tim Northoveredb3c8c2016-08-29 19:07:16 +0000195 switch (MI.getOpcode()) {
196 default:
197 return UnableToLegalize;
Diana Picuse97822e2017-04-24 07:22:31 +0000198 case TargetOpcode::G_SDIV:
Diana Picus02e11012017-06-15 10:53:31 +0000199 case TargetOpcode::G_UDIV:
200 case TargetOpcode::G_SREM:
Diana Picus0528e2c2018-11-26 11:07:02 +0000201 case TargetOpcode::G_UREM:
202 case TargetOpcode::G_CTLZ_ZERO_UNDEF: {
Diana Picus02e11012017-06-15 10:53:31 +0000203 Type *HLTy = Type::getInt32Ty(Ctx);
Diana Picusfc1675e2017-07-05 12:57:24 +0000204 auto Status = simpleLibcall(MI, MIRBuilder, Size, HLTy);
205 if (Status != Legalized)
206 return Status;
207 break;
Diana Picuse97822e2017-04-24 07:22:31 +0000208 }
Diana Picus1314a282017-04-11 10:52:34 +0000209 case TargetOpcode::G_FADD:
Javed Absar5cde1cc2017-10-30 13:51:56 +0000210 case TargetOpcode::G_FSUB:
Diana Picus9faa09b2017-11-23 12:44:20 +0000211 case TargetOpcode::G_FMUL:
Diana Picusc01f7f12017-11-23 13:26:07 +0000212 case TargetOpcode::G_FDIV:
Diana Picuse74243d2018-01-12 11:30:45 +0000213 case TargetOpcode::G_FMA:
Tim Northovere0418412017-02-08 23:23:39 +0000214 case TargetOpcode::G_FPOW:
Tim Northoveredb3c8c2016-08-29 19:07:16 +0000215 case TargetOpcode::G_FREM: {
Diana Picus02e11012017-06-15 10:53:31 +0000216 Type *HLTy = Size == 64 ? Type::getDoubleTy(Ctx) : Type::getFloatTy(Ctx);
Diana Picusfc1675e2017-07-05 12:57:24 +0000217 auto Status = simpleLibcall(MI, MIRBuilder, Size, HLTy);
218 if (Status != Legalized)
219 return Status;
220 break;
Tim Northoveredb3c8c2016-08-29 19:07:16 +0000221 }
Diana Picus65ed3642018-01-17 13:34:10 +0000222 case TargetOpcode::G_FPEXT: {
223 // FIXME: Support other floating point types (half, fp128 etc)
224 unsigned FromSize = MRI.getType(MI.getOperand(1).getReg()).getSizeInBits();
225 unsigned ToSize = MRI.getType(MI.getOperand(0).getReg()).getSizeInBits();
226 if (ToSize != 64 || FromSize != 32)
227 return UnableToLegalize;
228 LegalizeResult Status = conversionLibcall(
229 MI, MIRBuilder, Type::getDoubleTy(Ctx), Type::getFloatTy(Ctx));
230 if (Status != Legalized)
231 return Status;
232 break;
233 }
234 case TargetOpcode::G_FPTRUNC: {
235 // FIXME: Support other floating point types (half, fp128 etc)
236 unsigned FromSize = MRI.getType(MI.getOperand(1).getReg()).getSizeInBits();
237 unsigned ToSize = MRI.getType(MI.getOperand(0).getReg()).getSizeInBits();
238 if (ToSize != 32 || FromSize != 64)
239 return UnableToLegalize;
240 LegalizeResult Status = conversionLibcall(
241 MI, MIRBuilder, Type::getFloatTy(Ctx), Type::getDoubleTy(Ctx));
242 if (Status != Legalized)
243 return Status;
244 break;
245 }
Diana Picus4ed0ee72018-01-30 07:54:52 +0000246 case TargetOpcode::G_FPTOSI:
247 case TargetOpcode::G_FPTOUI: {
248 // FIXME: Support other types
249 unsigned FromSize = MRI.getType(MI.getOperand(1).getReg()).getSizeInBits();
250 unsigned ToSize = MRI.getType(MI.getOperand(0).getReg()).getSizeInBits();
251 if (ToSize != 32 || (FromSize != 32 && FromSize != 64))
252 return UnableToLegalize;
253 LegalizeResult Status = conversionLibcall(
254 MI, MIRBuilder, Type::getInt32Ty(Ctx),
255 FromSize == 64 ? Type::getDoubleTy(Ctx) : Type::getFloatTy(Ctx));
256 if (Status != Legalized)
257 return Status;
258 break;
259 }
Diana Picus517531e2018-01-30 09:15:17 +0000260 case TargetOpcode::G_SITOFP:
261 case TargetOpcode::G_UITOFP: {
262 // FIXME: Support other types
263 unsigned FromSize = MRI.getType(MI.getOperand(1).getReg()).getSizeInBits();
264 unsigned ToSize = MRI.getType(MI.getOperand(0).getReg()).getSizeInBits();
265 if (FromSize != 32 || (ToSize != 32 && ToSize != 64))
266 return UnableToLegalize;
267 LegalizeResult Status = conversionLibcall(
268 MI, MIRBuilder,
269 ToSize == 64 ? Type::getDoubleTy(Ctx) : Type::getFloatTy(Ctx),
270 Type::getInt32Ty(Ctx));
271 if (Status != Legalized)
272 return Status;
273 break;
274 }
Tim Northoveredb3c8c2016-08-29 19:07:16 +0000275 }
Diana Picusfc1675e2017-07-05 12:57:24 +0000276
277 MI.eraseFromParent();
278 return Legalized;
Tim Northoveredb3c8c2016-08-29 19:07:16 +0000279}
280
Tim Northover69fa84a2016-10-14 22:18:18 +0000281LegalizerHelper::LegalizeResult LegalizerHelper::narrowScalar(MachineInstr &MI,
282 unsigned TypeIdx,
283 LLT NarrowTy) {
Quentin Colombet5e60bcd2016-08-27 02:38:21 +0000284 // FIXME: Don't know how to handle secondary types yet.
Tim Northoverc2d5e6d2017-06-26 20:34:13 +0000285 if (TypeIdx != 0 && MI.getOpcode() != TargetOpcode::G_EXTRACT)
Quentin Colombet5e60bcd2016-08-27 02:38:21 +0000286 return UnableToLegalize;
Justin Bognerfde01042017-01-18 17:29:54 +0000287
288 MIRBuilder.setInstr(MI);
289
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000290 uint64_t SizeOp0 = MRI.getType(MI.getOperand(0).getReg()).getSizeInBits();
291 uint64_t NarrowSize = NarrowTy.getSizeInBits();
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000292
Tim Northover9656f142016-08-04 20:54:13 +0000293 switch (MI.getOpcode()) {
294 default:
295 return UnableToLegalize;
Tim Northoverff5e7e12017-06-30 20:27:36 +0000296 case TargetOpcode::G_IMPLICIT_DEF: {
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000297 // FIXME: add support for when SizeOp0 isn't an exact multiple of
298 // NarrowSize.
299 if (SizeOp0 % NarrowSize != 0)
300 return UnableToLegalize;
301 int NumParts = SizeOp0 / NarrowSize;
Tim Northoverff5e7e12017-06-30 20:27:36 +0000302
303 SmallVector<unsigned, 2> DstRegs;
Volkan Keles02bb1742018-02-14 19:58:36 +0000304 for (int i = 0; i < NumParts; ++i)
305 DstRegs.push_back(
306 MIRBuilder.buildUndef(NarrowTy)->getOperand(0).getReg());
Amara Emerson5ec14602018-12-10 18:44:58 +0000307
308 unsigned DstReg = MI.getOperand(0).getReg();
309 if(MRI.getType(DstReg).isVector())
310 MIRBuilder.buildBuildVector(DstReg, DstRegs);
311 else
312 MIRBuilder.buildMerge(DstReg, DstRegs);
Tim Northoverff5e7e12017-06-30 20:27:36 +0000313 MI.eraseFromParent();
314 return Legalized;
315 }
Tim Northover9656f142016-08-04 20:54:13 +0000316 case TargetOpcode::G_ADD: {
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000317 // FIXME: add support for when SizeOp0 isn't an exact multiple of
318 // NarrowSize.
319 if (SizeOp0 % NarrowSize != 0)
320 return UnableToLegalize;
Tim Northover9656f142016-08-04 20:54:13 +0000321 // Expand in terms of carry-setting/consuming G_ADDE instructions.
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000322 int NumParts = SizeOp0 / NarrowTy.getSizeInBits();
Tim Northover9656f142016-08-04 20:54:13 +0000323
Tim Northoverb18ea162016-09-20 15:20:36 +0000324 SmallVector<unsigned, 2> Src1Regs, Src2Regs, DstRegs;
Tim Northover9656f142016-08-04 20:54:13 +0000325 extractParts(MI.getOperand(1).getReg(), NarrowTy, NumParts, Src1Regs);
326 extractParts(MI.getOperand(2).getReg(), NarrowTy, NumParts, Src2Regs);
327
Tim Northover0f140c72016-09-09 11:46:34 +0000328 unsigned CarryIn = MRI.createGenericVirtualRegister(LLT::scalar(1));
329 MIRBuilder.buildConstant(CarryIn, 0);
Tim Northover9656f142016-08-04 20:54:13 +0000330
331 for (int i = 0; i < NumParts; ++i) {
Tim Northover0f140c72016-09-09 11:46:34 +0000332 unsigned DstReg = MRI.createGenericVirtualRegister(NarrowTy);
333 unsigned CarryOut = MRI.createGenericVirtualRegister(LLT::scalar(1));
Tim Northover9656f142016-08-04 20:54:13 +0000334
Tim Northover0f140c72016-09-09 11:46:34 +0000335 MIRBuilder.buildUAdde(DstReg, CarryOut, Src1Regs[i],
Tim Northover91c81732016-08-19 17:17:06 +0000336 Src2Regs[i], CarryIn);
Tim Northover9656f142016-08-04 20:54:13 +0000337
338 DstRegs.push_back(DstReg);
339 CarryIn = CarryOut;
340 }
Tim Northover0f140c72016-09-09 11:46:34 +0000341 unsigned DstReg = MI.getOperand(0).getReg();
Amara Emerson5ec14602018-12-10 18:44:58 +0000342 if(MRI.getType(DstReg).isVector())
343 MIRBuilder.buildBuildVector(DstReg, DstRegs);
344 else
345 MIRBuilder.buildMerge(DstReg, DstRegs);
Tim Northover9656f142016-08-04 20:54:13 +0000346 MI.eraseFromParent();
347 return Legalized;
348 }
Tim Northoverc2d5e6d2017-06-26 20:34:13 +0000349 case TargetOpcode::G_EXTRACT: {
350 if (TypeIdx != 1)
351 return UnableToLegalize;
352
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000353 int64_t SizeOp1 = MRI.getType(MI.getOperand(1).getReg()).getSizeInBits();
354 // FIXME: add support for when SizeOp1 isn't an exact multiple of
355 // NarrowSize.
356 if (SizeOp1 % NarrowSize != 0)
357 return UnableToLegalize;
358 int NumParts = SizeOp1 / NarrowSize;
Tim Northoverc2d5e6d2017-06-26 20:34:13 +0000359
360 SmallVector<unsigned, 2> SrcRegs, DstRegs;
361 SmallVector<uint64_t, 2> Indexes;
362 extractParts(MI.getOperand(1).getReg(), NarrowTy, NumParts, SrcRegs);
363
364 unsigned OpReg = MI.getOperand(0).getReg();
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000365 uint64_t OpStart = MI.getOperand(2).getImm();
366 uint64_t OpSize = MRI.getType(OpReg).getSizeInBits();
Tim Northoverc2d5e6d2017-06-26 20:34:13 +0000367 for (int i = 0; i < NumParts; ++i) {
368 unsigned SrcStart = i * NarrowSize;
369
370 if (SrcStart + NarrowSize <= OpStart || SrcStart >= OpStart + OpSize) {
371 // No part of the extract uses this subregister, ignore it.
372 continue;
373 } else if (SrcStart == OpStart && NarrowTy == MRI.getType(OpReg)) {
374 // The entire subregister is extracted, forward the value.
375 DstRegs.push_back(SrcRegs[i]);
376 continue;
377 }
378
379 // OpSegStart is where this destination segment would start in OpReg if it
380 // extended infinitely in both directions.
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000381 int64_t ExtractOffset;
382 uint64_t SegSize;
Tim Northoverc2d5e6d2017-06-26 20:34:13 +0000383 if (OpStart < SrcStart) {
384 ExtractOffset = 0;
385 SegSize = std::min(NarrowSize, OpStart + OpSize - SrcStart);
386 } else {
387 ExtractOffset = OpStart - SrcStart;
388 SegSize = std::min(SrcStart + NarrowSize - OpStart, OpSize);
389 }
390
391 unsigned SegReg = SrcRegs[i];
392 if (ExtractOffset != 0 || SegSize != NarrowSize) {
393 // A genuine extract is needed.
394 SegReg = MRI.createGenericVirtualRegister(LLT::scalar(SegSize));
395 MIRBuilder.buildExtract(SegReg, SrcRegs[i], ExtractOffset);
396 }
397
398 DstRegs.push_back(SegReg);
399 }
400
Amara Emerson5ec14602018-12-10 18:44:58 +0000401 unsigned DstReg = MI.getOperand(0).getReg();
402 if(MRI.getType(DstReg).isVector())
403 MIRBuilder.buildBuildVector(DstReg, DstRegs);
404 else
405 MIRBuilder.buildMerge(DstReg, DstRegs);
Tim Northoverc2d5e6d2017-06-26 20:34:13 +0000406 MI.eraseFromParent();
407 return Legalized;
408 }
Tim Northover0e6afbd2017-02-06 21:56:47 +0000409 case TargetOpcode::G_INSERT: {
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000410 // FIXME: add support for when SizeOp0 isn't an exact multiple of
411 // NarrowSize.
412 if (SizeOp0 % NarrowSize != 0)
Tim Northover0e6afbd2017-02-06 21:56:47 +0000413 return UnableToLegalize;
414
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000415 int NumParts = SizeOp0 / NarrowSize;
Tim Northover0e6afbd2017-02-06 21:56:47 +0000416
417 SmallVector<unsigned, 2> SrcRegs, DstRegs;
418 SmallVector<uint64_t, 2> Indexes;
419 extractParts(MI.getOperand(1).getReg(), NarrowTy, NumParts, SrcRegs);
420
Tim Northover75e0b912017-03-06 18:23:04 +0000421 unsigned OpReg = MI.getOperand(2).getReg();
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000422 uint64_t OpStart = MI.getOperand(3).getImm();
423 uint64_t OpSize = MRI.getType(OpReg).getSizeInBits();
Tim Northover0e6afbd2017-02-06 21:56:47 +0000424 for (int i = 0; i < NumParts; ++i) {
425 unsigned DstStart = i * NarrowSize;
Tim Northover0e6afbd2017-02-06 21:56:47 +0000426
Tim Northover75e0b912017-03-06 18:23:04 +0000427 if (DstStart + NarrowSize <= OpStart || DstStart >= OpStart + OpSize) {
Tim Northover0e6afbd2017-02-06 21:56:47 +0000428 // No part of the insert affects this subregister, forward the original.
429 DstRegs.push_back(SrcRegs[i]);
430 continue;
Tim Northover75e0b912017-03-06 18:23:04 +0000431 } else if (DstStart == OpStart && NarrowTy == MRI.getType(OpReg)) {
Tim Northover0e6afbd2017-02-06 21:56:47 +0000432 // The entire subregister is defined by this insert, forward the new
433 // value.
Tim Northover75e0b912017-03-06 18:23:04 +0000434 DstRegs.push_back(OpReg);
Tim Northover0e6afbd2017-02-06 21:56:47 +0000435 continue;
436 }
437
Tim Northover2eb18d32017-03-07 21:24:33 +0000438 // OpSegStart is where this destination segment would start in OpReg if it
439 // extended infinitely in both directions.
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000440 int64_t ExtractOffset, InsertOffset;
441 uint64_t SegSize;
Tim Northover2eb18d32017-03-07 21:24:33 +0000442 if (OpStart < DstStart) {
443 InsertOffset = 0;
444 ExtractOffset = DstStart - OpStart;
445 SegSize = std::min(NarrowSize, OpStart + OpSize - DstStart);
446 } else {
447 InsertOffset = OpStart - DstStart;
448 ExtractOffset = 0;
449 SegSize =
450 std::min(NarrowSize - InsertOffset, OpStart + OpSize - DstStart);
451 }
452
453 unsigned SegReg = OpReg;
454 if (ExtractOffset != 0 || SegSize != OpSize) {
Tim Northover75e0b912017-03-06 18:23:04 +0000455 // A genuine extract is needed.
Tim Northover2eb18d32017-03-07 21:24:33 +0000456 SegReg = MRI.createGenericVirtualRegister(LLT::scalar(SegSize));
457 MIRBuilder.buildExtract(SegReg, OpReg, ExtractOffset);
Tim Northover0e6afbd2017-02-06 21:56:47 +0000458 }
459
Tim Northover75e0b912017-03-06 18:23:04 +0000460 unsigned DstReg = MRI.createGenericVirtualRegister(NarrowTy);
Tim Northover2eb18d32017-03-07 21:24:33 +0000461 MIRBuilder.buildInsert(DstReg, SrcRegs[i], SegReg, InsertOffset);
Tim Northover0e6afbd2017-02-06 21:56:47 +0000462 DstRegs.push_back(DstReg);
463 }
464
465 assert(DstRegs.size() == (unsigned)NumParts && "not all parts covered");
Amara Emerson5ec14602018-12-10 18:44:58 +0000466 unsigned DstReg = MI.getOperand(0).getReg();
467 if(MRI.getType(DstReg).isVector())
468 MIRBuilder.buildBuildVector(DstReg, DstRegs);
469 else
470 MIRBuilder.buildMerge(DstReg, DstRegs);
Tim Northover0e6afbd2017-02-06 21:56:47 +0000471 MI.eraseFromParent();
472 return Legalized;
473 }
Justin Bognerd09c3ce2017-01-19 01:05:48 +0000474 case TargetOpcode::G_LOAD: {
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000475 // FIXME: add support for when SizeOp0 isn't an exact multiple of
476 // NarrowSize.
477 if (SizeOp0 % NarrowSize != 0)
478 return UnableToLegalize;
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000479
480 const auto &MMO = **MI.memoperands_begin();
481 // This implementation doesn't work for atomics. Give up instead of doing
482 // something invalid.
483 if (MMO.getOrdering() != AtomicOrdering::NotAtomic ||
484 MMO.getFailureOrdering() != AtomicOrdering::NotAtomic)
485 return UnableToLegalize;
486
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000487 int NumParts = SizeOp0 / NarrowSize;
Daniel Sanders4e523662017-06-13 23:42:32 +0000488 LLT OffsetTy = LLT::scalar(
489 MRI.getType(MI.getOperand(1).getReg()).getScalarSizeInBits());
Justin Bognerd09c3ce2017-01-19 01:05:48 +0000490
491 SmallVector<unsigned, 2> DstRegs;
Justin Bognerd09c3ce2017-01-19 01:05:48 +0000492 for (int i = 0; i < NumParts; ++i) {
493 unsigned DstReg = MRI.createGenericVirtualRegister(NarrowTy);
Daniel Sanders4e523662017-06-13 23:42:32 +0000494 unsigned SrcReg = 0;
495 unsigned Adjustment = i * NarrowSize / 8;
Volkan Keles60c6aff2018-10-25 17:52:19 +0000496 unsigned Alignment = MinAlign(MMO.getAlignment(), Adjustment);
Justin Bognerd09c3ce2017-01-19 01:05:48 +0000497
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000498 MachineMemOperand *SplitMMO = MIRBuilder.getMF().getMachineMemOperand(
499 MMO.getPointerInfo().getWithOffset(Adjustment), MMO.getFlags(),
Volkan Keles60c6aff2018-10-25 17:52:19 +0000500 NarrowSize / 8, Alignment, MMO.getAAInfo(), MMO.getRanges(),
501 MMO.getSyncScopeID(), MMO.getOrdering(), MMO.getFailureOrdering());
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000502
Daniel Sanders4e523662017-06-13 23:42:32 +0000503 MIRBuilder.materializeGEP(SrcReg, MI.getOperand(1).getReg(), OffsetTy,
504 Adjustment);
505
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000506 MIRBuilder.buildLoad(DstReg, SrcReg, *SplitMMO);
Justin Bognerd09c3ce2017-01-19 01:05:48 +0000507
508 DstRegs.push_back(DstReg);
Justin Bognerd09c3ce2017-01-19 01:05:48 +0000509 }
510 unsigned DstReg = MI.getOperand(0).getReg();
Amara Emerson5ec14602018-12-10 18:44:58 +0000511 if(MRI.getType(DstReg).isVector())
512 MIRBuilder.buildBuildVector(DstReg, DstRegs);
513 else
514 MIRBuilder.buildMerge(DstReg, DstRegs);
Justin Bognerd09c3ce2017-01-19 01:05:48 +0000515 MI.eraseFromParent();
516 return Legalized;
517 }
Justin Bognerfde01042017-01-18 17:29:54 +0000518 case TargetOpcode::G_STORE: {
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000519 // FIXME: add support for when SizeOp0 isn't an exact multiple of
520 // NarrowSize.
521 if (SizeOp0 % NarrowSize != 0)
522 return UnableToLegalize;
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000523
524 const auto &MMO = **MI.memoperands_begin();
525 // This implementation doesn't work for atomics. Give up instead of doing
526 // something invalid.
527 if (MMO.getOrdering() != AtomicOrdering::NotAtomic ||
528 MMO.getFailureOrdering() != AtomicOrdering::NotAtomic)
529 return UnableToLegalize;
530
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000531 int NumParts = SizeOp0 / NarrowSize;
Daniel Sanders4e523662017-06-13 23:42:32 +0000532 LLT OffsetTy = LLT::scalar(
533 MRI.getType(MI.getOperand(1).getReg()).getScalarSizeInBits());
Justin Bognerfde01042017-01-18 17:29:54 +0000534
535 SmallVector<unsigned, 2> SrcRegs;
536 extractParts(MI.getOperand(0).getReg(), NarrowTy, NumParts, SrcRegs);
537
538 for (int i = 0; i < NumParts; ++i) {
Daniel Sanders4e523662017-06-13 23:42:32 +0000539 unsigned DstReg = 0;
540 unsigned Adjustment = i * NarrowSize / 8;
Volkan Keles60c6aff2018-10-25 17:52:19 +0000541 unsigned Alignment = MinAlign(MMO.getAlignment(), Adjustment);
Daniel Sanders4e523662017-06-13 23:42:32 +0000542
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000543 MachineMemOperand *SplitMMO = MIRBuilder.getMF().getMachineMemOperand(
544 MMO.getPointerInfo().getWithOffset(Adjustment), MMO.getFlags(),
Volkan Keles60c6aff2018-10-25 17:52:19 +0000545 NarrowSize / 8, Alignment, MMO.getAAInfo(), MMO.getRanges(),
546 MMO.getSyncScopeID(), MMO.getOrdering(), MMO.getFailureOrdering());
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000547
Daniel Sanders4e523662017-06-13 23:42:32 +0000548 MIRBuilder.materializeGEP(DstReg, MI.getOperand(1).getReg(), OffsetTy,
549 Adjustment);
550
Daniel Sanders27fe8a52018-04-27 19:48:53 +0000551 MIRBuilder.buildStore(SrcRegs[i], DstReg, *SplitMMO);
Justin Bognerfde01042017-01-18 17:29:54 +0000552 }
553 MI.eraseFromParent();
554 return Legalized;
555 }
Igor Breger29537882017-04-07 14:41:59 +0000556 case TargetOpcode::G_CONSTANT: {
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000557 // FIXME: add support for when SizeOp0 isn't an exact multiple of
558 // NarrowSize.
559 if (SizeOp0 % NarrowSize != 0)
560 return UnableToLegalize;
561 int NumParts = SizeOp0 / NarrowSize;
Igor Breger29537882017-04-07 14:41:59 +0000562 const APInt &Cst = MI.getOperand(1).getCImm()->getValue();
Matthias Braunf1caa282017-12-15 22:22:58 +0000563 LLVMContext &Ctx = MIRBuilder.getMF().getFunction().getContext();
Igor Breger29537882017-04-07 14:41:59 +0000564
565 SmallVector<unsigned, 2> DstRegs;
566 for (int i = 0; i < NumParts; ++i) {
567 unsigned DstReg = MRI.createGenericVirtualRegister(NarrowTy);
568 ConstantInt *CI =
569 ConstantInt::get(Ctx, Cst.lshr(NarrowSize * i).trunc(NarrowSize));
570 MIRBuilder.buildConstant(DstReg, *CI);
571 DstRegs.push_back(DstReg);
572 }
573 unsigned DstReg = MI.getOperand(0).getReg();
Amara Emerson5ec14602018-12-10 18:44:58 +0000574 if(MRI.getType(DstReg).isVector())
575 MIRBuilder.buildBuildVector(DstReg, DstRegs);
576 else
577 MIRBuilder.buildMerge(DstReg, DstRegs);
Igor Breger29537882017-04-07 14:41:59 +0000578 MI.eraseFromParent();
579 return Legalized;
580 }
Quentin Colombetc2f3cea2017-10-03 04:53:56 +0000581 case TargetOpcode::G_OR: {
582 // Legalize bitwise operation:
583 // A = BinOp<Ty> B, C
584 // into:
585 // B1, ..., BN = G_UNMERGE_VALUES B
586 // C1, ..., CN = G_UNMERGE_VALUES C
587 // A1 = BinOp<Ty/N> B1, C2
588 // ...
589 // AN = BinOp<Ty/N> BN, CN
590 // A = G_MERGE_VALUES A1, ..., AN
Kristof Beylsaf9814a2017-11-07 10:34:34 +0000591
592 // FIXME: add support for when SizeOp0 isn't an exact multiple of
593 // NarrowSize.
594 if (SizeOp0 % NarrowSize != 0)
595 return UnableToLegalize;
596 int NumParts = SizeOp0 / NarrowSize;
Quentin Colombetc2f3cea2017-10-03 04:53:56 +0000597
598 // List the registers where the destination will be scattered.
599 SmallVector<unsigned, 2> DstRegs;
600 // List the registers where the first argument will be split.
601 SmallVector<unsigned, 2> SrcsReg1;
602 // List the registers where the second argument will be split.
603 SmallVector<unsigned, 2> SrcsReg2;
604 // Create all the temporary registers.
605 for (int i = 0; i < NumParts; ++i) {
606 unsigned DstReg = MRI.createGenericVirtualRegister(NarrowTy);
607 unsigned SrcReg1 = MRI.createGenericVirtualRegister(NarrowTy);
608 unsigned SrcReg2 = MRI.createGenericVirtualRegister(NarrowTy);
609
610 DstRegs.push_back(DstReg);
611 SrcsReg1.push_back(SrcReg1);
612 SrcsReg2.push_back(SrcReg2);
613 }
614 // Explode the big arguments into smaller chunks.
615 MIRBuilder.buildUnmerge(SrcsReg1, MI.getOperand(1).getReg());
616 MIRBuilder.buildUnmerge(SrcsReg2, MI.getOperand(2).getReg());
617
618 // Do the operation on each small part.
619 for (int i = 0; i < NumParts; ++i)
620 MIRBuilder.buildOr(DstRegs[i], SrcsReg1[i], SrcsReg2[i]);
621
622 // Gather the destination registers into the final destination.
623 unsigned DstReg = MI.getOperand(0).getReg();
Amara Emerson5ec14602018-12-10 18:44:58 +0000624 if(MRI.getType(DstReg).isVector())
625 MIRBuilder.buildBuildVector(DstReg, DstRegs);
626 else
627 MIRBuilder.buildMerge(DstReg, DstRegs);
Quentin Colombetc2f3cea2017-10-03 04:53:56 +0000628 MI.eraseFromParent();
629 return Legalized;
630 }
Tim Northover9656f142016-08-04 20:54:13 +0000631 }
Tim Northover33b07d62016-07-22 20:03:43 +0000632}
633
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000634void LegalizerHelper::widenScalarSrc(MachineInstr &MI, LLT WideTy,
635 unsigned OpIdx, unsigned ExtOpcode) {
636 MachineOperand &MO = MI.getOperand(OpIdx);
Aditya Nandakumarcef44a22018-12-11 00:48:50 +0000637 auto ExtB = MIRBuilder.buildInstr(ExtOpcode, {WideTy}, {MO.getReg()});
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000638 MO.setReg(ExtB->getOperand(0).getReg());
639}
640
641void LegalizerHelper::widenScalarDst(MachineInstr &MI, LLT WideTy,
642 unsigned OpIdx, unsigned TruncOpcode) {
643 MachineOperand &MO = MI.getOperand(OpIdx);
644 unsigned DstExt = MRI.createGenericVirtualRegister(WideTy);
645 MIRBuilder.setInsertPt(MIRBuilder.getMBB(), ++MIRBuilder.getInsertPt());
Aditya Nandakumarcef44a22018-12-11 00:48:50 +0000646 MIRBuilder.buildInstr(TruncOpcode, {MO.getReg()}, {DstExt});
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000647 MO.setReg(DstExt);
648}
649
Tim Northover69fa84a2016-10-14 22:18:18 +0000650LegalizerHelper::LegalizeResult
651LegalizerHelper::widenScalar(MachineInstr &MI, unsigned TypeIdx, LLT WideTy) {
Tim Northover3c73e362016-08-23 18:20:09 +0000652 MIRBuilder.setInstr(MI);
653
Tim Northover32335812016-08-04 18:35:11 +0000654 switch (MI.getOpcode()) {
655 default:
656 return UnableToLegalize;
Aditya Nandakumar6d47a412018-08-29 03:17:08 +0000657 case TargetOpcode::G_UADDO:
658 case TargetOpcode::G_USUBO: {
659 if (TypeIdx == 1)
660 return UnableToLegalize; // TODO
Aditya Nandakumarcef44a22018-12-11 00:48:50 +0000661 auto LHSZext = MIRBuilder.buildInstr(TargetOpcode::G_ZEXT, {WideTy},
662 {MI.getOperand(2).getReg()});
663 auto RHSZext = MIRBuilder.buildInstr(TargetOpcode::G_ZEXT, {WideTy},
664 {MI.getOperand(3).getReg()});
Aditya Nandakumar6d47a412018-08-29 03:17:08 +0000665 unsigned Opcode = MI.getOpcode() == TargetOpcode::G_UADDO
666 ? TargetOpcode::G_ADD
667 : TargetOpcode::G_SUB;
668 // Do the arithmetic in the larger type.
Aditya Nandakumarcef44a22018-12-11 00:48:50 +0000669 auto NewOp = MIRBuilder.buildInstr(Opcode, {WideTy}, {LHSZext, RHSZext});
Aditya Nandakumar6d47a412018-08-29 03:17:08 +0000670 LLT OrigTy = MRI.getType(MI.getOperand(0).getReg());
671 APInt Mask = APInt::getAllOnesValue(OrigTy.getSizeInBits());
672 auto AndOp = MIRBuilder.buildInstr(
Aditya Nandakumarcef44a22018-12-11 00:48:50 +0000673 TargetOpcode::G_AND, {WideTy},
674 {NewOp, MIRBuilder.buildConstant(WideTy, Mask.getZExtValue())});
Aditya Nandakumar6d47a412018-08-29 03:17:08 +0000675 // There is no overflow if the AndOp is the same as NewOp.
676 MIRBuilder.buildICmp(CmpInst::ICMP_NE, MI.getOperand(1).getReg(), NewOp,
677 AndOp);
678 // Now trunc the NewOp to the original result.
679 MIRBuilder.buildTrunc(MI.getOperand(0).getReg(), NewOp);
680 MI.eraseFromParent();
681 return Legalized;
682 }
Aditya Nandakumarc1061832018-08-22 17:59:18 +0000683 case TargetOpcode::G_CTTZ:
684 case TargetOpcode::G_CTTZ_ZERO_UNDEF:
685 case TargetOpcode::G_CTLZ:
686 case TargetOpcode::G_CTLZ_ZERO_UNDEF:
687 case TargetOpcode::G_CTPOP: {
688 // First ZEXT the input.
689 auto MIBSrc = MIRBuilder.buildZExt(WideTy, MI.getOperand(1).getReg());
690 LLT CurTy = MRI.getType(MI.getOperand(0).getReg());
691 if (MI.getOpcode() == TargetOpcode::G_CTTZ) {
692 // The count is the same in the larger type except if the original
693 // value was zero. This can be handled by setting the bit just off
694 // the top of the original type.
695 auto TopBit =
696 APInt::getOneBitSet(WideTy.getSizeInBits(), CurTy.getSizeInBits());
697 MIBSrc = MIRBuilder.buildInstr(
Aditya Nandakumarcef44a22018-12-11 00:48:50 +0000698 TargetOpcode::G_OR, {WideTy},
699 {MIBSrc, MIRBuilder.buildConstant(WideTy, TopBit.getSExtValue())});
Aditya Nandakumarc1061832018-08-22 17:59:18 +0000700 }
701 // Perform the operation at the larger size.
Aditya Nandakumarcef44a22018-12-11 00:48:50 +0000702 auto MIBNewOp = MIRBuilder.buildInstr(MI.getOpcode(), {WideTy}, {MIBSrc});
Aditya Nandakumarc1061832018-08-22 17:59:18 +0000703 // This is already the correct result for CTPOP and CTTZs
704 if (MI.getOpcode() == TargetOpcode::G_CTLZ ||
705 MI.getOpcode() == TargetOpcode::G_CTLZ_ZERO_UNDEF) {
706 // The correct result is NewOp - (Difference in widety and current ty).
707 unsigned SizeDiff = WideTy.getSizeInBits() - CurTy.getSizeInBits();
Aditya Nandakumarcef44a22018-12-11 00:48:50 +0000708 MIBNewOp = MIRBuilder.buildInstr(
709 TargetOpcode::G_SUB, {WideTy},
710 {MIBNewOp, MIRBuilder.buildConstant(WideTy, SizeDiff)});
Aditya Nandakumarc1061832018-08-22 17:59:18 +0000711 }
712 auto &TII = *MI.getMF()->getSubtarget().getInstrInfo();
Diana Picus30887bf2018-11-26 11:06:53 +0000713 // Make the original instruction a trunc now, and update its source.
Aditya Nandakumarc1061832018-08-22 17:59:18 +0000714 MI.setDesc(TII.get(TargetOpcode::G_TRUNC));
715 MI.getOperand(1).setReg(MIBNewOp->getOperand(0).getReg());
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000716 Observer.changedInstr(MI);
Aditya Nandakumarc1061832018-08-22 17:59:18 +0000717 return Legalized;
718 }
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000719
Tim Northover61c16142016-08-04 21:39:49 +0000720 case TargetOpcode::G_ADD:
721 case TargetOpcode::G_AND:
722 case TargetOpcode::G_MUL:
723 case TargetOpcode::G_OR:
724 case TargetOpcode::G_XOR:
Justin Bognerddb80ae2017-01-19 07:51:17 +0000725 case TargetOpcode::G_SUB:
Tim Northover32335812016-08-04 18:35:11 +0000726 // Perform operation at larger width (any extension is fine here, high bits
727 // don't affect the result) and then truncate the result back to the
728 // original type.
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000729 widenScalarSrc(MI, WideTy, 1, TargetOpcode::G_ANYEXT);
730 widenScalarSrc(MI, WideTy, 2, TargetOpcode::G_ANYEXT);
731 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000732 Observer.changedInstr(MI);
Roman Tereshin27bba442018-05-09 01:43:12 +0000733 return Legalized;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000734
Roman Tereshin6d266382018-05-09 21:43:30 +0000735 case TargetOpcode::G_SHL:
736 widenScalarSrc(MI, WideTy, 1, TargetOpcode::G_ANYEXT);
737 // The "number of bits to shift" operand must preserve its value as an
738 // unsigned integer:
739 widenScalarSrc(MI, WideTy, 2, TargetOpcode::G_ZEXT);
740 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000741 Observer.changedInstr(MI);
Roman Tereshin6d266382018-05-09 21:43:30 +0000742 return Legalized;
743
Tim Northover7a753d92016-08-26 17:46:06 +0000744 case TargetOpcode::G_SDIV:
Roman Tereshin27bba442018-05-09 01:43:12 +0000745 case TargetOpcode::G_SREM:
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000746 widenScalarSrc(MI, WideTy, 1, TargetOpcode::G_SEXT);
747 widenScalarSrc(MI, WideTy, 2, TargetOpcode::G_SEXT);
748 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000749 Observer.changedInstr(MI);
Roman Tereshin27bba442018-05-09 01:43:12 +0000750 return Legalized;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000751
Roman Tereshin6d266382018-05-09 21:43:30 +0000752 case TargetOpcode::G_ASHR:
753 widenScalarSrc(MI, WideTy, 1, TargetOpcode::G_SEXT);
754 // The "number of bits to shift" operand must preserve its value as an
755 // unsigned integer:
756 widenScalarSrc(MI, WideTy, 2, TargetOpcode::G_ZEXT);
757 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000758 Observer.changedInstr(MI);
Roman Tereshin6d266382018-05-09 21:43:30 +0000759 return Legalized;
760
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000761 case TargetOpcode::G_UDIV:
762 case TargetOpcode::G_UREM:
763 case TargetOpcode::G_LSHR:
764 widenScalarSrc(MI, WideTy, 1, TargetOpcode::G_ZEXT);
765 widenScalarSrc(MI, WideTy, 2, TargetOpcode::G_ZEXT);
766 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000767 Observer.changedInstr(MI);
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000768 return Legalized;
769
770 case TargetOpcode::G_SELECT:
Tim Northover868332d2017-02-06 23:41:27 +0000771 if (TypeIdx != 0)
772 return UnableToLegalize;
Tim Northover868332d2017-02-06 23:41:27 +0000773 // Perform operation at larger width (any extension is fine here, high bits
774 // don't affect the result) and then truncate the result back to the
775 // original type.
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000776 widenScalarSrc(MI, WideTy, 2, TargetOpcode::G_ANYEXT);
777 widenScalarSrc(MI, WideTy, 3, TargetOpcode::G_ANYEXT);
778 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000779 Observer.changedInstr(MI);
Roman Tereshin27bba442018-05-09 01:43:12 +0000780 return Legalized;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000781
Ahmed Bougachab6137062017-01-23 21:10:14 +0000782 case TargetOpcode::G_FPTOSI:
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000783 case TargetOpcode::G_FPTOUI:
Ahmed Bougachab6137062017-01-23 21:10:14 +0000784 if (TypeIdx != 0)
785 return UnableToLegalize;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000786 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000787 Observer.changedInstr(MI);
Roman Tereshin27bba442018-05-09 01:43:12 +0000788 return Legalized;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000789
Ahmed Bougachad2948232017-01-20 01:37:24 +0000790 case TargetOpcode::G_SITOFP:
Ahmed Bougachad2948232017-01-20 01:37:24 +0000791 if (TypeIdx != 1)
792 return UnableToLegalize;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000793 widenScalarSrc(MI, WideTy, 1, TargetOpcode::G_SEXT);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000794 Observer.changedInstr(MI);
Roman Tereshin27bba442018-05-09 01:43:12 +0000795 return Legalized;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000796
797 case TargetOpcode::G_UITOFP:
798 if (TypeIdx != 1)
799 return UnableToLegalize;
800 widenScalarSrc(MI, WideTy, 1, TargetOpcode::G_ZEXT);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000801 Observer.changedInstr(MI);
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000802 return Legalized;
803
804 case TargetOpcode::G_INSERT:
Tim Northover0e6afbd2017-02-06 21:56:47 +0000805 if (TypeIdx != 0)
806 return UnableToLegalize;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000807 widenScalarSrc(MI, WideTy, 1, TargetOpcode::G_ANYEXT);
808 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000809 Observer.changedInstr(MI);
Roman Tereshin27bba442018-05-09 01:43:12 +0000810 return Legalized;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000811
Daniel Sanders5eb9f582018-04-28 18:14:50 +0000812 case TargetOpcode::G_LOAD:
Amara Emersoncbc02c72018-02-01 20:47:03 +0000813 // For some types like i24, we might try to widen to i32. To properly handle
814 // this we should be using a dedicated extending load, until then avoid
815 // trying to legalize.
816 if (alignTo(MRI.getType(MI.getOperand(0).getReg()).getSizeInBits(), 8) !=
817 WideTy.getSizeInBits())
818 return UnableToLegalize;
Daniel Sanders5eb9f582018-04-28 18:14:50 +0000819 LLVM_FALLTHROUGH;
820 case TargetOpcode::G_SEXTLOAD:
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000821 case TargetOpcode::G_ZEXTLOAD:
822 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000823 Observer.changedInstr(MI);
Tim Northover3c73e362016-08-23 18:20:09 +0000824 return Legalized;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000825
Tim Northover3c73e362016-08-23 18:20:09 +0000826 case TargetOpcode::G_STORE: {
Tim Northover548feee2017-03-21 22:22:05 +0000827 if (MRI.getType(MI.getOperand(0).getReg()) != LLT::scalar(1) ||
828 WideTy != LLT::scalar(8))
829 return UnableToLegalize;
830
Amara Emerson5a3bb682018-06-01 13:20:32 +0000831 widenScalarSrc(MI, WideTy, 0, TargetOpcode::G_ZEXT);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000832 Observer.changedInstr(MI);
Tim Northover3c73e362016-08-23 18:20:09 +0000833 return Legalized;
834 }
Tim Northoverea904f92016-08-19 22:40:00 +0000835 case TargetOpcode::G_CONSTANT: {
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000836 MachineOperand &SrcMO = MI.getOperand(1);
837 LLVMContext &Ctx = MIRBuilder.getMF().getFunction().getContext();
838 const APInt &Val = SrcMO.getCImm()->getValue().sext(WideTy.getSizeInBits());
839 SrcMO.setCImm(ConstantInt::get(Ctx, Val));
840
841 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000842 Observer.changedInstr(MI);
Tim Northoverea904f92016-08-19 22:40:00 +0000843 return Legalized;
844 }
Tim Northovera11be042016-08-19 22:40:08 +0000845 case TargetOpcode::G_FCONSTANT: {
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000846 MachineOperand &SrcMO = MI.getOperand(1);
Amara Emerson77a5c962018-01-27 07:07:20 +0000847 LLVMContext &Ctx = MIRBuilder.getMF().getFunction().getContext();
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000848 APFloat Val = SrcMO.getFPImm()->getValueAPF();
Amara Emerson77a5c962018-01-27 07:07:20 +0000849 bool LosesInfo;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000850 switch (WideTy.getSizeInBits()) {
851 case 32:
852 Val.convert(APFloat::IEEEsingle(), APFloat::rmTowardZero, &LosesInfo);
853 break;
854 case 64:
855 Val.convert(APFloat::IEEEdouble(), APFloat::rmTowardZero, &LosesInfo);
856 break;
857 default:
858 llvm_unreachable("Unhandled fp widen type");
Tim Northover6cd4b232016-08-23 21:01:26 +0000859 }
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000860 SrcMO.setFPImm(ConstantFP::get(Ctx, Val));
861
862 widenScalarDst(MI, WideTy, 0, TargetOpcode::G_FPTRUNC);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000863 Observer.changedInstr(MI);
Roman Tereshin25cbfe62018-05-08 22:53:09 +0000864 return Legalized;
Roman Tereshin27bba442018-05-09 01:43:12 +0000865 }
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000866 case TargetOpcode::G_BRCOND:
867 widenScalarSrc(MI, WideTy, 0, TargetOpcode::G_ANYEXT);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000868 Observer.changedInstr(MI);
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000869 return Legalized;
870
871 case TargetOpcode::G_FCMP:
872 if (TypeIdx == 0)
873 widenScalarDst(MI, WideTy);
874 else {
875 widenScalarSrc(MI, WideTy, 2, TargetOpcode::G_FPEXT);
876 widenScalarSrc(MI, WideTy, 3, TargetOpcode::G_FPEXT);
Roman Tereshin27bba442018-05-09 01:43:12 +0000877 }
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000878 Observer.changedInstr(MI);
Roman Tereshin27bba442018-05-09 01:43:12 +0000879 return Legalized;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000880
881 case TargetOpcode::G_ICMP:
882 if (TypeIdx == 0)
883 widenScalarDst(MI, WideTy);
884 else {
885 unsigned ExtOpcode = CmpInst::isSigned(static_cast<CmpInst::Predicate>(
886 MI.getOperand(1).getPredicate()))
887 ? TargetOpcode::G_SEXT
888 : TargetOpcode::G_ZEXT;
889 widenScalarSrc(MI, WideTy, 2, ExtOpcode);
890 widenScalarSrc(MI, WideTy, 3, ExtOpcode);
891 }
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000892 Observer.changedInstr(MI);
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000893 return Legalized;
894
895 case TargetOpcode::G_GEP:
Tim Northover22d82cf2016-09-15 11:02:19 +0000896 assert(TypeIdx == 1 && "unable to legalize pointer of GEP");
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000897 widenScalarSrc(MI, WideTy, 2, TargetOpcode::G_SEXT);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000898 Observer.changedInstr(MI);
Tim Northover22d82cf2016-09-15 11:02:19 +0000899 return Legalized;
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000900
Aditya Nandakumar892979e2017-08-25 04:57:27 +0000901 case TargetOpcode::G_PHI: {
902 assert(TypeIdx == 0 && "Expecting only Idx 0");
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000903
904 for (unsigned I = 1; I < MI.getNumOperands(); I += 2) {
905 MachineBasicBlock &OpMBB = *MI.getOperand(I + 1).getMBB();
906 MIRBuilder.setInsertPt(OpMBB, OpMBB.getFirstTerminator());
907 widenScalarSrc(MI, WideTy, I, TargetOpcode::G_ANYEXT);
Aditya Nandakumar892979e2017-08-25 04:57:27 +0000908 }
Roman Tereshind5fa9fd2018-05-09 17:28:18 +0000909
910 MachineBasicBlock &MBB = *MI.getParent();
911 MIRBuilder.setInsertPt(MBB, --MBB.getFirstNonPHI());
912 widenScalarDst(MI, WideTy);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000913 Observer.changedInstr(MI);
Aditya Nandakumar892979e2017-08-25 04:57:27 +0000914 return Legalized;
915 }
Amara Emersoncbd86d82018-10-25 14:04:54 +0000916 case TargetOpcode::G_EXTRACT_VECTOR_ELT:
917 if (TypeIdx != 2)
918 return UnableToLegalize;
919 widenScalarSrc(MI, WideTy, 2, TargetOpcode::G_SEXT);
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +0000920 Observer.changedInstr(MI);
Amara Emersoncbd86d82018-10-25 14:04:54 +0000921 return Legalized;
Tim Northover32335812016-08-04 18:35:11 +0000922 }
Tim Northover33b07d62016-07-22 20:03:43 +0000923}
924
Tim Northover69fa84a2016-10-14 22:18:18 +0000925LegalizerHelper::LegalizeResult
926LegalizerHelper::lower(MachineInstr &MI, unsigned TypeIdx, LLT Ty) {
Tim Northovercecee562016-08-26 17:46:13 +0000927 using namespace TargetOpcode;
Tim Northovercecee562016-08-26 17:46:13 +0000928 MIRBuilder.setInstr(MI);
929
930 switch(MI.getOpcode()) {
931 default:
932 return UnableToLegalize;
933 case TargetOpcode::G_SREM:
934 case TargetOpcode::G_UREM: {
Tim Northover0f140c72016-09-09 11:46:34 +0000935 unsigned QuotReg = MRI.createGenericVirtualRegister(Ty);
936 MIRBuilder.buildInstr(MI.getOpcode() == G_SREM ? G_SDIV : G_UDIV)
Tim Northovercecee562016-08-26 17:46:13 +0000937 .addDef(QuotReg)
938 .addUse(MI.getOperand(1).getReg())
939 .addUse(MI.getOperand(2).getReg());
940
Tim Northover0f140c72016-09-09 11:46:34 +0000941 unsigned ProdReg = MRI.createGenericVirtualRegister(Ty);
942 MIRBuilder.buildMul(ProdReg, QuotReg, MI.getOperand(2).getReg());
943 MIRBuilder.buildSub(MI.getOperand(0).getReg(), MI.getOperand(1).getReg(),
944 ProdReg);
Tim Northovercecee562016-08-26 17:46:13 +0000945 MI.eraseFromParent();
946 return Legalized;
947 }
Tim Northover0a9b2792017-02-08 21:22:15 +0000948 case TargetOpcode::G_SMULO:
949 case TargetOpcode::G_UMULO: {
950 // Generate G_UMULH/G_SMULH to check for overflow and a normal G_MUL for the
951 // result.
952 unsigned Res = MI.getOperand(0).getReg();
953 unsigned Overflow = MI.getOperand(1).getReg();
954 unsigned LHS = MI.getOperand(2).getReg();
955 unsigned RHS = MI.getOperand(3).getReg();
956
957 MIRBuilder.buildMul(Res, LHS, RHS);
958
959 unsigned Opcode = MI.getOpcode() == TargetOpcode::G_SMULO
960 ? TargetOpcode::G_SMULH
961 : TargetOpcode::G_UMULH;
962
963 unsigned HiPart = MRI.createGenericVirtualRegister(Ty);
964 MIRBuilder.buildInstr(Opcode)
965 .addDef(HiPart)
966 .addUse(LHS)
967 .addUse(RHS);
968
969 unsigned Zero = MRI.createGenericVirtualRegister(Ty);
970 MIRBuilder.buildConstant(Zero, 0);
Amara Emerson9de62132018-01-03 04:56:56 +0000971
972 // For *signed* multiply, overflow is detected by checking:
973 // (hi != (lo >> bitwidth-1))
974 if (Opcode == TargetOpcode::G_SMULH) {
975 unsigned Shifted = MRI.createGenericVirtualRegister(Ty);
976 unsigned ShiftAmt = MRI.createGenericVirtualRegister(Ty);
977 MIRBuilder.buildConstant(ShiftAmt, Ty.getSizeInBits() - 1);
978 MIRBuilder.buildInstr(TargetOpcode::G_ASHR)
979 .addDef(Shifted)
980 .addUse(Res)
981 .addUse(ShiftAmt);
982 MIRBuilder.buildICmp(CmpInst::ICMP_NE, Overflow, HiPart, Shifted);
983 } else {
984 MIRBuilder.buildICmp(CmpInst::ICMP_NE, Overflow, HiPart, Zero);
985 }
Tim Northover0a9b2792017-02-08 21:22:15 +0000986 MI.eraseFromParent();
987 return Legalized;
988 }
Volkan Keles5698b2a2017-03-08 18:09:14 +0000989 case TargetOpcode::G_FNEG: {
990 // TODO: Handle vector types once we are able to
991 // represent them.
992 if (Ty.isVector())
993 return UnableToLegalize;
994 unsigned Res = MI.getOperand(0).getReg();
995 Type *ZeroTy;
Matthias Braunf1caa282017-12-15 22:22:58 +0000996 LLVMContext &Ctx = MIRBuilder.getMF().getFunction().getContext();
Volkan Keles5698b2a2017-03-08 18:09:14 +0000997 switch (Ty.getSizeInBits()) {
998 case 16:
999 ZeroTy = Type::getHalfTy(Ctx);
1000 break;
1001 case 32:
1002 ZeroTy = Type::getFloatTy(Ctx);
1003 break;
1004 case 64:
1005 ZeroTy = Type::getDoubleTy(Ctx);
1006 break;
Amara Emersonb6ddbef2017-12-19 17:21:35 +00001007 case 128:
1008 ZeroTy = Type::getFP128Ty(Ctx);
1009 break;
Volkan Keles5698b2a2017-03-08 18:09:14 +00001010 default:
1011 llvm_unreachable("unexpected floating-point type");
1012 }
1013 ConstantFP &ZeroForNegation =
1014 *cast<ConstantFP>(ConstantFP::getZeroValueForNegation(ZeroTy));
Volkan Keles02bb1742018-02-14 19:58:36 +00001015 auto Zero = MIRBuilder.buildFConstant(Ty, ZeroForNegation);
Volkan Keles5698b2a2017-03-08 18:09:14 +00001016 MIRBuilder.buildInstr(TargetOpcode::G_FSUB)
1017 .addDef(Res)
Volkan Keles02bb1742018-02-14 19:58:36 +00001018 .addUse(Zero->getOperand(0).getReg())
Volkan Keles5698b2a2017-03-08 18:09:14 +00001019 .addUse(MI.getOperand(1).getReg());
1020 MI.eraseFromParent();
1021 return Legalized;
1022 }
Volkan Keles225921a2017-03-10 21:25:09 +00001023 case TargetOpcode::G_FSUB: {
1024 // Lower (G_FSUB LHS, RHS) to (G_FADD LHS, (G_FNEG RHS)).
1025 // First, check if G_FNEG is marked as Lower. If so, we may
1026 // end up with an infinite loop as G_FSUB is used to legalize G_FNEG.
Daniel Sanders9ade5592018-01-29 17:37:29 +00001027 if (LI.getAction({G_FNEG, {Ty}}).Action == Lower)
Volkan Keles225921a2017-03-10 21:25:09 +00001028 return UnableToLegalize;
1029 unsigned Res = MI.getOperand(0).getReg();
1030 unsigned LHS = MI.getOperand(1).getReg();
1031 unsigned RHS = MI.getOperand(2).getReg();
1032 unsigned Neg = MRI.createGenericVirtualRegister(Ty);
1033 MIRBuilder.buildInstr(TargetOpcode::G_FNEG).addDef(Neg).addUse(RHS);
1034 MIRBuilder.buildInstr(TargetOpcode::G_FADD)
1035 .addDef(Res)
1036 .addUse(LHS)
1037 .addUse(Neg);
1038 MI.eraseFromParent();
1039 return Legalized;
1040 }
Daniel Sandersaef1dfc2017-11-30 20:11:42 +00001041 case TargetOpcode::G_ATOMIC_CMPXCHG_WITH_SUCCESS: {
1042 unsigned OldValRes = MI.getOperand(0).getReg();
1043 unsigned SuccessRes = MI.getOperand(1).getReg();
1044 unsigned Addr = MI.getOperand(2).getReg();
1045 unsigned CmpVal = MI.getOperand(3).getReg();
1046 unsigned NewVal = MI.getOperand(4).getReg();
1047 MIRBuilder.buildAtomicCmpXchg(OldValRes, Addr, CmpVal, NewVal,
1048 **MI.memoperands_begin());
1049 MIRBuilder.buildICmp(CmpInst::ICMP_EQ, SuccessRes, OldValRes, CmpVal);
1050 MI.eraseFromParent();
1051 return Legalized;
1052 }
Daniel Sanders5eb9f582018-04-28 18:14:50 +00001053 case TargetOpcode::G_LOAD:
1054 case TargetOpcode::G_SEXTLOAD:
1055 case TargetOpcode::G_ZEXTLOAD: {
1056 // Lower to a memory-width G_LOAD and a G_SEXT/G_ZEXT/G_ANYEXT
1057 unsigned DstReg = MI.getOperand(0).getReg();
1058 unsigned PtrReg = MI.getOperand(1).getReg();
1059 LLT DstTy = MRI.getType(DstReg);
1060 auto &MMO = **MI.memoperands_begin();
1061
1062 if (DstTy.getSizeInBits() == MMO.getSize() /* in bytes */ * 8) {
Daniel Sanders2de9d4a2018-04-30 17:20:01 +00001063 // In the case of G_LOAD, this was a non-extending load already and we're
1064 // about to lower to the same instruction.
1065 if (MI.getOpcode() == TargetOpcode::G_LOAD)
1066 return UnableToLegalize;
Daniel Sanders5eb9f582018-04-28 18:14:50 +00001067 MIRBuilder.buildLoad(DstReg, PtrReg, MMO);
1068 MI.eraseFromParent();
1069 return Legalized;
1070 }
1071
1072 if (DstTy.isScalar()) {
1073 unsigned TmpReg = MRI.createGenericVirtualRegister(
1074 LLT::scalar(MMO.getSize() /* in bytes */ * 8));
1075 MIRBuilder.buildLoad(TmpReg, PtrReg, MMO);
1076 switch (MI.getOpcode()) {
1077 default:
1078 llvm_unreachable("Unexpected opcode");
1079 case TargetOpcode::G_LOAD:
1080 MIRBuilder.buildAnyExt(DstReg, TmpReg);
1081 break;
1082 case TargetOpcode::G_SEXTLOAD:
1083 MIRBuilder.buildSExt(DstReg, TmpReg);
1084 break;
1085 case TargetOpcode::G_ZEXTLOAD:
1086 MIRBuilder.buildZExt(DstReg, TmpReg);
1087 break;
1088 }
1089 MI.eraseFromParent();
1090 return Legalized;
1091 }
1092
1093 return UnableToLegalize;
1094 }
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001095 case TargetOpcode::G_CTLZ_ZERO_UNDEF:
1096 case TargetOpcode::G_CTTZ_ZERO_UNDEF:
1097 case TargetOpcode::G_CTLZ:
1098 case TargetOpcode::G_CTTZ:
1099 case TargetOpcode::G_CTPOP:
1100 return lowerBitCount(MI, TypeIdx, Ty);
Tim Northovercecee562016-08-26 17:46:13 +00001101 }
1102}
1103
Tim Northover69fa84a2016-10-14 22:18:18 +00001104LegalizerHelper::LegalizeResult
1105LegalizerHelper::fewerElementsVector(MachineInstr &MI, unsigned TypeIdx,
1106 LLT NarrowTy) {
Quentin Colombet5e60bcd2016-08-27 02:38:21 +00001107 // FIXME: Don't know how to handle secondary types yet.
1108 if (TypeIdx != 0)
1109 return UnableToLegalize;
Tim Northover33b07d62016-07-22 20:03:43 +00001110 switch (MI.getOpcode()) {
1111 default:
1112 return UnableToLegalize;
1113 case TargetOpcode::G_ADD: {
1114 unsigned NarrowSize = NarrowTy.getSizeInBits();
Tim Northover0f140c72016-09-09 11:46:34 +00001115 unsigned DstReg = MI.getOperand(0).getReg();
Kristof Beylsaf9814a2017-11-07 10:34:34 +00001116 unsigned Size = MRI.getType(DstReg).getSizeInBits();
1117 int NumParts = Size / NarrowSize;
1118 // FIXME: Don't know how to handle the situation where the small vectors
1119 // aren't all the same size yet.
1120 if (Size % NarrowSize != 0)
1121 return UnableToLegalize;
Tim Northover33b07d62016-07-22 20:03:43 +00001122
1123 MIRBuilder.setInstr(MI);
1124
Tim Northoverb18ea162016-09-20 15:20:36 +00001125 SmallVector<unsigned, 2> Src1Regs, Src2Regs, DstRegs;
Tim Northover33b07d62016-07-22 20:03:43 +00001126 extractParts(MI.getOperand(1).getReg(), NarrowTy, NumParts, Src1Regs);
1127 extractParts(MI.getOperand(2).getReg(), NarrowTy, NumParts, Src2Regs);
1128
1129 for (int i = 0; i < NumParts; ++i) {
Tim Northover0f140c72016-09-09 11:46:34 +00001130 unsigned DstReg = MRI.createGenericVirtualRegister(NarrowTy);
1131 MIRBuilder.buildAdd(DstReg, Src1Regs[i], Src2Regs[i]);
Tim Northover33b07d62016-07-22 20:03:43 +00001132 DstRegs.push_back(DstReg);
1133 }
1134
Amara Emerson5ec14602018-12-10 18:44:58 +00001135 MIRBuilder.buildConcatVectors(DstReg, DstRegs);
Tim Northover33b07d62016-07-22 20:03:43 +00001136 MI.eraseFromParent();
1137 return Legalized;
1138 }
1139 }
1140}
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001141
1142LegalizerHelper::LegalizeResult
1143LegalizerHelper::lowerBitCount(MachineInstr &MI, unsigned TypeIdx, LLT Ty) {
1144 unsigned Opc = MI.getOpcode();
1145 auto &TII = *MI.getMF()->getSubtarget().getInstrInfo();
Diana Picus0528e2c2018-11-26 11:07:02 +00001146 auto isSupported = [this](const LegalityQuery &Q) {
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001147 auto QAction = LI.getAction(Q).Action;
Diana Picus0528e2c2018-11-26 11:07:02 +00001148 return QAction == Legal || QAction == Libcall || QAction == Custom;
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001149 };
1150 switch (Opc) {
1151 default:
1152 return UnableToLegalize;
1153 case TargetOpcode::G_CTLZ_ZERO_UNDEF: {
1154 // This trivially expands to CTLZ.
1155 MI.setDesc(TII.get(TargetOpcode::G_CTLZ));
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +00001156 Observer.changedInstr(MI);
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001157 return Legalized;
1158 }
1159 case TargetOpcode::G_CTLZ: {
1160 unsigned SrcReg = MI.getOperand(1).getReg();
1161 unsigned Len = Ty.getSizeInBits();
Diana Picus0528e2c2018-11-26 11:07:02 +00001162 if (isSupported({TargetOpcode::G_CTLZ_ZERO_UNDEF, {Ty}})) {
1163 // If CTLZ_ZERO_UNDEF is supported, emit that and a select for zero.
Aditya Nandakumarcef44a22018-12-11 00:48:50 +00001164 auto MIBCtlzZU = MIRBuilder.buildInstr(TargetOpcode::G_CTLZ_ZERO_UNDEF,
1165 {Ty}, {SrcReg});
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001166 auto MIBZero = MIRBuilder.buildConstant(Ty, 0);
1167 auto MIBLen = MIRBuilder.buildConstant(Ty, Len);
1168 auto MIBICmp = MIRBuilder.buildICmp(CmpInst::ICMP_EQ, LLT::scalar(1),
1169 SrcReg, MIBZero);
1170 MIRBuilder.buildSelect(MI.getOperand(0).getReg(), MIBICmp, MIBLen,
1171 MIBCtlzZU);
1172 MI.eraseFromParent();
1173 return Legalized;
1174 }
1175 // for now, we do this:
1176 // NewLen = NextPowerOf2(Len);
1177 // x = x | (x >> 1);
1178 // x = x | (x >> 2);
1179 // ...
1180 // x = x | (x >>16);
1181 // x = x | (x >>32); // for 64-bit input
1182 // Upto NewLen/2
1183 // return Len - popcount(x);
1184 //
1185 // Ref: "Hacker's Delight" by Henry Warren
1186 unsigned Op = SrcReg;
1187 unsigned NewLen = PowerOf2Ceil(Len);
1188 for (unsigned i = 0; (1U << i) <= (NewLen / 2); ++i) {
1189 auto MIBShiftAmt = MIRBuilder.buildConstant(Ty, 1ULL << i);
1190 auto MIBOp = MIRBuilder.buildInstr(
Aditya Nandakumarcef44a22018-12-11 00:48:50 +00001191 TargetOpcode::G_OR, {Ty},
1192 {Op, MIRBuilder.buildInstr(TargetOpcode::G_LSHR, {Ty},
1193 {Op, MIBShiftAmt})});
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001194 Op = MIBOp->getOperand(0).getReg();
1195 }
Aditya Nandakumarcef44a22018-12-11 00:48:50 +00001196 auto MIBPop = MIRBuilder.buildInstr(TargetOpcode::G_CTPOP, {Ty}, {Op});
1197 MIRBuilder.buildInstr(TargetOpcode::G_SUB, {MI.getOperand(0).getReg()},
1198 {MIRBuilder.buildConstant(Ty, Len), MIBPop});
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001199 MI.eraseFromParent();
1200 return Legalized;
1201 }
1202 case TargetOpcode::G_CTTZ_ZERO_UNDEF: {
1203 // This trivially expands to CTTZ.
1204 MI.setDesc(TII.get(TargetOpcode::G_CTTZ));
Aditya Nandakumarf75d4f32018-12-05 20:14:52 +00001205 Observer.changedInstr(MI);
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001206 return Legalized;
1207 }
1208 case TargetOpcode::G_CTTZ: {
1209 unsigned SrcReg = MI.getOperand(1).getReg();
1210 unsigned Len = Ty.getSizeInBits();
Diana Picus0528e2c2018-11-26 11:07:02 +00001211 if (isSupported({TargetOpcode::G_CTTZ_ZERO_UNDEF, {Ty}})) {
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001212 // If CTTZ_ZERO_UNDEF is legal or custom, emit that and a select with
1213 // zero.
Aditya Nandakumarcef44a22018-12-11 00:48:50 +00001214 auto MIBCttzZU = MIRBuilder.buildInstr(TargetOpcode::G_CTTZ_ZERO_UNDEF,
1215 {Ty}, {SrcReg});
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001216 auto MIBZero = MIRBuilder.buildConstant(Ty, 0);
1217 auto MIBLen = MIRBuilder.buildConstant(Ty, Len);
1218 auto MIBICmp = MIRBuilder.buildICmp(CmpInst::ICMP_EQ, LLT::scalar(1),
1219 SrcReg, MIBZero);
1220 MIRBuilder.buildSelect(MI.getOperand(0).getReg(), MIBICmp, MIBLen,
1221 MIBCttzZU);
1222 MI.eraseFromParent();
1223 return Legalized;
1224 }
1225 // for now, we use: { return popcount(~x & (x - 1)); }
1226 // unless the target has ctlz but not ctpop, in which case we use:
1227 // { return 32 - nlz(~x & (x-1)); }
1228 // Ref: "Hacker's Delight" by Henry Warren
1229 auto MIBCstNeg1 = MIRBuilder.buildConstant(Ty, -1);
1230 auto MIBNot =
Aditya Nandakumarcef44a22018-12-11 00:48:50 +00001231 MIRBuilder.buildInstr(TargetOpcode::G_XOR, {Ty}, {SrcReg, MIBCstNeg1});
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001232 auto MIBTmp = MIRBuilder.buildInstr(
Aditya Nandakumarcef44a22018-12-11 00:48:50 +00001233 TargetOpcode::G_AND, {Ty},
1234 {MIBNot, MIRBuilder.buildInstr(TargetOpcode::G_ADD, {Ty},
1235 {SrcReg, MIBCstNeg1})});
Diana Picus0528e2c2018-11-26 11:07:02 +00001236 if (!isSupported({TargetOpcode::G_CTPOP, {Ty}}) &&
1237 isSupported({TargetOpcode::G_CTLZ, {Ty}})) {
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001238 auto MIBCstLen = MIRBuilder.buildConstant(Ty, Len);
1239 MIRBuilder.buildInstr(
Aditya Nandakumarcef44a22018-12-11 00:48:50 +00001240 TargetOpcode::G_SUB, {MI.getOperand(0).getReg()},
1241 {MIBCstLen,
1242 MIRBuilder.buildInstr(TargetOpcode::G_CTLZ, {Ty}, {MIBTmp})});
Aditya Nandakumarc0333f72018-08-21 17:30:31 +00001243 MI.eraseFromParent();
1244 return Legalized;
1245 }
1246 MI.setDesc(TII.get(TargetOpcode::G_CTPOP));
1247 MI.getOperand(1).setReg(MIBTmp->getOperand(0).getReg());
1248 return Legalized;
1249 }
1250 }
1251}