//===-- AutoUpgrade.cpp - Implement auto-upgrade helper functions ---------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements the auto-upgrade helper functions.
// This is where deprecated IR intrinsics and other IR features are updated to
// current specifications.
//
//===----------------------------------------------------------------------===//

#include "llvm/IR/AutoUpgrade.h"
#include "llvm/IR/CFG.h"
#include "llvm/IR/CallSite.h"
#include "llvm/IR/Constants.h"
#include "llvm/IR/DIBuilder.h"
#include "llvm/IR/DebugInfo.h"
#include "llvm/IR/DiagnosticInfo.h"
#include "llvm/IR/Function.h"
#include "llvm/IR/IRBuilder.h"
#include "llvm/IR/Instruction.h"
#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/LLVMContext.h"
#include "llvm/IR/Module.h"
#include "llvm/Support/ErrorHandling.h"
#include "llvm/Support/Regex.h"
#include <cstring>
using namespace llvm;
33
Nadav Rotem17ee58a2012-06-10 18:42:51 +000034// Upgrade the declarations of the SSE4.1 functions whose arguments have
35// changed their type from v4f32 to v2i64.
36static bool UpgradeSSE41Function(Function* F, Intrinsic::ID IID,
37 Function *&NewFn) {
38 // Check whether this is an old version of the function, which received
39 // v4f32 arguments.
40 Type *Arg0Type = F->getFunctionType()->getParamType(0);
41 if (Arg0Type != VectorType::get(Type::getFloatTy(F->getContext()), 4))
42 return false;
43
44 // Yes, it's old, replace it with new version.
45 F->setName(F->getName() + ".old");
46 NewFn = Intrinsic::getDeclaration(F->getParent(), IID);
47 return true;
48}
Chandler Carruth7132e002007-08-04 01:51:18 +000049
Chandler Carruth373b2b12014-09-06 10:00:01 +000050// Upgrade the declarations of intrinsic functions whose 8-bit immediate mask
51// arguments have changed their type from i32 to i8.
52static bool UpgradeX86IntrinsicsWith8BitMask(Function *F, Intrinsic::ID IID,
53 Function *&NewFn) {
54 // Check that the last argument is an i32.
55 Type *LastArgType = F->getFunctionType()->getParamType(
56 F->getFunctionType()->getNumParams() - 1);
57 if (!LastArgType->isIntegerTy(32))
58 return false;
59
60 // Move this function aside and map down.
61 F->setName(F->getName() + ".old");
62 NewFn = Intrinsic::getDeclaration(F->getParent(), IID);
63 return true;
64}
65
Evan Cheng0e179d02007-12-17 22:33:23 +000066static bool UpgradeIntrinsicFunction1(Function *F, Function *&NewFn) {
Chandler Carruth7132e002007-08-04 01:51:18 +000067 assert(F && "Illegal to upgrade a non-existent Function.");
68
Chandler Carruth7132e002007-08-04 01:51:18 +000069 // Quickly eliminate it, if it's not a candidate.
Chris Lattnerb372f662011-06-18 18:56:39 +000070 StringRef Name = F->getName();
71 if (Name.size() <= 8 || !Name.startswith("llvm."))
Evan Cheng0e179d02007-12-17 22:33:23 +000072 return false;
Chris Lattnerb372f662011-06-18 18:56:39 +000073 Name = Name.substr(5); // Strip off "llvm."
Chris Lattner0bcbde42011-11-27 08:42:07 +000074
Chris Lattnerb372f662011-06-18 18:56:39 +000075 switch (Name[0]) {
Chandler Carruth7132e002007-08-04 01:51:18 +000076 default: break;
Joel Jones43cb8782012-07-13 23:25:25 +000077 case 'a': {
78 if (Name.startswith("arm.neon.vclz")) {
79 Type* args[2] = {
Matt Arsenaultc4c92262013-07-20 17:46:00 +000080 F->arg_begin()->getType(),
Joel Jones43cb8782012-07-13 23:25:25 +000081 Type::getInt1Ty(F->getContext())
82 };
83 // Can't use Intrinsic::getDeclaration here as it adds a ".i1" to
84 // the end of the name. Change name from llvm.arm.neon.vclz.* to
85 // llvm.ctlz.*
86 FunctionType* fType = FunctionType::get(F->getReturnType(), args, false);
Matt Arsenaultc4c92262013-07-20 17:46:00 +000087 NewFn = Function::Create(fType, F->getLinkage(),
Joel Jones43cb8782012-07-13 23:25:25 +000088 "llvm.ctlz." + Name.substr(14), F->getParent());
89 return true;
90 }
Joel Jonesb84f7be2012-07-18 00:02:16 +000091 if (Name.startswith("arm.neon.vcnt")) {
92 NewFn = Intrinsic::getDeclaration(F->getParent(), Intrinsic::ctpop,
93 F->arg_begin()->getType());
94 return true;
95 }
Jeroen Ketemaab99b592015-09-30 10:56:37 +000096 Regex vldRegex("^arm\\.neon\\.vld([1234]|[234]lane)\\.v[a-z0-9]*$");
97 if (vldRegex.match(Name)) {
98 auto fArgs = F->getFunctionType()->params();
99 SmallVector<Type *, 4> Tys(fArgs.begin(), fArgs.end());
100 // Can't use Intrinsic::getDeclaration here as the return types might
101 // then only be structurally equal.
102 FunctionType* fType = FunctionType::get(F->getReturnType(), Tys, false);
103 NewFn = Function::Create(fType, F->getLinkage(),
104 "llvm." + Name + ".p0i8", F->getParent());
105 return true;
106 }
107 Regex vstRegex("^arm\\.neon\\.vst([1234]|[234]lane)\\.v[a-z0-9]*$");
108 if (vstRegex.match(Name)) {
Craig Topper26260942015-10-18 05:15:34 +0000109 static const Intrinsic::ID StoreInts[] = {Intrinsic::arm_neon_vst1,
110 Intrinsic::arm_neon_vst2,
111 Intrinsic::arm_neon_vst3,
112 Intrinsic::arm_neon_vst4};
Jeroen Ketemaab99b592015-09-30 10:56:37 +0000113
Craig Topper26260942015-10-18 05:15:34 +0000114 static const Intrinsic::ID StoreLaneInts[] = {
115 Intrinsic::arm_neon_vst2lane, Intrinsic::arm_neon_vst3lane,
116 Intrinsic::arm_neon_vst4lane
117 };
Jeroen Ketemaab99b592015-09-30 10:56:37 +0000118
119 auto fArgs = F->getFunctionType()->params();
120 Type *Tys[] = {fArgs[0], fArgs[1]};
121 if (Name.find("lane") == StringRef::npos)
122 NewFn = Intrinsic::getDeclaration(F->getParent(),
123 StoreInts[fArgs.size() - 3], Tys);
124 else
125 NewFn = Intrinsic::getDeclaration(F->getParent(),
126 StoreLaneInts[fArgs.size() - 5], Tys);
127 return true;
128 }
Marcin Koscielnicki3fdc2572016-04-19 20:51:05 +0000129 if (Name == "aarch64.thread.pointer" || Name == "arm.thread.pointer") {
130 NewFn = Intrinsic::getDeclaration(F->getParent(), Intrinsic::thread_pointer);
131 return true;
132 }
Joel Jones43cb8782012-07-13 23:25:25 +0000133 break;
134 }
Jeroen Ketemaab99b592015-09-30 10:56:37 +0000135
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000136 case 'c': {
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000137 if (Name.startswith("ctlz.") && F->arg_size() == 1) {
138 F->setName(Name + ".old");
Chandler Carruthd4a02402011-12-12 10:57:20 +0000139 NewFn = Intrinsic::getDeclaration(F->getParent(), Intrinsic::ctlz,
140 F->arg_begin()->getType());
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000141 return true;
142 }
143 if (Name.startswith("cttz.") && F->arg_size() == 1) {
144 F->setName(Name + ".old");
Chandler Carruthd4a02402011-12-12 10:57:20 +0000145 NewFn = Intrinsic::getDeclaration(F->getParent(), Intrinsic::cttz,
146 F->arg_begin()->getType());
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000147 return true;
148 }
149 break;
150 }
Adrian Prantl87b7eb92014-10-01 18:55:02 +0000151
Matt Arsenaultfbcbce42013-10-07 18:06:48 +0000152 case 'o':
153 // We only need to change the name to match the mangling including the
154 // address space.
155 if (F->arg_size() == 2 && Name.startswith("objectsize.")) {
156 Type *Tys[2] = { F->getReturnType(), F->arg_begin()->getType() };
157 if (F->getName() != Intrinsic::getName(Intrinsic::objectsize, Tys)) {
158 F->setName(Name + ".old");
159 NewFn = Intrinsic::getDeclaration(F->getParent(),
160 Intrinsic::objectsize, Tys);
161 return true;
162 }
163 }
164 break;
165
Tim Shen00127562016-04-08 21:26:31 +0000166 case 's':
167 if (Name == "stackprotectorcheck") {
168 NewFn = nullptr;
169 return true;
170 }
171
Craig Topper3b1817d2012-02-03 06:10:55 +0000172 case 'x': {
173 if (Name.startswith("x86.sse2.pcmpeq.") ||
174 Name.startswith("x86.sse2.pcmpgt.") ||
175 Name.startswith("x86.avx2.pcmpeq.") ||
Craig Topperd3c9e402012-04-18 05:24:00 +0000176 Name.startswith("x86.avx2.pcmpgt.") ||
Sanjay Patel51ab7572016-06-16 15:48:30 +0000177 Name == "x86.sse41.pmaxsb" ||
178 Name == "x86.sse2.pmaxs.w" ||
179 Name == "x86.sse41.pmaxsd" ||
180 Name == "x86.sse2.pmaxu.b" ||
181 Name == "x86.sse41.pmaxuw" ||
182 Name == "x86.sse41.pmaxud" ||
183 Name == "x86.sse41.pminsb" ||
184 Name == "x86.sse2.pmins.w" ||
185 Name == "x86.sse41.pminsd" ||
186 Name == "x86.sse2.pminu.b" ||
187 Name == "x86.sse41.pminuw" ||
188 Name == "x86.sse41.pminud" ||
Sanjay Patel0e9afea2016-06-16 18:44:20 +0000189 Name.startswith("x86.avx2.pmax") ||
190 Name.startswith("x86.avx2.pmin") ||
Ahmed Bougacha1a4987052015-08-20 20:36:19 +0000191 Name.startswith("x86.avx2.vbroadcast") ||
192 Name.startswith("x86.avx2.pbroadcast") ||
Craig Topper7daf8972012-05-08 06:58:15 +0000193 Name.startswith("x86.avx.vpermil.") ||
Craig Topper10679862016-06-12 14:11:32 +0000194 Name.startswith("x86.sse2.pshuf") ||
Craig Topper13cf7ca2016-06-13 02:36:48 +0000195 Name.startswith("x86.avx512.mask.pshuf.d.") ||
196 Name.startswith("x86.avx512.mask.pshufl.w.") ||
197 Name.startswith("x86.avx512.mask.pshufh.w.") ||
Simon Pilgrim9cb018b2015-09-23 08:48:33 +0000198 Name.startswith("x86.sse41.pmovsx") ||
Simon Pilgrim9602d672016-05-28 18:03:41 +0000199 Name.startswith("x86.sse41.pmovzx") ||
200 Name.startswith("x86.avx2.pmovsx") ||
201 Name.startswith("x86.avx2.pmovzx") ||
Simon Pilgrim4298d062016-05-25 08:59:18 +0000202 Name == "x86.sse2.cvtdq2pd" ||
203 Name == "x86.sse2.cvtps2pd" ||
204 Name == "x86.avx.cvtdq2.pd.256" ||
205 Name == "x86.avx.cvt.ps2.pd.256" ||
Simon Pilgrim0afd5a42016-06-02 10:55:21 +0000206 Name == "x86.sse2.cvttps2dq" ||
207 Name.startswith("x86.avx.cvtt.") ||
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000208 Name.startswith("x86.avx.vinsertf128.") ||
Sanjay Patel4339abe2015-03-12 23:16:18 +0000209 Name == "x86.avx2.vinserti128" ||
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000210 Name.startswith("x86.avx.vextractf128.") ||
Sanjay Patel4339abe2015-03-12 23:16:18 +0000211 Name == "x86.avx2.vextracti128" ||
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000212 Name.startswith("x86.avx.movnt.") ||
Craig Topper12e322a2016-05-25 06:56:32 +0000213 Name == "x86.sse2.storel.dq" ||
Craig Topper8287fd82016-05-30 23:15:56 +0000214 Name.startswith("x86.sse.storeu.") ||
215 Name.startswith("x86.sse2.storeu.") ||
216 Name.startswith("x86.avx.storeu.") ||
Craig Topper50f85c22016-05-31 01:50:02 +0000217 Name.startswith("x86.avx512.mask.storeu.p") ||
218 Name.startswith("x86.avx512.mask.storeu.b.") ||
219 Name.startswith("x86.avx512.mask.storeu.w.") ||
220 Name.startswith("x86.avx512.mask.storeu.d.") ||
221 Name.startswith("x86.avx512.mask.storeu.q.") ||
222 Name.startswith("x86.avx512.mask.store.p") ||
223 Name.startswith("x86.avx512.mask.store.b.") ||
224 Name.startswith("x86.avx512.mask.store.w.") ||
225 Name.startswith("x86.avx512.mask.store.d.") ||
226 Name.startswith("x86.avx512.mask.store.q.") ||
Craig Topperf10fbfa2016-06-02 04:19:36 +0000227 Name.startswith("x86.avx512.mask.loadu.p") ||
228 Name.startswith("x86.avx512.mask.loadu.b.") ||
229 Name.startswith("x86.avx512.mask.loadu.w.") ||
230 Name.startswith("x86.avx512.mask.loadu.d.") ||
231 Name.startswith("x86.avx512.mask.loadu.q.") ||
232 Name.startswith("x86.avx512.mask.load.p") ||
233 Name.startswith("x86.avx512.mask.load.b.") ||
234 Name.startswith("x86.avx512.mask.load.w.") ||
235 Name.startswith("x86.avx512.mask.load.d.") ||
236 Name.startswith("x86.avx512.mask.load.q.") ||
Craig Topperef9e9932013-10-15 05:20:47 +0000237 Name == "x86.sse42.crc32.64.8" ||
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000238 Name.startswith("x86.avx.vbroadcast.s") ||
Craig Topper33350cc2016-06-06 06:12:54 +0000239 Name.startswith("x86.avx512.mask.palignr.") ||
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000240 Name.startswith("x86.sse2.psll.dq") ||
241 Name.startswith("x86.sse2.psrl.dq") ||
242 Name.startswith("x86.avx2.psll.dq") ||
243 Name.startswith("x86.avx2.psrl.dq") ||
Simon Pilgrimf7186822016-06-09 21:09:03 +0000244 Name.startswith("x86.avx512.psll.dq") ||
245 Name.startswith("x86.avx512.psrl.dq") ||
Craig Topper782d6202015-02-28 19:33:17 +0000246 Name == "x86.sse41.pblendw" ||
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000247 Name.startswith("x86.sse41.blendp") ||
248 Name.startswith("x86.avx.blend.p") ||
Craig Topper782d6202015-02-28 19:33:17 +0000249 Name == "x86.avx2.pblendw" ||
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000250 Name.startswith("x86.avx2.pblendd.") ||
Juergen Ributzka1f7a1762015-03-04 00:13:25 +0000251 Name == "x86.avx2.vbroadcasti128" ||
Simon Pilgrime88dc042015-11-03 20:27:01 +0000252 Name == "x86.xop.vpcmov" ||
Craig Topper3352ba52012-06-09 16:46:13 +0000253 (Name.startswith("x86.xop.vpcom") && F->arg_size() == 2)) {
Craig Topperc6207612014-04-09 06:08:46 +0000254 NewFn = nullptr;
Craig Topper3b1817d2012-02-03 06:10:55 +0000255 return true;
256 }
Nadav Rotem17ee58a2012-06-10 18:42:51 +0000257 // SSE4.1 ptest functions may have an old signature.
258 if (Name.startswith("x86.sse41.ptest")) {
259 if (Name == "x86.sse41.ptestc")
260 return UpgradeSSE41Function(F, Intrinsic::x86_sse41_ptestc, NewFn);
261 if (Name == "x86.sse41.ptestz")
262 return UpgradeSSE41Function(F, Intrinsic::x86_sse41_ptestz, NewFn);
263 if (Name == "x86.sse41.ptestnzc")
264 return UpgradeSSE41Function(F, Intrinsic::x86_sse41_ptestnzc, NewFn);
265 }
Sanjay Patel1c3eaec2015-02-28 22:25:06 +0000266 // Several blend and other instructions with masks used the wrong number of
Chandler Carruth373b2b12014-09-06 10:00:01 +0000267 // bits.
Chandler Carruth373b2b12014-09-06 10:00:01 +0000268 if (Name == "x86.sse41.insertps")
269 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_sse41_insertps,
270 NewFn);
271 if (Name == "x86.sse41.dppd")
272 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_sse41_dppd,
273 NewFn);
274 if (Name == "x86.sse41.dpps")
275 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_sse41_dpps,
276 NewFn);
277 if (Name == "x86.sse41.mpsadbw")
278 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_sse41_mpsadbw,
279 NewFn);
Chandler Carruth373b2b12014-09-06 10:00:01 +0000280 if (Name == "x86.avx.dp.ps.256")
281 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_avx_dp_ps_256,
282 NewFn);
Chandler Carruth373b2b12014-09-06 10:00:01 +0000283 if (Name == "x86.avx2.mpsadbw")
284 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_avx2_mpsadbw,
285 NewFn);
Craig Topper29f2e952015-01-25 23:26:02 +0000286
Craig Topper71dc02d2012-06-13 07:18:53 +0000287 // frcz.ss/sd may need to have an argument dropped
288 if (Name.startswith("x86.xop.vfrcz.ss") && F->arg_size() == 2) {
289 F->setName(Name + ".old");
290 NewFn = Intrinsic::getDeclaration(F->getParent(),
291 Intrinsic::x86_xop_vfrcz_ss);
292 return true;
293 }
294 if (Name.startswith("x86.xop.vfrcz.sd") && F->arg_size() == 2) {
295 F->setName(Name + ".old");
296 NewFn = Intrinsic::getDeclaration(F->getParent(),
297 Intrinsic::x86_xop_vfrcz_sd);
298 return true;
299 }
Craig Topper720c7bd2012-06-03 08:07:25 +0000300 // Fix the FMA4 intrinsics to remove the 4
301 if (Name.startswith("x86.fma4.")) {
Craig Topper2c5ccd82012-06-03 16:48:52 +0000302 F->setName("llvm.x86.fma" + Name.substr(8));
303 NewFn = F;
304 return true;
Craig Topper720c7bd2012-06-03 08:07:25 +0000305 }
Simon Pilgrime85506b2016-06-03 08:06:03 +0000306 // Upgrade any XOP PERMIL2 index operand still using a float/double vector.
307 if (Name.startswith("x86.xop.vpermil2")) {
308 auto Params = F->getFunctionType()->params();
309 auto Idx = Params[2];
310 if (Idx->getScalarType()->isFloatingPointTy()) {
311 F->setName(Name + ".old");
312 unsigned IdxSize = Idx->getPrimitiveSizeInBits();
313 unsigned EltSize = Idx->getScalarSizeInBits();
314 Intrinsic::ID Permil2ID;
315 if (EltSize == 64 && IdxSize == 128)
316 Permil2ID = Intrinsic::x86_xop_vpermil2pd;
317 else if (EltSize == 32 && IdxSize == 128)
318 Permil2ID = Intrinsic::x86_xop_vpermil2ps;
319 else if (EltSize == 64 && IdxSize == 256)
320 Permil2ID = Intrinsic::x86_xop_vpermil2pd_256;
321 else
322 Permil2ID = Intrinsic::x86_xop_vpermil2ps_256;
323 NewFn = Intrinsic::getDeclaration(F->getParent(), Permil2ID);
324 return true;
325 }
326 }
Craig Topper3b1817d2012-02-03 06:10:55 +0000327 break;
328 }
Chris Lattnerb372f662011-06-18 18:56:39 +0000329 }
Chandler Carruth7132e002007-08-04 01:51:18 +0000330
Nadav Rotem17ee58a2012-06-10 18:42:51 +0000331 // This may not belong here. This function is effectively being overloaded
332 // to both detect an intrinsic which needs upgrading, and to provide the
333 // upgraded form of the intrinsic. We should perhaps have two separate
Chandler Carruth7132e002007-08-04 01:51:18 +0000334 // functions for this.
Evan Cheng0e179d02007-12-17 22:33:23 +0000335 return false;
Chandler Carruth7132e002007-08-04 01:51:18 +0000336}
337
Evan Cheng0e179d02007-12-17 22:33:23 +0000338bool llvm::UpgradeIntrinsicFunction(Function *F, Function *&NewFn) {
Craig Topperc6207612014-04-09 06:08:46 +0000339 NewFn = nullptr;
Evan Cheng0e179d02007-12-17 22:33:23 +0000340 bool Upgraded = UpgradeIntrinsicFunction1(F, NewFn);
Filipe Cabecinhas0011c582015-07-03 20:12:01 +0000341 assert(F != NewFn && "Intrinsic function upgraded to the same function");
Duncan Sands38ef3a82007-12-03 20:06:50 +0000342
343 // Upgrade intrinsic attributes. This does not change the function.
Evan Cheng0e179d02007-12-17 22:33:23 +0000344 if (NewFn)
345 F = NewFn;
Pete Cooper9e1d3352015-05-20 17:16:39 +0000346 if (Intrinsic::ID id = F->getIntrinsicID())
347 F->setAttributes(Intrinsic::getAttributes(F->getContext(), id));
Duncan Sands38ef3a82007-12-03 20:06:50 +0000348 return Upgraded;
349}
350
Bill Wendlinge26fffc2010-09-10 18:51:56 +0000351bool llvm::UpgradeGlobalVariable(GlobalVariable *GV) {
Chris Lattner80ed9dc2011-06-18 06:05:24 +0000352 // Nothing to do yet.
Bill Wendlinge26fffc2010-09-10 18:51:56 +0000353 return false;
354}
355
Simon Pilgrimf7186822016-06-09 21:09:03 +0000356// Handles upgrading SSE2/AVX2/AVX512BW PSLLDQ intrinsics by converting them
Craig Topperb324e432015-02-18 06:24:44 +0000357// to byte shuffles.
358static Value *UpgradeX86PSLLDQIntrinsics(IRBuilder<> &Builder, LLVMContext &C,
Craig Topper7355ac32016-05-29 06:37:33 +0000359 Value *Op, unsigned Shift) {
360 Type *ResultTy = Op->getType();
361 unsigned NumElts = ResultTy->getVectorNumElements() * 8;
Craig Topperb324e432015-02-18 06:24:44 +0000362
363 // Bitcast from a 64-bit element type to a byte element type.
Craig Topper7355ac32016-05-29 06:37:33 +0000364 Type *VecTy = VectorType::get(Type::getInt8Ty(C), NumElts);
365 Op = Builder.CreateBitCast(Op, VecTy, "cast");
366
Craig Topperb324e432015-02-18 06:24:44 +0000367 // We'll be shuffling in zeroes.
Craig Topper7355ac32016-05-29 06:37:33 +0000368 Value *Res = Constant::getNullValue(VecTy);
Craig Topperb324e432015-02-18 06:24:44 +0000369
370 // If shift is less than 16, emit a shuffle to move the bytes. Otherwise,
371 // we'll just return the zero vector.
372 if (Shift < 16) {
Craig Topper99d1eab2016-06-12 00:41:19 +0000373 uint32_t Idxs[64];
Simon Pilgrimf7186822016-06-09 21:09:03 +0000374 // 256/512-bit version is split into 2/4 16-byte lanes.
Craig Topperb324e432015-02-18 06:24:44 +0000375 for (unsigned l = 0; l != NumElts; l += 16)
376 for (unsigned i = 0; i != 16; ++i) {
377 unsigned Idx = NumElts + i - Shift;
378 if (Idx < NumElts)
379 Idx -= NumElts - 16; // end of lane, switch operand.
Craig Topper7355ac32016-05-29 06:37:33 +0000380 Idxs[l + i] = Idx + l;
Craig Topperb324e432015-02-18 06:24:44 +0000381 }
382
Craig Topper7355ac32016-05-29 06:37:33 +0000383 Res = Builder.CreateShuffleVector(Res, Op, makeArrayRef(Idxs, NumElts));
Craig Topperb324e432015-02-18 06:24:44 +0000384 }
385
386 // Bitcast back to a 64-bit element type.
Craig Topper7355ac32016-05-29 06:37:33 +0000387 return Builder.CreateBitCast(Res, ResultTy, "cast");
Craig Topperb324e432015-02-18 06:24:44 +0000388}
389
Craig Topperea703ae2016-06-13 02:36:42 +0000390// Handles upgrading SSE2/AVX2/AVX512BW PSRLDQ intrinsics by converting them
391// to byte shuffles.
392static Value *UpgradeX86PSRLDQIntrinsics(IRBuilder<> &Builder, LLVMContext &C,
393 Value *Op,
394 unsigned Shift) {
395 Type *ResultTy = Op->getType();
396 unsigned NumElts = ResultTy->getVectorNumElements() * 8;
397
398 // Bitcast from a 64-bit element type to a byte element type.
399 Type *VecTy = VectorType::get(Type::getInt8Ty(C), NumElts);
400 Op = Builder.CreateBitCast(Op, VecTy, "cast");
401
402 // We'll be shuffling in zeroes.
403 Value *Res = Constant::getNullValue(VecTy);
404
405 // If shift is less than 16, emit a shuffle to move the bytes. Otherwise,
406 // we'll just return the zero vector.
407 if (Shift < 16) {
408 uint32_t Idxs[64];
409 // 256/512-bit version is split into 2/4 16-byte lanes.
410 for (unsigned l = 0; l != NumElts; l += 16)
411 for (unsigned i = 0; i != 16; ++i) {
412 unsigned Idx = i + Shift;
413 if (Idx >= 16)
414 Idx += NumElts - 16; // end of lane, switch operand.
415 Idxs[l + i] = Idx + l;
416 }
417
418 Res = Builder.CreateShuffleVector(Op, Res, makeArrayRef(Idxs, NumElts));
419 }
420
421 // Bitcast back to a 64-bit element type.
422 return Builder.CreateBitCast(Res, ResultTy, "cast");
423}
424
425static Value *getX86MaskVec(IRBuilder<> &Builder, Value *Mask,
426 unsigned NumElts) {
427 llvm::VectorType *MaskTy = llvm::VectorType::get(Builder.getInt1Ty(),
428 cast<IntegerType>(Mask->getType())->getBitWidth());
429 Mask = Builder.CreateBitCast(Mask, MaskTy);
430
431 // If we have less than 8 elements, then the starting mask was an i8 and
432 // we need to extract down to the right number of elements.
433 if (NumElts < 8) {
434 uint32_t Indices[4];
435 for (unsigned i = 0; i != NumElts; ++i)
436 Indices[i] = i;
437 Mask = Builder.CreateShuffleVector(Mask, Mask,
438 makeArrayRef(Indices, NumElts),
439 "extract");
440 }
441
442 return Mask;
443}
444
445static Value *EmitX86Select(IRBuilder<> &Builder, Value *Mask,
446 Value *Op0, Value *Op1) {
447 // If the mask is all ones just emit the align operation.
448 if (const auto *C = dyn_cast<Constant>(Mask))
449 if (C->isAllOnesValue())
450 return Op0;
451
452 Mask = getX86MaskVec(Builder, Mask, Op0->getType()->getVectorNumElements());
453 return Builder.CreateSelect(Mask, Op0, Op1);
454}
455
Craig Topper33350cc2016-06-06 06:12:54 +0000456static Value *UpgradeX86PALIGNRIntrinsics(IRBuilder<> &Builder, LLVMContext &C,
457 Value *Op0, Value *Op1, Value *Shift,
458 Value *Passthru, Value *Mask) {
459 unsigned ShiftVal = cast<llvm::ConstantInt>(Shift)->getZExtValue();
460
461 unsigned NumElts = Op0->getType()->getVectorNumElements();
462 assert(NumElts % 16 == 0);
463
464 // If palignr is shifting the pair of vectors more than the size of two
465 // lanes, emit zero.
466 if (ShiftVal >= 32)
467 return llvm::Constant::getNullValue(Op0->getType());
468
469 // If palignr is shifting the pair of input vectors more than one lane,
470 // but less than two lanes, convert to shifting in zeroes.
471 if (ShiftVal > 16) {
472 ShiftVal -= 16;
473 Op1 = Op0;
474 Op0 = llvm::Constant::getNullValue(Op0->getType());
475 }
476
Craig Topper99d1eab2016-06-12 00:41:19 +0000477 uint32_t Indices[64];
Craig Topper33350cc2016-06-06 06:12:54 +0000478 // 256-bit palignr operates on 128-bit lanes so we need to handle that
479 for (unsigned l = 0; l != NumElts; l += 16) {
480 for (unsigned i = 0; i != 16; ++i) {
481 unsigned Idx = ShiftVal + i;
482 if (Idx >= 16)
483 Idx += NumElts - 16; // End of lane, switch operand.
484 Indices[l + i] = Idx + l;
485 }
486 }
487
488 Value *Align = Builder.CreateShuffleVector(Op1, Op0,
489 makeArrayRef(Indices, NumElts),
490 "palignr");
491
Craig Topperea703ae2016-06-13 02:36:42 +0000492 return EmitX86Select(Builder, Mask, Align, Passthru);
Craig Topperb324e432015-02-18 06:24:44 +0000493}
494
Craig Topper50f85c22016-05-31 01:50:02 +0000495static Value *UpgradeMaskedStore(IRBuilder<> &Builder, LLVMContext &C,
496 Value *Ptr, Value *Data, Value *Mask,
497 bool Aligned) {
498 // Cast the pointer to the right type.
499 Ptr = Builder.CreateBitCast(Ptr,
500 llvm::PointerType::getUnqual(Data->getType()));
501 unsigned Align =
502 Aligned ? cast<VectorType>(Data->getType())->getBitWidth() / 8 : 1;
503
504 // If the mask is all ones just emit a regular store.
505 if (const auto *C = dyn_cast<Constant>(Mask))
506 if (C->isAllOnesValue())
507 return Builder.CreateAlignedStore(Data, Ptr, Align);
508
509 // Convert the mask from an integer type to a vector of i1.
510 unsigned NumElts = Data->getType()->getVectorNumElements();
Craig Topperea703ae2016-06-13 02:36:42 +0000511 Mask = getX86MaskVec(Builder, Mask, NumElts);
Craig Topper50f85c22016-05-31 01:50:02 +0000512 return Builder.CreateMaskedStore(Data, Ptr, Align, Mask);
513}
514
Craig Topperf10fbfa2016-06-02 04:19:36 +0000515static Value *UpgradeMaskedLoad(IRBuilder<> &Builder, LLVMContext &C,
516 Value *Ptr, Value *Passthru, Value *Mask,
517 bool Aligned) {
518 // Cast the pointer to the right type.
519 Ptr = Builder.CreateBitCast(Ptr,
520 llvm::PointerType::getUnqual(Passthru->getType()));
521 unsigned Align =
522 Aligned ? cast<VectorType>(Passthru->getType())->getBitWidth() / 8 : 1;
523
524 // If the mask is all ones just emit a regular store.
525 if (const auto *C = dyn_cast<Constant>(Mask))
526 if (C->isAllOnesValue())
527 return Builder.CreateAlignedLoad(Ptr, Align);
528
529 // Convert the mask from an integer type to a vector of i1.
530 unsigned NumElts = Passthru->getType()->getVectorNumElements();
Craig Topperea703ae2016-06-13 02:36:42 +0000531 Mask = getX86MaskVec(Builder, Mask, NumElts);
Craig Topperf10fbfa2016-06-02 04:19:36 +0000532 return Builder.CreateMaskedLoad(Ptr, Align, Mask, Passthru);
533}
534
Sanjay Patel51ab7572016-06-16 15:48:30 +0000535static Value *upgradeIntMinMax(IRBuilder<> &Builder, CallInst &CI,
536 ICmpInst::Predicate Pred) {
537 Value *Op0 = CI.getArgOperand(0);
538 Value *Op1 = CI.getArgOperand(1);
539 Value *Cmp = Builder.CreateICmp(Pred, Op0, Op1);
540 return Builder.CreateSelect(Cmp, Op0, Op1);
541}
542
Sanjay Patel595098f2016-06-15 22:01:28 +0000543/// Upgrade a call to an old intrinsic. All argument and return casting must be
544/// provided to seamlessly integrate with existing context.
Chandler Carruth7132e002007-08-04 01:51:18 +0000545void llvm::UpgradeIntrinsicCall(CallInst *CI, Function *NewFn) {
Craig Topper3b1817d2012-02-03 06:10:55 +0000546 Function *F = CI->getCalledFunction();
Nick Lewycky2eb3ade2011-12-12 22:59:34 +0000547 LLVMContext &C = CI->getContext();
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000548 IRBuilder<> Builder(C);
Duncan P. N. Exon Smith52888a62015-10-08 23:49:46 +0000549 Builder.SetInsertPoint(CI->getParent(), CI->getIterator());
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000550
Craig Topper3b1817d2012-02-03 06:10:55 +0000551 assert(F && "Intrinsic call is not direct?");
552
553 if (!NewFn) {
554 // Get the Function's name.
555 StringRef Name = F->getName();
556
557 Value *Rep;
Sanjay Patel595098f2016-06-15 22:01:28 +0000558 // Upgrade packed integer vector compare intrinsics to compare instructions.
Craig Topper3b1817d2012-02-03 06:10:55 +0000559 if (Name.startswith("llvm.x86.sse2.pcmpeq.") ||
560 Name.startswith("llvm.x86.avx2.pcmpeq.")) {
561 Rep = Builder.CreateICmpEQ(CI->getArgOperand(0), CI->getArgOperand(1),
562 "pcmpeq");
Craig Topper3b1817d2012-02-03 06:10:55 +0000563 Rep = Builder.CreateSExt(Rep, CI->getType(), "");
564 } else if (Name.startswith("llvm.x86.sse2.pcmpgt.") ||
565 Name.startswith("llvm.x86.avx2.pcmpgt.")) {
566 Rep = Builder.CreateICmpSGT(CI->getArgOperand(0), CI->getArgOperand(1),
567 "pcmpgt");
Craig Topper3b1817d2012-02-03 06:10:55 +0000568 Rep = Builder.CreateSExt(Rep, CI->getType(), "");
Sanjay Patel51ab7572016-06-16 15:48:30 +0000569 } else if (Name == "llvm.x86.sse41.pmaxsb" ||
570 Name == "llvm.x86.sse2.pmaxs.w" ||
Sanjay Patel0e9afea2016-06-16 18:44:20 +0000571 Name == "llvm.x86.sse41.pmaxsd" ||
572 Name.startswith("llvm.x86.avx2.pmaxs")) {
Sanjay Patel51ab7572016-06-16 15:48:30 +0000573 Rep = upgradeIntMinMax(Builder, *CI, ICmpInst::ICMP_SGT);
574 } else if (Name == "llvm.x86.sse2.pmaxu.b" ||
575 Name == "llvm.x86.sse41.pmaxuw" ||
Sanjay Patel0e9afea2016-06-16 18:44:20 +0000576 Name == "llvm.x86.sse41.pmaxud" ||
577 Name.startswith("llvm.x86.avx2.pmaxu")) {
Sanjay Patel51ab7572016-06-16 15:48:30 +0000578 Rep = upgradeIntMinMax(Builder, *CI, ICmpInst::ICMP_UGT);
579 } else if (Name == "llvm.x86.sse41.pminsb" ||
580 Name == "llvm.x86.sse2.pmins.w" ||
Sanjay Patel0e9afea2016-06-16 18:44:20 +0000581 Name == "llvm.x86.sse41.pminsd" ||
582 Name.startswith("llvm.x86.avx2.pmins")) {
Sanjay Patel51ab7572016-06-16 15:48:30 +0000583 Rep = upgradeIntMinMax(Builder, *CI, ICmpInst::ICMP_SLT);
584 } else if (Name == "llvm.x86.sse2.pminu.b" ||
585 Name == "llvm.x86.sse41.pminuw" ||
Sanjay Patel0e9afea2016-06-16 18:44:20 +0000586 Name == "llvm.x86.sse41.pminud" ||
587 Name.startswith("llvm.x86.avx2.pminu")) {
Sanjay Patel51ab7572016-06-16 15:48:30 +0000588 Rep = upgradeIntMinMax(Builder, *CI, ICmpInst::ICMP_ULT);
Simon Pilgrim4298d062016-05-25 08:59:18 +0000589 } else if (Name == "llvm.x86.sse2.cvtdq2pd" ||
590 Name == "llvm.x86.sse2.cvtps2pd" ||
591 Name == "llvm.x86.avx.cvtdq2.pd.256" ||
592 Name == "llvm.x86.avx.cvt.ps2.pd.256") {
593 // Lossless i32/float to double conversion.
594 // Extract the bottom elements if necessary and convert to double vector.
595 Value *Src = CI->getArgOperand(0);
596 VectorType *SrcTy = cast<VectorType>(Src->getType());
597 VectorType *DstTy = cast<VectorType>(CI->getType());
598 Rep = CI->getArgOperand(0);
599
600 unsigned NumDstElts = DstTy->getNumElements();
601 if (NumDstElts < SrcTy->getNumElements()) {
602 assert(NumDstElts == 2 && "Unexpected vector size");
Craig Topper99d1eab2016-06-12 00:41:19 +0000603 uint32_t ShuffleMask[2] = { 0, 1 };
604 Rep = Builder.CreateShuffleVector(Rep, UndefValue::get(SrcTy),
605 ShuffleMask);
Simon Pilgrim4298d062016-05-25 08:59:18 +0000606 }
607
608 bool Int2Double = (StringRef::npos != Name.find("cvtdq2"));
609 if (Int2Double)
610 Rep = Builder.CreateSIToFP(Rep, DstTy, "cvtdq2pd");
611 else
612 Rep = Builder.CreateFPExt(Rep, DstTy, "cvtps2pd");
Simon Pilgrim0afd5a42016-06-02 10:55:21 +0000613 } else if (Name == "llvm.x86.sse2.cvttps2dq" ||
614 Name.startswith("llvm.x86.avx.cvtt.")) {
615 // Truncation (round to zero) float/double to i32 vector conversion.
616 Value *Src = CI->getArgOperand(0);
617 VectorType *DstTy = cast<VectorType>(CI->getType());
618 Rep = Builder.CreateFPToSI(Src, DstTy, "cvtt");
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000619 } else if (Name.startswith("llvm.x86.avx.movnt.")) {
Craig Topper7daf8972012-05-08 06:58:15 +0000620 Module *M = F->getParent();
Duncan P. N. Exon Smith5bf8fef2014-12-09 18:38:53 +0000621 SmallVector<Metadata *, 1> Elts;
622 Elts.push_back(
623 ConstantAsMetadata::get(ConstantInt::get(Type::getInt32Ty(C), 1)));
Craig Topper7daf8972012-05-08 06:58:15 +0000624 MDNode *Node = MDNode::get(C, Elts);
625
626 Value *Arg0 = CI->getArgOperand(0);
627 Value *Arg1 = CI->getArgOperand(1);
628
629 // Convert the type of the pointer to a pointer to the stored type.
630 Value *BC = Builder.CreateBitCast(Arg0,
631 PointerType::getUnqual(Arg1->getType()),
632 "cast");
Craig Topper29ce55d2016-05-30 22:54:12 +0000633 StoreInst *SI = Builder.CreateAlignedStore(Arg1, BC, 32);
Craig Topper7daf8972012-05-08 06:58:15 +0000634 SI->setMetadata(M->getMDKindID("nontemporal"), Node);
Craig Topper7daf8972012-05-08 06:58:15 +0000635
636 // Remove intrinsic.
637 CI->eraseFromParent();
638 return;
Craig Topper12e322a2016-05-25 06:56:32 +0000639 } else if (Name == "llvm.x86.sse2.storel.dq") {
Craig Topper12e322a2016-05-25 06:56:32 +0000640 Value *Arg0 = CI->getArgOperand(0);
641 Value *Arg1 = CI->getArgOperand(1);
642
643 Type *NewVecTy = VectorType::get(Type::getInt64Ty(C), 2);
644 Value *BC0 = Builder.CreateBitCast(Arg1, NewVecTy, "cast");
645 Value *Elt = Builder.CreateExtractElement(BC0, (uint64_t)0);
646 Value *BC = Builder.CreateBitCast(Arg0,
647 PointerType::getUnqual(Elt->getType()),
648 "cast");
Craig Topper29ce55d2016-05-30 22:54:12 +0000649 Builder.CreateAlignedStore(Elt, BC, 1);
Craig Topper12e322a2016-05-25 06:56:32 +0000650
651 // Remove intrinsic.
652 CI->eraseFromParent();
653 return;
Craig Topper8287fd82016-05-30 23:15:56 +0000654 } else if (Name.startswith("llvm.x86.sse.storeu.") ||
655 Name.startswith("llvm.x86.sse2.storeu.") ||
656 Name.startswith("llvm.x86.avx.storeu.")) {
657 Value *Arg0 = CI->getArgOperand(0);
658 Value *Arg1 = CI->getArgOperand(1);
659
660 Arg0 = Builder.CreateBitCast(Arg0,
661 PointerType::getUnqual(Arg1->getType()),
662 "cast");
663 Builder.CreateAlignedStore(Arg1, Arg0, 1);
664
665 // Remove intrinsic.
666 CI->eraseFromParent();
667 return;
Craig Topper50f85c22016-05-31 01:50:02 +0000668 } else if (Name.startswith("llvm.x86.avx512.mask.storeu.p") ||
669 Name.startswith("llvm.x86.avx512.mask.storeu.b.") ||
670 Name.startswith("llvm.x86.avx512.mask.storeu.w.") ||
671 Name.startswith("llvm.x86.avx512.mask.storeu.d.") ||
672 Name.startswith("llvm.x86.avx512.mask.storeu.q.")) {
673 UpgradeMaskedStore(Builder, C, CI->getArgOperand(0), CI->getArgOperand(1),
674 CI->getArgOperand(2), /*Aligned*/false);
675
676 // Remove intrinsic.
677 CI->eraseFromParent();
678 return;
679 } else if (Name.startswith("llvm.x86.avx512.mask.store.p") ||
680 Name.startswith("llvm.x86.avx512.mask.store.b.") ||
681 Name.startswith("llvm.x86.avx512.mask.store.w.") ||
682 Name.startswith("llvm.x86.avx512.mask.store.d.") ||
683 Name.startswith("llvm.x86.avx512.mask.store.q.")) {
684 UpgradeMaskedStore(Builder, C, CI->getArgOperand(0), CI->getArgOperand(1),
685 CI->getArgOperand(2), /*Aligned*/true);
686
687 // Remove intrinsic.
688 CI->eraseFromParent();
689 return;
Craig Topperf10fbfa2016-06-02 04:19:36 +0000690 } else if (Name.startswith("llvm.x86.avx512.mask.loadu.p") ||
691 Name.startswith("llvm.x86.avx512.mask.loadu.b.") ||
692 Name.startswith("llvm.x86.avx512.mask.loadu.w.") ||
693 Name.startswith("llvm.x86.avx512.mask.loadu.d.") ||
694 Name.startswith("llvm.x86.avx512.mask.loadu.q.")) {
695 Rep = UpgradeMaskedLoad(Builder, C, CI->getArgOperand(0),
696 CI->getArgOperand(1), CI->getArgOperand(2),
697 /*Aligned*/false);
698 } else if (Name.startswith("llvm.x86.avx512.mask.load.p") ||
699 Name.startswith("llvm.x86.avx512.mask.load.b.") ||
700 Name.startswith("llvm.x86.avx512.mask.load.w.") ||
701 Name.startswith("llvm.x86.avx512.mask.load.d.") ||
702 Name.startswith("llvm.x86.avx512.mask.load.q.")) {
703 Rep = UpgradeMaskedLoad(Builder, C, CI->getArgOperand(0),
704 CI->getArgOperand(1),CI->getArgOperand(2),
705 /*Aligned*/true);
Craig Topper3352ba52012-06-09 16:46:13 +0000706 } else if (Name.startswith("llvm.x86.xop.vpcom")) {
707 Intrinsic::ID intID;
708 if (Name.endswith("ub"))
709 intID = Intrinsic::x86_xop_vpcomub;
710 else if (Name.endswith("uw"))
711 intID = Intrinsic::x86_xop_vpcomuw;
712 else if (Name.endswith("ud"))
713 intID = Intrinsic::x86_xop_vpcomud;
714 else if (Name.endswith("uq"))
715 intID = Intrinsic::x86_xop_vpcomuq;
716 else if (Name.endswith("b"))
717 intID = Intrinsic::x86_xop_vpcomb;
718 else if (Name.endswith("w"))
719 intID = Intrinsic::x86_xop_vpcomw;
720 else if (Name.endswith("d"))
721 intID = Intrinsic::x86_xop_vpcomd;
722 else if (Name.endswith("q"))
723 intID = Intrinsic::x86_xop_vpcomq;
724 else
725 llvm_unreachable("Unknown suffix");
726
727 Name = Name.substr(18); // strip off "llvm.x86.xop.vpcom"
728 unsigned Imm;
729 if (Name.startswith("lt"))
730 Imm = 0;
731 else if (Name.startswith("le"))
732 Imm = 1;
733 else if (Name.startswith("gt"))
734 Imm = 2;
735 else if (Name.startswith("ge"))
736 Imm = 3;
737 else if (Name.startswith("eq"))
738 Imm = 4;
739 else if (Name.startswith("ne"))
740 Imm = 5;
Craig Topper3352ba52012-06-09 16:46:13 +0000741 else if (Name.startswith("false"))
Craig Toppere32546d2015-02-13 07:42:15 +0000742 Imm = 6;
743 else if (Name.startswith("true"))
Craig Topper3352ba52012-06-09 16:46:13 +0000744 Imm = 7;
745 else
746 llvm_unreachable("Unknown condition");
747
748 Function *VPCOM = Intrinsic::getDeclaration(F->getParent(), intID);
David Blaikieff6409d2015-05-18 22:13:54 +0000749 Rep =
750 Builder.CreateCall(VPCOM, {CI->getArgOperand(0), CI->getArgOperand(1),
751 Builder.getInt8(Imm)});
Simon Pilgrime88dc042015-11-03 20:27:01 +0000752 } else if (Name == "llvm.x86.xop.vpcmov") {
753 Value *Arg0 = CI->getArgOperand(0);
754 Value *Arg1 = CI->getArgOperand(1);
755 Value *Sel = CI->getArgOperand(2);
756 unsigned NumElts = CI->getType()->getVectorNumElements();
757 Constant *MinusOne = ConstantVector::getSplat(NumElts, Builder.getInt64(-1));
758 Value *NotSel = Builder.CreateXor(Sel, MinusOne);
759 Value *Sel0 = Builder.CreateAnd(Arg0, Sel);
760 Value *Sel1 = Builder.CreateAnd(Arg1, NotSel);
761 Rep = Builder.CreateOr(Sel0, Sel1);
Craig Topperef9e9932013-10-15 05:20:47 +0000762 } else if (Name == "llvm.x86.sse42.crc32.64.8") {
763 Function *CRC32 = Intrinsic::getDeclaration(F->getParent(),
764 Intrinsic::x86_sse42_crc32_32_8);
765 Value *Trunc0 = Builder.CreateTrunc(CI->getArgOperand(0), Type::getInt32Ty(C));
David Blaikieff6409d2015-05-18 22:13:54 +0000766 Rep = Builder.CreateCall(CRC32, {Trunc0, CI->getArgOperand(1)});
Craig Topperef9e9932013-10-15 05:20:47 +0000767 Rep = Builder.CreateZExt(Rep, CI->getType(), "");
Adam Nemet39066802014-05-29 23:35:33 +0000768 } else if (Name.startswith("llvm.x86.avx.vbroadcast")) {
769 // Replace broadcasts with a series of insertelements.
770 Type *VecTy = CI->getType();
771 Type *EltTy = VecTy->getVectorElementType();
772 unsigned EltNum = VecTy->getVectorNumElements();
773 Value *Cast = Builder.CreateBitCast(CI->getArgOperand(0),
774 EltTy->getPointerTo());
David Blaikie0c28fd72015-05-20 21:46:30 +0000775 Value *Load = Builder.CreateLoad(EltTy, Cast);
Adam Nemet39066802014-05-29 23:35:33 +0000776 Type *I32Ty = Type::getInt32Ty(C);
777 Rep = UndefValue::get(VecTy);
778 for (unsigned I = 0; I < EltNum; ++I)
779 Rep = Builder.CreateInsertElement(Rep, Load,
780 ConstantInt::get(I32Ty, I));
Simon Pilgrim9602d672016-05-28 18:03:41 +0000781 } else if (Name.startswith("llvm.x86.sse41.pmovsx") ||
782 Name.startswith("llvm.x86.sse41.pmovzx") ||
783 Name.startswith("llvm.x86.avx2.pmovsx") ||
784 Name.startswith("llvm.x86.avx2.pmovzx")) {
Simon Pilgrim9cb018b2015-09-23 08:48:33 +0000785 VectorType *SrcTy = cast<VectorType>(CI->getArgOperand(0)->getType());
786 VectorType *DstTy = cast<VectorType>(CI->getType());
787 unsigned NumDstElts = DstTy->getNumElements();
788
Simon Pilgrim9602d672016-05-28 18:03:41 +0000789 // Extract a subvector of the first NumDstElts lanes and sign/zero extend.
Craig Topperc0a5fa02016-06-12 04:48:00 +0000790 SmallVector<uint32_t, 8> ShuffleMask(NumDstElts);
Craig Topper99d1eab2016-06-12 00:41:19 +0000791 for (unsigned i = 0; i != NumDstElts; ++i)
Craig Topperc0a5fa02016-06-12 04:48:00 +0000792 ShuffleMask[i] = i;
Simon Pilgrim9cb018b2015-09-23 08:48:33 +0000793
794 Value *SV = Builder.CreateShuffleVector(
795 CI->getArgOperand(0), UndefValue::get(SrcTy), ShuffleMask);
Simon Pilgrim9602d672016-05-28 18:03:41 +0000796
797 bool DoSext = (StringRef::npos != Name.find("pmovsx"));
798 Rep = DoSext ? Builder.CreateSExt(SV, DstTy)
799 : Builder.CreateZExt(SV, DstTy);
Juergen Ributzka1f7a1762015-03-04 00:13:25 +0000800 } else if (Name == "llvm.x86.avx2.vbroadcasti128") {
801 // Replace vbroadcasts with a vector shuffle.
David Blaikie0c28fd72015-05-20 21:46:30 +0000802 Type *VT = VectorType::get(Type::getInt64Ty(C), 2);
803 Value *Op = Builder.CreatePointerCast(CI->getArgOperand(0),
804 PointerType::getUnqual(VT));
805 Value *Load = Builder.CreateLoad(VT, Op);
Craig Topper99d1eab2016-06-12 00:41:19 +0000806 uint32_t Idxs[4] = { 0, 1, 0, 1 };
Juergen Ributzka1f7a1762015-03-04 00:13:25 +0000807 Rep = Builder.CreateShuffleVector(Load, UndefValue::get(Load->getType()),
Sanjay Patel2db6d382015-03-12 15:27:07 +0000808 Idxs);
Ahmed Bougacha1a4987052015-08-20 20:36:19 +0000809 } else if (Name.startswith("llvm.x86.avx2.pbroadcast") ||
810 Name.startswith("llvm.x86.avx2.vbroadcast")) {
811 // Replace vp?broadcasts with a vector shuffle.
812 Value *Op = CI->getArgOperand(0);
813 unsigned NumElts = CI->getType()->getVectorNumElements();
814 Type *MaskTy = VectorType::get(Type::getInt32Ty(C), NumElts);
815 Rep = Builder.CreateShuffleVector(Op, UndefValue::get(Op->getType()),
816 Constant::getNullValue(MaskTy));
Craig Topper33350cc2016-06-06 06:12:54 +0000817 } else if (Name.startswith("llvm.x86.avx512.mask.palignr.")) {
818 Rep = UpgradeX86PALIGNRIntrinsics(Builder, C, CI->getArgOperand(0),
819 CI->getArgOperand(1),
820 CI->getArgOperand(2),
821 CI->getArgOperand(3),
822 CI->getArgOperand(4));
Craig Topper7355ac32016-05-29 06:37:33 +0000823 } else if (Name == "llvm.x86.sse2.psll.dq" ||
824 Name == "llvm.x86.avx2.psll.dq") {
825 // 128/256-bit shift left specified in bits.
Craig Topperb324e432015-02-18 06:24:44 +0000826 unsigned Shift = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
Craig Topper7355ac32016-05-29 06:37:33 +0000827 Rep = UpgradeX86PSLLDQIntrinsics(Builder, C, CI->getArgOperand(0),
Craig Topperb324e432015-02-18 06:24:44 +0000828 Shift / 8); // Shift is in bits.
Craig Topper7355ac32016-05-29 06:37:33 +0000829 } else if (Name == "llvm.x86.sse2.psrl.dq" ||
830 Name == "llvm.x86.avx2.psrl.dq") {
831 // 128/256-bit shift right specified in bits.
Craig Topperb324e432015-02-18 06:24:44 +0000832 unsigned Shift = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
Craig Topper7355ac32016-05-29 06:37:33 +0000833 Rep = UpgradeX86PSRLDQIntrinsics(Builder, C, CI->getArgOperand(0),
Craig Topperb324e432015-02-18 06:24:44 +0000834 Shift / 8); // Shift is in bits.
Craig Topper7355ac32016-05-29 06:37:33 +0000835 } else if (Name == "llvm.x86.sse2.psll.dq.bs" ||
Simon Pilgrimf7186822016-06-09 21:09:03 +0000836 Name == "llvm.x86.avx2.psll.dq.bs" ||
837 Name == "llvm.x86.avx512.psll.dq.512") {
838 // 128/256/512-bit shift left specified in bytes.
Craig Topperb324e432015-02-18 06:24:44 +0000839 unsigned Shift = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
Craig Topper7355ac32016-05-29 06:37:33 +0000840 Rep = UpgradeX86PSLLDQIntrinsics(Builder, C, CI->getArgOperand(0), Shift);
841 } else if (Name == "llvm.x86.sse2.psrl.dq.bs" ||
Simon Pilgrimf7186822016-06-09 21:09:03 +0000842 Name == "llvm.x86.avx2.psrl.dq.bs" ||
843 Name == "llvm.x86.avx512.psrl.dq.512") {
844 // 128/256/512-bit shift right specified in bytes.
Craig Topperb324e432015-02-18 06:24:44 +0000845 unsigned Shift = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
Craig Topper7355ac32016-05-29 06:37:33 +0000846 Rep = UpgradeX86PSRLDQIntrinsics(Builder, C, CI->getArgOperand(0), Shift);
Craig Topper782d6202015-02-28 19:33:17 +0000847 } else if (Name == "llvm.x86.sse41.pblendw" ||
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000848 Name.startswith("llvm.x86.sse41.blendp") ||
849 Name.startswith("llvm.x86.avx.blend.p") ||
Craig Topper782d6202015-02-28 19:33:17 +0000850 Name == "llvm.x86.avx2.pblendw" ||
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000851 Name.startswith("llvm.x86.avx2.pblendd.")) {
Craig Topper782d6202015-02-28 19:33:17 +0000852 Value *Op0 = CI->getArgOperand(0);
853 Value *Op1 = CI->getArgOperand(1);
854 unsigned Imm = cast <ConstantInt>(CI->getArgOperand(2))->getZExtValue();
855 VectorType *VecTy = cast<VectorType>(CI->getType());
856 unsigned NumElts = VecTy->getNumElements();
857
Craig Topperc0a5fa02016-06-12 04:48:00 +0000858 SmallVector<uint32_t, 16> Idxs(NumElts);
859 for (unsigned i = 0; i != NumElts; ++i)
860 Idxs[i] = ((Imm >> (i%8)) & 1) ? i + NumElts : i;
Craig Topper782d6202015-02-28 19:33:17 +0000861
Craig Topper2f561822016-06-12 01:05:59 +0000862 Rep = Builder.CreateShuffleVector(Op0, Op1, Idxs);
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000863 } else if (Name.startswith("llvm.x86.avx.vinsertf128.") ||
Sanjay Patel4339abe2015-03-12 23:16:18 +0000864 Name == "llvm.x86.avx2.vinserti128") {
Sanjay Patel19792fb2015-03-10 16:08:36 +0000865 Value *Op0 = CI->getArgOperand(0);
866 Value *Op1 = CI->getArgOperand(1);
867 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(2))->getZExtValue();
868 VectorType *VecTy = cast<VectorType>(CI->getType());
869 unsigned NumElts = VecTy->getNumElements();
Simon Pilgrim9cb018b2015-09-23 08:48:33 +0000870
Sanjay Patel19792fb2015-03-10 16:08:36 +0000871 // Mask off the high bits of the immediate value; hardware ignores those.
872 Imm = Imm & 1;
Simon Pilgrim9cb018b2015-09-23 08:48:33 +0000873
Sanjay Patel19792fb2015-03-10 16:08:36 +0000874 // Extend the second operand into a vector that is twice as big.
875 Value *UndefV = UndefValue::get(Op1->getType());
Craig Topperc0a5fa02016-06-12 04:48:00 +0000876 SmallVector<uint32_t, 8> Idxs(NumElts);
877 for (unsigned i = 0; i != NumElts; ++i)
878 Idxs[i] = i;
Craig Topper2f561822016-06-12 01:05:59 +0000879 Rep = Builder.CreateShuffleVector(Op1, UndefV, Idxs);
Sanjay Patel19792fb2015-03-10 16:08:36 +0000880
881 // Insert the second operand into the first operand.
882
883 // Note that there is no guarantee that instruction lowering will actually
884 // produce a vinsertf128 instruction for the created shuffles. In
885 // particular, the 0 immediate case involves no lane changes, so it can
886 // be handled as a blend.
887
888 // Example of shuffle mask for 32-bit elements:
889 // Imm = 1 <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 10, i32 11>
890 // Imm = 0 <i32 8, i32 9, i32 10, i32 11, i32 4, i32 5, i32 6, i32 7 >
891
Sanjay Patel19792fb2015-03-10 16:08:36 +0000892 // The low half of the result is either the low half of the 1st operand
893 // or the low half of the 2nd operand (the inserted vector).
Craig Topperc0a5fa02016-06-12 04:48:00 +0000894 for (unsigned i = 0; i != NumElts / 2; ++i)
895 Idxs[i] = Imm ? i : (i + NumElts);
Sanjay Patel19792fb2015-03-10 16:08:36 +0000896 // The high half of the result is either the low half of the 2nd operand
897 // (the inserted vector) or the high half of the 1st operand.
Craig Topperc0a5fa02016-06-12 04:48:00 +0000898 for (unsigned i = NumElts / 2; i != NumElts; ++i)
899 Idxs[i] = Imm ? (i + NumElts / 2) : i;
Craig Topper2f561822016-06-12 01:05:59 +0000900 Rep = Builder.CreateShuffleVector(Op0, Rep, Idxs);
Craig Topperf9f1ecc2016-05-30 22:54:05 +0000901 } else if (Name.startswith("llvm.x86.avx.vextractf128.") ||
Sanjay Patel4339abe2015-03-12 23:16:18 +0000902 Name == "llvm.x86.avx2.vextracti128") {
Sanjay Patelaf1846c2015-03-12 15:15:19 +0000903 Value *Op0 = CI->getArgOperand(0);
904 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
905 VectorType *VecTy = cast<VectorType>(CI->getType());
906 unsigned NumElts = VecTy->getNumElements();
Simon Pilgrim9cb018b2015-09-23 08:48:33 +0000907
Sanjay Patelaf1846c2015-03-12 15:15:19 +0000908 // Mask off the high bits of the immediate value; hardware ignores those.
909 Imm = Imm & 1;
910
911 // Get indexes for either the high half or low half of the input vector.
Craig Topper2f561822016-06-12 01:05:59 +0000912 SmallVector<uint32_t, 4> Idxs(NumElts);
Sanjay Patelaf1846c2015-03-12 15:15:19 +0000913 for (unsigned i = 0; i != NumElts; ++i) {
Craig Topper2f561822016-06-12 01:05:59 +0000914 Idxs[i] = Imm ? (i + NumElts) : i;
Sanjay Patelaf1846c2015-03-12 15:15:19 +0000915 }
916
917 Value *UndefV = UndefValue::get(Op0->getType());
Craig Topper2f561822016-06-12 01:05:59 +0000918 Rep = Builder.CreateShuffleVector(Op0, UndefV, Idxs);
Tim Shen00127562016-04-08 21:26:31 +0000919 } else if (Name == "llvm.stackprotectorcheck") {
920 Rep = nullptr;
Craig Topper10679862016-06-12 14:11:32 +0000921 } else if (Name.startswith("llvm.x86.avx.vpermil.") ||
Craig Topper13cf7ca2016-06-13 02:36:48 +0000922 Name == "llvm.x86.sse2.pshuf.d" ||
923 Name.startswith("llvm.x86.avx512.mask.pshuf.d.")) {
Craig Topper8a105052016-06-12 03:10:47 +0000924 Value *Op0 = CI->getArgOperand(0);
925 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
926 VectorType *VecTy = cast<VectorType>(CI->getType());
927 unsigned NumElts = VecTy->getNumElements();
928 // Calculate the size of each index in the immediate.
929 unsigned IdxSize = 64 / VecTy->getScalarSizeInBits();
930 unsigned IdxMask = ((1 << IdxSize) - 1);
931
932 SmallVector<uint32_t, 8> Idxs(NumElts);
933 // Lookup the bits for this element, wrapping around the immediate every
934 // 8-bits. Elements are grouped into sets of 2 or 4 elements so we need
935 // to offset by the first index of each group.
936 for (unsigned i = 0; i != NumElts; ++i)
937 Idxs[i] = ((Imm >> ((i * IdxSize) % 8)) & IdxMask) | (i & ~IdxMask);
938
939 Rep = Builder.CreateShuffleVector(Op0, Op0, Idxs);
Craig Topper13cf7ca2016-06-13 02:36:48 +0000940
941 if (CI->getNumArgOperands() == 4)
942 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
943 CI->getArgOperand(2));
944 } else if (Name == "llvm.x86.sse2.pshufl.w" ||
945 Name.startswith("llvm.x86.avx512.mask.pshufl.w.")) {
Craig Topper10679862016-06-12 14:11:32 +0000946 Value *Op0 = CI->getArgOperand(0);
947 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
948 unsigned NumElts = CI->getType()->getVectorNumElements();
949
950 SmallVector<uint32_t, 16> Idxs(NumElts);
951 for (unsigned l = 0; l != NumElts; l += 8) {
952 for (unsigned i = 0; i != 4; ++i)
953 Idxs[i + l] = ((Imm >> (2 * i)) & 0x3) + l;
954 for (unsigned i = 4; i != 8; ++i)
955 Idxs[i + l] = i + l;
956 }
957
958 Rep = Builder.CreateShuffleVector(Op0, Op0, Idxs);
Craig Topper13cf7ca2016-06-13 02:36:48 +0000959
960 if (CI->getNumArgOperands() == 4)
961 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
962 CI->getArgOperand(2));
963 } else if (Name == "llvm.x86.sse2.pshufh.w" ||
964 Name.startswith("llvm.x86.avx512.mask.pshufh.w.")) {
Craig Topper10679862016-06-12 14:11:32 +0000965 Value *Op0 = CI->getArgOperand(0);
966 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
967 unsigned NumElts = CI->getType()->getVectorNumElements();
968
969 SmallVector<uint32_t, 16> Idxs(NumElts);
970 for (unsigned l = 0; l != NumElts; l += 8) {
971 for (unsigned i = 0; i != 4; ++i)
972 Idxs[i + l] = i + l;
973 for (unsigned i = 0; i != 4; ++i)
974 Idxs[i + l + 4] = ((Imm >> (2 * i)) & 0x3) + 4 + l;
975 }
976
977 Rep = Builder.CreateShuffleVector(Op0, Op0, Idxs);
Craig Topper13cf7ca2016-06-13 02:36:48 +0000978
979 if (CI->getNumArgOperands() == 4)
980 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
981 CI->getArgOperand(2));
Craig Topper3b1817d2012-02-03 06:10:55 +0000982 } else {
Craig Topper8a105052016-06-12 03:10:47 +0000983 llvm_unreachable("Unknown function for CallInst upgrade.");
Craig Topper3b1817d2012-02-03 06:10:55 +0000984 }
985
Tim Shen00127562016-04-08 21:26:31 +0000986 if (Rep)
987 CI->replaceAllUsesWith(Rep);
Craig Topper3b1817d2012-02-03 06:10:55 +0000988 CI->eraseFromParent();
989 return;
990 }
991
Yaron Kerend1fdbe72015-03-30 16:10:39 +0000992 std::string Name = CI->getName();
Adrian Prantl87b7eb92014-10-01 18:55:02 +0000993 if (!Name.empty())
994 CI->setName(Name + ".old");
Nadav Rotem17ee58a2012-06-10 18:42:51 +0000995
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000996 switch (NewFn->getIntrinsicID()) {
997 default:
Chris Lattner0bcbde42011-11-27 08:42:07 +0000998 llvm_unreachable("Unknown function for CallInst upgrade.");
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000999
Jeroen Ketemaab99b592015-09-30 10:56:37 +00001000 case Intrinsic::arm_neon_vld1:
1001 case Intrinsic::arm_neon_vld2:
1002 case Intrinsic::arm_neon_vld3:
1003 case Intrinsic::arm_neon_vld4:
1004 case Intrinsic::arm_neon_vld2lane:
1005 case Intrinsic::arm_neon_vld3lane:
1006 case Intrinsic::arm_neon_vld4lane:
1007 case Intrinsic::arm_neon_vst1:
1008 case Intrinsic::arm_neon_vst2:
1009 case Intrinsic::arm_neon_vst3:
1010 case Intrinsic::arm_neon_vst4:
1011 case Intrinsic::arm_neon_vst2lane:
1012 case Intrinsic::arm_neon_vst3lane:
1013 case Intrinsic::arm_neon_vst4lane: {
1014 SmallVector<Value *, 4> Args(CI->arg_operands().begin(),
1015 CI->arg_operands().end());
1016 CI->replaceAllUsesWith(Builder.CreateCall(NewFn, Args));
1017 CI->eraseFromParent();
1018 return;
1019 }
1020
Chandler Carruth58a71ed2011-12-12 04:26:04 +00001021 case Intrinsic::ctlz:
Nuno Lopesad40c0a2012-05-22 15:25:31 +00001022 case Intrinsic::cttz:
Chandler Carruth58a71ed2011-12-12 04:26:04 +00001023 assert(CI->getNumArgOperands() == 1 &&
1024 "Mismatch between function args and call args");
David Blaikieff6409d2015-05-18 22:13:54 +00001025 CI->replaceAllUsesWith(Builder.CreateCall(
1026 NewFn, {CI->getArgOperand(0), Builder.getFalse()}, Name));
Chandler Carruth58a71ed2011-12-12 04:26:04 +00001027 CI->eraseFromParent();
1028 return;
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001029
Matt Arsenaultfbcbce42013-10-07 18:06:48 +00001030 case Intrinsic::objectsize:
David Blaikieff6409d2015-05-18 22:13:54 +00001031 CI->replaceAllUsesWith(Builder.CreateCall(
1032 NewFn, {CI->getArgOperand(0), CI->getArgOperand(1)}, Name));
Matt Arsenaultfbcbce42013-10-07 18:06:48 +00001033 CI->eraseFromParent();
1034 return;
1035
Joel Jonesb84f7be2012-07-18 00:02:16 +00001036 case Intrinsic::ctpop: {
David Blaikieff6409d2015-05-18 22:13:54 +00001037 CI->replaceAllUsesWith(Builder.CreateCall(NewFn, {CI->getArgOperand(0)}));
Joel Jonesb84f7be2012-07-18 00:02:16 +00001038 CI->eraseFromParent();
1039 return;
1040 }
Joel Jones43cb8782012-07-13 23:25:25 +00001041
Craig Topper71dc02d2012-06-13 07:18:53 +00001042 case Intrinsic::x86_xop_vfrcz_ss:
1043 case Intrinsic::x86_xop_vfrcz_sd:
David Blaikieff6409d2015-05-18 22:13:54 +00001044 CI->replaceAllUsesWith(
1045 Builder.CreateCall(NewFn, {CI->getArgOperand(1)}, Name));
Craig Topper71dc02d2012-06-13 07:18:53 +00001046 CI->eraseFromParent();
1047 return;
1048
Simon Pilgrime85506b2016-06-03 08:06:03 +00001049 case Intrinsic::x86_xop_vpermil2pd:
1050 case Intrinsic::x86_xop_vpermil2ps:
1051 case Intrinsic::x86_xop_vpermil2pd_256:
1052 case Intrinsic::x86_xop_vpermil2ps_256: {
1053 SmallVector<Value *, 4> Args(CI->arg_operands().begin(),
1054 CI->arg_operands().end());
1055 VectorType *FltIdxTy = cast<VectorType>(Args[2]->getType());
1056 VectorType *IntIdxTy = VectorType::getInteger(FltIdxTy);
1057 Args[2] = Builder.CreateBitCast(Args[2], IntIdxTy);
1058 CI->replaceAllUsesWith(Builder.CreateCall(NewFn, Args, Name));
1059 CI->eraseFromParent();
1060 return;
1061 }
1062
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001063 case Intrinsic::x86_sse41_ptestc:
1064 case Intrinsic::x86_sse41_ptestz:
Craig Topper71dc02d2012-06-13 07:18:53 +00001065 case Intrinsic::x86_sse41_ptestnzc: {
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001066 // The arguments for these intrinsics used to be v4f32, and changed
1067 // to v2i64. This is purely a nop, since those are bitwise intrinsics.
1068 // So, the only thing required is a bitcast for both arguments.
1069 // First, check the arguments have the old type.
1070 Value *Arg0 = CI->getArgOperand(0);
1071 if (Arg0->getType() != VectorType::get(Type::getFloatTy(C), 4))
1072 return;
1073
1074 // Old intrinsic, add bitcasts
1075 Value *Arg1 = CI->getArgOperand(1);
1076
David Blaikie5bacf372015-04-24 21:16:07 +00001077 Type *NewVecTy = VectorType::get(Type::getInt64Ty(C), 2);
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001078
David Blaikie5bacf372015-04-24 21:16:07 +00001079 Value *BC0 = Builder.CreateBitCast(Arg0, NewVecTy, "cast");
1080 Value *BC1 = Builder.CreateBitCast(Arg1, NewVecTy, "cast");
1081
David Blaikieff6409d2015-05-18 22:13:54 +00001082 CallInst *NewCall = Builder.CreateCall(NewFn, {BC0, BC1}, Name);
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001083 CI->replaceAllUsesWith(NewCall);
1084 CI->eraseFromParent();
1085 return;
Evan Cheng0e179d02007-12-17 22:33:23 +00001086 }
Chandler Carruth373b2b12014-09-06 10:00:01 +00001087
Chandler Carruth373b2b12014-09-06 10:00:01 +00001088 case Intrinsic::x86_sse41_insertps:
1089 case Intrinsic::x86_sse41_dppd:
1090 case Intrinsic::x86_sse41_dpps:
1091 case Intrinsic::x86_sse41_mpsadbw:
Chandler Carruth373b2b12014-09-06 10:00:01 +00001092 case Intrinsic::x86_avx_dp_ps_256:
Chandler Carruth373b2b12014-09-06 10:00:01 +00001093 case Intrinsic::x86_avx2_mpsadbw: {
1094 // Need to truncate the last argument from i32 to i8 -- this argument models
1095 // an inherently 8-bit immediate operand to these x86 instructions.
1096 SmallVector<Value *, 4> Args(CI->arg_operands().begin(),
1097 CI->arg_operands().end());
1098
1099 // Replace the last argument with a trunc.
1100 Args.back() = Builder.CreateTrunc(Args.back(), Type::getInt8Ty(C), "trunc");
1101
1102 CallInst *NewCall = Builder.CreateCall(NewFn, Args);
1103 CI->replaceAllUsesWith(NewCall);
1104 CI->eraseFromParent();
1105 return;
1106 }
Marcin Koscielnicki3fdc2572016-04-19 20:51:05 +00001107
1108 case Intrinsic::thread_pointer: {
1109 CI->replaceAllUsesWith(Builder.CreateCall(NewFn, {}));
1110 CI->eraseFromParent();
1111 return;
1112 }
Craig Topper71dc02d2012-06-13 07:18:53 +00001113 }
Chandler Carruth7132e002007-08-04 01:51:18 +00001114}
1115
Sanjay Patelfdf0d5f2016-04-18 19:11:57 +00001116void llvm::UpgradeCallsToIntrinsic(Function *F) {
Chandler Carruth7132e002007-08-04 01:51:18 +00001117 assert(F && "Illegal attempt to upgrade a non-existent intrinsic.");
1118
Sanjay Patelfdf0d5f2016-04-18 19:11:57 +00001119 // Check if this function should be upgraded and get the replacement function
1120 // if there is one.
Chris Lattner80ed9dc2011-06-18 06:05:24 +00001121 Function *NewFn;
Evan Cheng0e179d02007-12-17 22:33:23 +00001122 if (UpgradeIntrinsicFunction(F, NewFn)) {
Sanjay Patelfdf0d5f2016-04-18 19:11:57 +00001123 // Replace all users of the old function with the new function or new
1124 // instructions. This is not a range loop because the call is deleted.
1125 for (auto UI = F->user_begin(), UE = F->user_end(); UI != UE; )
Duncan P. N. Exon Smith93f53c42016-04-17 03:59:37 +00001126 if (CallInst *CI = dyn_cast<CallInst>(*UI++))
Filipe Cabecinhas0011c582015-07-03 20:12:01 +00001127 UpgradeIntrinsicCall(CI, NewFn);
Sanjay Patelfdf0d5f2016-04-18 19:11:57 +00001128
Filipe Cabecinhas0011c582015-07-03 20:12:01 +00001129 // Remove old function, no longer used, from the module.
1130 F->eraseFromParent();
Chandler Carruth7132e002007-08-04 01:51:18 +00001131 }
1132}
Devang Patel80ae3492009-08-28 23:24:31 +00001133
Manman Ren209b17c2013-09-28 00:22:27 +00001134void llvm::UpgradeInstWithTBAATag(Instruction *I) {
Duncan P. N. Exon Smithde36e802014-11-11 21:30:22 +00001135 MDNode *MD = I->getMetadata(LLVMContext::MD_tbaa);
Manman Ren209b17c2013-09-28 00:22:27 +00001136 assert(MD && "UpgradeInstWithTBAATag should have a TBAA tag");
1137 // Check if the tag uses struct-path aware TBAA format.
1138 if (isa<MDNode>(MD->getOperand(0)) && MD->getNumOperands() >= 3)
1139 return;
1140
1141 if (MD->getNumOperands() == 3) {
Duncan P. N. Exon Smith5bf8fef2014-12-09 18:38:53 +00001142 Metadata *Elts[] = {MD->getOperand(0), MD->getOperand(1)};
Manman Ren209b17c2013-09-28 00:22:27 +00001143 MDNode *ScalarType = MDNode::get(I->getContext(), Elts);
1144 // Create a MDNode <ScalarType, ScalarType, offset 0, const>
Duncan P. N. Exon Smith5bf8fef2014-12-09 18:38:53 +00001145 Metadata *Elts2[] = {ScalarType, ScalarType,
1146 ConstantAsMetadata::get(Constant::getNullValue(
1147 Type::getInt64Ty(I->getContext()))),
1148 MD->getOperand(2)};
Manman Ren209b17c2013-09-28 00:22:27 +00001149 I->setMetadata(LLVMContext::MD_tbaa, MDNode::get(I->getContext(), Elts2));
1150 } else {
1151 // Create a MDNode <MD, MD, offset 0>
Duncan P. N. Exon Smith5bf8fef2014-12-09 18:38:53 +00001152 Metadata *Elts[] = {MD, MD, ConstantAsMetadata::get(Constant::getNullValue(
1153 Type::getInt64Ty(I->getContext())))};
Manman Ren209b17c2013-09-28 00:22:27 +00001154 I->setMetadata(LLVMContext::MD_tbaa, MDNode::get(I->getContext(), Elts));
1155 }
1156}
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001157
1158Instruction *llvm::UpgradeBitCastInst(unsigned Opc, Value *V, Type *DestTy,
1159 Instruction *&Temp) {
1160 if (Opc != Instruction::BitCast)
Craig Topperc6207612014-04-09 06:08:46 +00001161 return nullptr;
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001162
Craig Topperc6207612014-04-09 06:08:46 +00001163 Temp = nullptr;
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001164 Type *SrcTy = V->getType();
1165 if (SrcTy->isPtrOrPtrVectorTy() && DestTy->isPtrOrPtrVectorTy() &&
1166 SrcTy->getPointerAddressSpace() != DestTy->getPointerAddressSpace()) {
1167 LLVMContext &Context = V->getContext();
1168
1169 // We have no information about target data layout, so we assume that
1170 // the maximum pointer size is 64bit.
1171 Type *MidTy = Type::getInt64Ty(Context);
1172 Temp = CastInst::Create(Instruction::PtrToInt, V, MidTy);
1173
1174 return CastInst::Create(Instruction::IntToPtr, Temp, DestTy);
1175 }
1176
Craig Topperc6207612014-04-09 06:08:46 +00001177 return nullptr;
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001178}
1179
1180Value *llvm::UpgradeBitCastExpr(unsigned Opc, Constant *C, Type *DestTy) {
1181 if (Opc != Instruction::BitCast)
Craig Topperc6207612014-04-09 06:08:46 +00001182 return nullptr;
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001183
1184 Type *SrcTy = C->getType();
1185 if (SrcTy->isPtrOrPtrVectorTy() && DestTy->isPtrOrPtrVectorTy() &&
1186 SrcTy->getPointerAddressSpace() != DestTy->getPointerAddressSpace()) {
1187 LLVMContext &Context = C->getContext();
1188
1189 // We have no information about target data layout, so we assume that
1190 // the maximum pointer size is 64bit.
1191 Type *MidTy = Type::getInt64Ty(Context);
1192
1193 return ConstantExpr::getIntToPtr(ConstantExpr::getPtrToInt(C, MidTy),
1194 DestTy);
1195 }
1196
Craig Topperc6207612014-04-09 06:08:46 +00001197 return nullptr;
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001198}
Manman Ren8b4306c2013-12-02 21:29:56 +00001199
1200/// Check the debug info version number, if it is out-dated, drop the debug
1201/// info. Return true if module is modified.
1202bool llvm::UpgradeDebugInfo(Module &M) {
Manman Ren2ebfb422014-01-16 01:51:12 +00001203 unsigned Version = getDebugMetadataVersionFromModule(M);
1204 if (Version == DEBUG_METADATA_VERSION)
Manman Ren8b4306c2013-12-02 21:29:56 +00001205 return false;
1206
Manman Ren2ebfb422014-01-16 01:51:12 +00001207 bool RetCode = StripDebugInfo(M);
1208 if (RetCode) {
1209 DiagnosticInfoDebugMetadataVersion DiagVersion(M, Version);
1210 M.getContext().diagnose(DiagVersion);
1211 }
1212 return RetCode;
Manman Ren8b4306c2013-12-02 21:29:56 +00001213}
Eli Bendersky5d5e18d2014-06-25 15:41:00 +00001214
Manman Renb5d7ff42016-05-25 23:14:48 +00001215bool llvm::UpgradeModuleFlags(Module &M) {
1216 const NamedMDNode *ModFlags = M.getModuleFlagsMetadata();
1217 if (!ModFlags)
1218 return false;
1219
1220 bool HasObjCFlag = false, HasClassProperties = false;
1221 for (unsigned I = 0, E = ModFlags->getNumOperands(); I != E; ++I) {
1222 MDNode *Op = ModFlags->getOperand(I);
1223 if (Op->getNumOperands() < 2)
1224 continue;
1225 MDString *ID = dyn_cast_or_null<MDString>(Op->getOperand(1));
1226 if (!ID)
1227 continue;
1228 if (ID->getString() == "Objective-C Image Info Version")
1229 HasObjCFlag = true;
1230 if (ID->getString() == "Objective-C Class Properties")
1231 HasClassProperties = true;
1232 }
1233 // "Objective-C Class Properties" is recently added for Objective-C. We
1234 // upgrade ObjC bitcodes to contain a "Objective-C Class Properties" module
1235 // flag of value 0, so we can correclty report error when trying to link
1236 // an ObjC bitcode without this module flag with an ObjC bitcode with this
1237 // module flag.
1238 if (HasObjCFlag && !HasClassProperties) {
1239 M.addModuleFlag(llvm::Module::Error, "Objective-C Class Properties",
1240 (uint32_t)0);
1241 return true;
1242 }
1243 return false;
1244}
1245
Duncan P. N. Exon Smithefe16c82016-03-25 00:56:13 +00001246static bool isOldLoopArgument(Metadata *MD) {
1247 auto *T = dyn_cast_or_null<MDTuple>(MD);
1248 if (!T)
1249 return false;
1250 if (T->getNumOperands() < 1)
1251 return false;
1252 auto *S = dyn_cast_or_null<MDString>(T->getOperand(0));
1253 if (!S)
1254 return false;
1255 return S->getString().startswith("llvm.vectorizer.");
1256}
1257
1258static MDString *upgradeLoopTag(LLVMContext &C, StringRef OldTag) {
1259 StringRef OldPrefix = "llvm.vectorizer.";
1260 assert(OldTag.startswith(OldPrefix) && "Expected old prefix");
1261
1262 if (OldTag == "llvm.vectorizer.unroll")
1263 return MDString::get(C, "llvm.loop.interleave.count");
1264
1265 return MDString::get(
1266 C, (Twine("llvm.loop.vectorize.") + OldTag.drop_front(OldPrefix.size()))
1267 .str());
1268}
1269
1270static Metadata *upgradeLoopArgument(Metadata *MD) {
1271 auto *T = dyn_cast_or_null<MDTuple>(MD);
1272 if (!T)
1273 return MD;
1274 if (T->getNumOperands() < 1)
1275 return MD;
1276 auto *OldTag = dyn_cast_or_null<MDString>(T->getOperand(0));
1277 if (!OldTag)
1278 return MD;
1279 if (!OldTag->getString().startswith("llvm.vectorizer."))
1280 return MD;
1281
1282 // This has an old tag. Upgrade it.
1283 SmallVector<Metadata *, 8> Ops;
1284 Ops.reserve(T->getNumOperands());
1285 Ops.push_back(upgradeLoopTag(T->getContext(), OldTag->getString()));
1286 for (unsigned I = 1, E = T->getNumOperands(); I != E; ++I)
1287 Ops.push_back(T->getOperand(I));
1288
1289 return MDTuple::get(T->getContext(), Ops);
1290}
1291
1292MDNode *llvm::upgradeInstructionLoopAttachment(MDNode &N) {
1293 auto *T = dyn_cast<MDTuple>(&N);
1294 if (!T)
1295 return &N;
1296
1297 if (!llvm::any_of(T->operands(), isOldLoopArgument))
1298 return &N;
1299
1300 SmallVector<Metadata *, 8> Ops;
1301 Ops.reserve(T->getNumOperands());
1302 for (Metadata *MD : T->operands())
1303 Ops.push_back(upgradeLoopArgument(MD));
1304
1305 return MDTuple::get(T->getContext(), Ops);
Eli Bendersky5d5e18d2014-06-25 15:41:00 +00001306}