blob: 08d68d70d5bae063fc14d3b9d2746334584282bd [file] [log] [blame]
//===-- AutoUpgrade.cpp - Implement auto-upgrade helper functions ---------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements the auto-upgrade helper functions.
// This is where deprecated IR intrinsics and other IR features are updated to
// current specifications.
//
//===----------------------------------------------------------------------===//
15
Chandler Carruth91065212014-03-05 10:34:14 +000016#include "llvm/IR/AutoUpgrade.h"
Chandler Carruth1305dc32014-03-04 11:45:46 +000017#include "llvm/IR/CFG.h"
Chandler Carruth219b89b2014-03-04 11:01:28 +000018#include "llvm/IR/CallSite.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000019#include "llvm/IR/Constants.h"
Chandler Carruthd9903882015-01-14 11:23:27 +000020#include "llvm/IR/DIBuilder.h"
Chandler Carruth9a4c9e52014-03-06 00:46:21 +000021#include "llvm/IR/DebugInfo.h"
Manman Ren2ebfb422014-01-16 01:51:12 +000022#include "llvm/IR/DiagnosticInfo.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000023#include "llvm/IR/Function.h"
24#include "llvm/IR/IRBuilder.h"
25#include "llvm/IR/Instruction.h"
26#include "llvm/IR/IntrinsicInst.h"
27#include "llvm/IR/LLVMContext.h"
28#include "llvm/IR/Module.h"
Torok Edwin56d06592009-07-11 20:10:48 +000029#include "llvm/Support/ErrorHandling.h"
Jeroen Ketemaab99b592015-09-30 10:56:37 +000030#include "llvm/Support/Regex.h"
Anton Korobeynikov579f0712008-02-20 11:08:44 +000031#include <cstring>
Chandler Carruth7132e002007-08-04 01:51:18 +000032using namespace llvm;
33
Rafael Espindolad7325ee2016-10-03 15:51:42 +000034static void rename(GlobalValue *GV) { GV->setName(GV->getName() + ".old"); }
35
Nadav Rotem17ee58a2012-06-10 18:42:51 +000036// Upgrade the declarations of the SSE4.1 functions whose arguments have
37// changed their type from v4f32 to v2i64.
38static bool UpgradeSSE41Function(Function* F, Intrinsic::ID IID,
39 Function *&NewFn) {
40 // Check whether this is an old version of the function, which received
41 // v4f32 arguments.
42 Type *Arg0Type = F->getFunctionType()->getParamType(0);
43 if (Arg0Type != VectorType::get(Type::getFloatTy(F->getContext()), 4))
44 return false;
45
46 // Yes, it's old, replace it with new version.
Rafael Espindolad7325ee2016-10-03 15:51:42 +000047 rename(F);
Nadav Rotem17ee58a2012-06-10 18:42:51 +000048 NewFn = Intrinsic::getDeclaration(F->getParent(), IID);
49 return true;
50}
Chandler Carruth7132e002007-08-04 01:51:18 +000051
Chandler Carruth373b2b12014-09-06 10:00:01 +000052// Upgrade the declarations of intrinsic functions whose 8-bit immediate mask
53// arguments have changed their type from i32 to i8.
54static bool UpgradeX86IntrinsicsWith8BitMask(Function *F, Intrinsic::ID IID,
55 Function *&NewFn) {
56 // Check that the last argument is an i32.
57 Type *LastArgType = F->getFunctionType()->getParamType(
58 F->getFunctionType()->getNumParams() - 1);
59 if (!LastArgType->isIntegerTy(32))
60 return false;
61
62 // Move this function aside and map down.
Rafael Espindolad7325ee2016-10-03 15:51:42 +000063 rename(F);
Chandler Carruth373b2b12014-09-06 10:00:01 +000064 NewFn = Intrinsic::getDeclaration(F->getParent(), IID);
65 return true;
66}
67
Evan Cheng0e179d02007-12-17 22:33:23 +000068static bool UpgradeIntrinsicFunction1(Function *F, Function *&NewFn) {
Chandler Carruth7132e002007-08-04 01:51:18 +000069 assert(F && "Illegal to upgrade a non-existent Function.");
70
Chandler Carruth7132e002007-08-04 01:51:18 +000071 // Quickly eliminate it, if it's not a candidate.
Eric Liuc9c68172016-07-08 16:09:51 +000072 StringRef Name = F->getName();
Chris Lattnerb372f662011-06-18 18:56:39 +000073 if (Name.size() <= 8 || !Name.startswith("llvm."))
Evan Cheng0e179d02007-12-17 22:33:23 +000074 return false;
Chris Lattnerb372f662011-06-18 18:56:39 +000075 Name = Name.substr(5); // Strip off "llvm."
Chris Lattner0bcbde42011-11-27 08:42:07 +000076
Chris Lattnerb372f662011-06-18 18:56:39 +000077 switch (Name[0]) {
Chandler Carruth7132e002007-08-04 01:51:18 +000078 default: break;
Joel Jones43cb8782012-07-13 23:25:25 +000079 case 'a': {
80 if (Name.startswith("arm.neon.vclz")) {
81 Type* args[2] = {
Matt Arsenaultc4c92262013-07-20 17:46:00 +000082 F->arg_begin()->getType(),
Joel Jones43cb8782012-07-13 23:25:25 +000083 Type::getInt1Ty(F->getContext())
84 };
85 // Can't use Intrinsic::getDeclaration here as it adds a ".i1" to
86 // the end of the name. Change name from llvm.arm.neon.vclz.* to
87 // llvm.ctlz.*
88 FunctionType* fType = FunctionType::get(F->getReturnType(), args, false);
Matt Arsenaultc4c92262013-07-20 17:46:00 +000089 NewFn = Function::Create(fType, F->getLinkage(),
Joel Jones43cb8782012-07-13 23:25:25 +000090 "llvm.ctlz." + Name.substr(14), F->getParent());
91 return true;
92 }
Joel Jonesb84f7be2012-07-18 00:02:16 +000093 if (Name.startswith("arm.neon.vcnt")) {
94 NewFn = Intrinsic::getDeclaration(F->getParent(), Intrinsic::ctpop,
95 F->arg_begin()->getType());
96 return true;
97 }
Jeroen Ketemaab99b592015-09-30 10:56:37 +000098 Regex vldRegex("^arm\\.neon\\.vld([1234]|[234]lane)\\.v[a-z0-9]*$");
99 if (vldRegex.match(Name)) {
100 auto fArgs = F->getFunctionType()->params();
101 SmallVector<Type *, 4> Tys(fArgs.begin(), fArgs.end());
102 // Can't use Intrinsic::getDeclaration here as the return types might
103 // then only be structurally equal.
104 FunctionType* fType = FunctionType::get(F->getReturnType(), Tys, false);
105 NewFn = Function::Create(fType, F->getLinkage(),
106 "llvm." + Name + ".p0i8", F->getParent());
107 return true;
108 }
109 Regex vstRegex("^arm\\.neon\\.vst([1234]|[234]lane)\\.v[a-z0-9]*$");
110 if (vstRegex.match(Name)) {
Craig Topper26260942015-10-18 05:15:34 +0000111 static const Intrinsic::ID StoreInts[] = {Intrinsic::arm_neon_vst1,
112 Intrinsic::arm_neon_vst2,
113 Intrinsic::arm_neon_vst3,
114 Intrinsic::arm_neon_vst4};
Jeroen Ketemaab99b592015-09-30 10:56:37 +0000115
Craig Topper26260942015-10-18 05:15:34 +0000116 static const Intrinsic::ID StoreLaneInts[] = {
117 Intrinsic::arm_neon_vst2lane, Intrinsic::arm_neon_vst3lane,
118 Intrinsic::arm_neon_vst4lane
119 };
Jeroen Ketemaab99b592015-09-30 10:56:37 +0000120
121 auto fArgs = F->getFunctionType()->params();
122 Type *Tys[] = {fArgs[0], fArgs[1]};
123 if (Name.find("lane") == StringRef::npos)
124 NewFn = Intrinsic::getDeclaration(F->getParent(),
125 StoreInts[fArgs.size() - 3], Tys);
126 else
127 NewFn = Intrinsic::getDeclaration(F->getParent(),
128 StoreLaneInts[fArgs.size() - 5], Tys);
129 return true;
130 }
Marcin Koscielnicki3fdc2572016-04-19 20:51:05 +0000131 if (Name == "aarch64.thread.pointer" || Name == "arm.thread.pointer") {
132 NewFn = Intrinsic::getDeclaration(F->getParent(), Intrinsic::thread_pointer);
133 return true;
134 }
Joel Jones43cb8782012-07-13 23:25:25 +0000135 break;
136 }
Jeroen Ketemaab99b592015-09-30 10:56:37 +0000137
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000138 case 'c': {
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000139 if (Name.startswith("ctlz.") && F->arg_size() == 1) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000140 rename(F);
Chandler Carruthd4a02402011-12-12 10:57:20 +0000141 NewFn = Intrinsic::getDeclaration(F->getParent(), Intrinsic::ctlz,
142 F->arg_begin()->getType());
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000143 return true;
144 }
145 if (Name.startswith("cttz.") && F->arg_size() == 1) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000146 rename(F);
Chandler Carruthd4a02402011-12-12 10:57:20 +0000147 NewFn = Intrinsic::getDeclaration(F->getParent(), Intrinsic::cttz,
148 F->arg_begin()->getType());
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000149 return true;
150 }
151 break;
152 }
Mehdi Amini8c629ec2016-08-13 23:31:24 +0000153 case 'i': {
154 if (Name.startswith("invariant.start")) {
155 auto Args = F->getFunctionType()->params();
156 Type* ObjectPtr[1] = {Args[1]};
157 if (F->getName() !=
158 Intrinsic::getName(Intrinsic::invariant_start, ObjectPtr)) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000159 rename(F);
Mehdi Amini8c629ec2016-08-13 23:31:24 +0000160 NewFn = Intrinsic::getDeclaration(
161 F->getParent(), Intrinsic::invariant_start, ObjectPtr);
162 return true;
163 }
164 }
165 if (Name.startswith("invariant.end")) {
166 auto Args = F->getFunctionType()->params();
167 Type* ObjectPtr[1] = {Args[2]};
168 if (F->getName() !=
169 Intrinsic::getName(Intrinsic::invariant_end, ObjectPtr)) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000170 rename(F);
Mehdi Amini8c629ec2016-08-13 23:31:24 +0000171 NewFn = Intrinsic::getDeclaration(F->getParent(),
172 Intrinsic::invariant_end, ObjectPtr);
173 return true;
174 }
175 }
176 break;
177 }
Artur Pilipenko7ad95ec2016-06-28 18:27:25 +0000178 case 'm': {
179 if (Name.startswith("masked.load.")) {
180 Type *Tys[] = { F->getReturnType(), F->arg_begin()->getType() };
181 if (F->getName() != Intrinsic::getName(Intrinsic::masked_load, Tys)) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000182 rename(F);
Artur Pilipenko7ad95ec2016-06-28 18:27:25 +0000183 NewFn = Intrinsic::getDeclaration(F->getParent(),
184 Intrinsic::masked_load,
185 Tys);
186 return true;
187 }
188 }
189 if (Name.startswith("masked.store.")) {
190 auto Args = F->getFunctionType()->params();
191 Type *Tys[] = { Args[0], Args[1] };
192 if (F->getName() != Intrinsic::getName(Intrinsic::masked_store, Tys)) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000193 rename(F);
Artur Pilipenko7ad95ec2016-06-28 18:27:25 +0000194 NewFn = Intrinsic::getDeclaration(F->getParent(),
195 Intrinsic::masked_store,
196 Tys);
197 return true;
198 }
199 }
200 break;
201 }
202
Matt Arsenaultfbcbce42013-10-07 18:06:48 +0000203 case 'o':
204 // We only need to change the name to match the mangling including the
205 // address space.
206 if (F->arg_size() == 2 && Name.startswith("objectsize.")) {
207 Type *Tys[2] = { F->getReturnType(), F->arg_begin()->getType() };
208 if (F->getName() != Intrinsic::getName(Intrinsic::objectsize, Tys)) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000209 rename(F);
Matt Arsenaultfbcbce42013-10-07 18:06:48 +0000210 NewFn = Intrinsic::getDeclaration(F->getParent(),
211 Intrinsic::objectsize, Tys);
212 return true;
213 }
214 }
215 break;
216
Tim Shen00127562016-04-08 21:26:31 +0000217 case 's':
218 if (Name == "stackprotectorcheck") {
219 NewFn = nullptr;
220 return true;
221 }
222
Craig Topper3b1817d2012-02-03 06:10:55 +0000223 case 'x': {
Craig Topper5aebb862016-07-04 20:56:38 +0000224 bool IsX86 = Name.startswith("x86.");
225 if (IsX86)
226 Name = Name.substr(4);
227
228 if (IsX86 &&
229 (Name.startswith("sse2.pcmpeq.") ||
230 Name.startswith("sse2.pcmpgt.") ||
231 Name.startswith("avx2.pcmpeq.") ||
232 Name.startswith("avx2.pcmpgt.") ||
233 Name.startswith("avx512.mask.pcmpeq.") ||
234 Name.startswith("avx512.mask.pcmpgt.") ||
235 Name == "sse41.pmaxsb" ||
236 Name == "sse2.pmaxs.w" ||
237 Name == "sse41.pmaxsd" ||
238 Name == "sse2.pmaxu.b" ||
239 Name == "sse41.pmaxuw" ||
240 Name == "sse41.pmaxud" ||
241 Name == "sse41.pminsb" ||
242 Name == "sse2.pmins.w" ||
243 Name == "sse41.pminsd" ||
244 Name == "sse2.pminu.b" ||
245 Name == "sse41.pminuw" ||
246 Name == "sse41.pminud" ||
247 Name.startswith("avx2.pmax") ||
248 Name.startswith("avx2.pmin") ||
249 Name.startswith("avx2.vbroadcast") ||
250 Name.startswith("avx2.pbroadcast") ||
251 Name.startswith("avx.vpermil.") ||
252 Name.startswith("sse2.pshuf") ||
Simon Pilgrim4e96fbf2016-07-05 13:58:47 +0000253 Name.startswith("avx512.pbroadcast") ||
254 Name.startswith("avx512.mask.broadcast.s") ||
Craig Topper5aebb862016-07-04 20:56:38 +0000255 Name.startswith("avx512.mask.movddup") ||
256 Name.startswith("avx512.mask.movshdup") ||
257 Name.startswith("avx512.mask.movsldup") ||
258 Name.startswith("avx512.mask.pshuf.d.") ||
259 Name.startswith("avx512.mask.pshufl.w.") ||
260 Name.startswith("avx512.mask.pshufh.w.") ||
Craig Topper4619c9e2016-09-13 07:40:53 +0000261 Name.startswith("avx512.mask.shuf.p") ||
Craig Topper5aebb862016-07-04 20:56:38 +0000262 Name.startswith("avx512.mask.vpermil.p") ||
263 Name.startswith("avx512.mask.perm.df.") ||
264 Name.startswith("avx512.mask.perm.di.") ||
265 Name.startswith("avx512.mask.punpckl") ||
266 Name.startswith("avx512.mask.punpckh") ||
267 Name.startswith("avx512.mask.unpckl.") ||
268 Name.startswith("avx512.mask.unpckh.") ||
Craig Toppera6e6feb2016-07-12 05:27:53 +0000269 Name.startswith("avx512.mask.pand.") ||
270 Name.startswith("avx512.mask.pandn.") ||
271 Name.startswith("avx512.mask.por.") ||
272 Name.startswith("avx512.mask.pxor.") ||
Craig Toppere75c4952016-09-02 05:29:17 +0000273 Name.startswith("avx512.mask.and.") ||
274 Name.startswith("avx512.mask.andn.") ||
275 Name.startswith("avx512.mask.or.") ||
276 Name.startswith("avx512.mask.xor.") ||
Craig Topperaf0d63d2016-09-04 02:09:53 +0000277 Name.startswith("avx512.mask.padd.") ||
278 Name.startswith("avx512.mask.psub.") ||
279 Name.startswith("avx512.mask.pmull.") ||
Craig Topper41773452016-09-04 18:13:33 +0000280 Name.startswith("avx512.mask.add.pd.128") ||
281 Name.startswith("avx512.mask.add.pd.256") ||
282 Name.startswith("avx512.mask.add.ps.128") ||
283 Name.startswith("avx512.mask.add.ps.256") ||
284 Name.startswith("avx512.mask.div.pd.128") ||
285 Name.startswith("avx512.mask.div.pd.256") ||
286 Name.startswith("avx512.mask.div.ps.128") ||
287 Name.startswith("avx512.mask.div.ps.256") ||
288 Name.startswith("avx512.mask.mul.pd.128") ||
289 Name.startswith("avx512.mask.mul.pd.256") ||
290 Name.startswith("avx512.mask.mul.ps.128") ||
291 Name.startswith("avx512.mask.mul.ps.256") ||
292 Name.startswith("avx512.mask.sub.pd.128") ||
293 Name.startswith("avx512.mask.sub.pd.256") ||
294 Name.startswith("avx512.mask.sub.ps.128") ||
295 Name.startswith("avx512.mask.sub.ps.256") ||
Craig Topper5aebb862016-07-04 20:56:38 +0000296 Name.startswith("sse41.pmovsx") ||
297 Name.startswith("sse41.pmovzx") ||
298 Name.startswith("avx2.pmovsx") ||
299 Name.startswith("avx2.pmovzx") ||
300 Name == "sse2.cvtdq2pd" ||
301 Name == "sse2.cvtps2pd" ||
302 Name == "avx.cvtdq2.pd.256" ||
303 Name == "avx.cvt.ps2.pd.256" ||
Craig Topper5aebb862016-07-04 20:56:38 +0000304 Name.startswith("avx.vinsertf128.") ||
305 Name == "avx2.vinserti128" ||
306 Name.startswith("avx.vextractf128.") ||
307 Name == "avx2.vextracti128" ||
308 Name.startswith("sse4a.movnt.") ||
309 Name.startswith("avx.movnt.") ||
Craig Topper70610cf2016-07-09 04:38:27 +0000310 Name.startswith("avx512.storent.") ||
Craig Topper5aebb862016-07-04 20:56:38 +0000311 Name == "sse2.storel.dq" ||
312 Name.startswith("sse.storeu.") ||
313 Name.startswith("sse2.storeu.") ||
314 Name.startswith("avx.storeu.") ||
Craig Toppera57d2ca2016-09-03 23:55:13 +0000315 Name.startswith("avx512.mask.storeu.") ||
Craig Topper5aebb862016-07-04 20:56:38 +0000316 Name.startswith("avx512.mask.store.p") ||
317 Name.startswith("avx512.mask.store.b.") ||
318 Name.startswith("avx512.mask.store.w.") ||
319 Name.startswith("avx512.mask.store.d.") ||
320 Name.startswith("avx512.mask.store.q.") ||
Craig Toppera57d2ca2016-09-03 23:55:13 +0000321 Name.startswith("avx512.mask.loadu.") ||
322 Name.startswith("avx512.mask.load.") ||
Craig Topper5aebb862016-07-04 20:56:38 +0000323 Name == "sse42.crc32.64.8" ||
324 Name.startswith("avx.vbroadcast.s") ||
325 Name.startswith("avx512.mask.palignr.") ||
326 Name.startswith("sse2.psll.dq") ||
327 Name.startswith("sse2.psrl.dq") ||
328 Name.startswith("avx2.psll.dq") ||
329 Name.startswith("avx2.psrl.dq") ||
330 Name.startswith("avx512.psll.dq") ||
331 Name.startswith("avx512.psrl.dq") ||
332 Name == "sse41.pblendw" ||
333 Name.startswith("sse41.blendp") ||
334 Name.startswith("avx.blend.p") ||
335 Name == "avx2.pblendw" ||
336 Name.startswith("avx2.pblendd.") ||
Simon Pilgrimea0d4f92016-07-22 13:58:44 +0000337 Name.startswith("avx.vbroadcastf128") ||
Craig Topper5aebb862016-07-04 20:56:38 +0000338 Name == "avx2.vbroadcasti128" ||
339 Name == "xop.vpcmov" ||
340 (Name.startswith("xop.vpcom") && F->arg_size() == 2))) {
Craig Topperc6207612014-04-09 06:08:46 +0000341 NewFn = nullptr;
Craig Topper3b1817d2012-02-03 06:10:55 +0000342 return true;
343 }
Nadav Rotem17ee58a2012-06-10 18:42:51 +0000344 // SSE4.1 ptest functions may have an old signature.
Craig Topper5aebb862016-07-04 20:56:38 +0000345 if (IsX86 && Name.startswith("sse41.ptest")) {
346 if (Name.substr(11) == "c")
Nadav Rotem17ee58a2012-06-10 18:42:51 +0000347 return UpgradeSSE41Function(F, Intrinsic::x86_sse41_ptestc, NewFn);
Craig Topper5aebb862016-07-04 20:56:38 +0000348 if (Name.substr(11) == "z")
Nadav Rotem17ee58a2012-06-10 18:42:51 +0000349 return UpgradeSSE41Function(F, Intrinsic::x86_sse41_ptestz, NewFn);
Craig Topper5aebb862016-07-04 20:56:38 +0000350 if (Name.substr(11) == "nzc")
Nadav Rotem17ee58a2012-06-10 18:42:51 +0000351 return UpgradeSSE41Function(F, Intrinsic::x86_sse41_ptestnzc, NewFn);
352 }
Sanjay Patel1c3eaec2015-02-28 22:25:06 +0000353 // Several blend and other instructions with masks used the wrong number of
Chandler Carruth373b2b12014-09-06 10:00:01 +0000354 // bits.
Craig Topper5aebb862016-07-04 20:56:38 +0000355 if (IsX86 && Name == "sse41.insertps")
Chandler Carruth373b2b12014-09-06 10:00:01 +0000356 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_sse41_insertps,
357 NewFn);
Craig Topper5aebb862016-07-04 20:56:38 +0000358 if (IsX86 && Name == "sse41.dppd")
Chandler Carruth373b2b12014-09-06 10:00:01 +0000359 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_sse41_dppd,
360 NewFn);
Craig Topper5aebb862016-07-04 20:56:38 +0000361 if (IsX86 && Name == "sse41.dpps")
Chandler Carruth373b2b12014-09-06 10:00:01 +0000362 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_sse41_dpps,
363 NewFn);
Craig Topper5aebb862016-07-04 20:56:38 +0000364 if (IsX86 && Name == "sse41.mpsadbw")
Chandler Carruth373b2b12014-09-06 10:00:01 +0000365 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_sse41_mpsadbw,
366 NewFn);
Craig Topper5aebb862016-07-04 20:56:38 +0000367 if (IsX86 && Name == "avx.dp.ps.256")
Chandler Carruth373b2b12014-09-06 10:00:01 +0000368 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_avx_dp_ps_256,
369 NewFn);
Craig Topper5aebb862016-07-04 20:56:38 +0000370 if (IsX86 && Name == "avx2.mpsadbw")
Chandler Carruth373b2b12014-09-06 10:00:01 +0000371 return UpgradeX86IntrinsicsWith8BitMask(F, Intrinsic::x86_avx2_mpsadbw,
372 NewFn);
Craig Topper29f2e952015-01-25 23:26:02 +0000373
Craig Topper71dc02d2012-06-13 07:18:53 +0000374 // frcz.ss/sd may need to have an argument dropped
Craig Topper5aebb862016-07-04 20:56:38 +0000375 if (IsX86 && Name.startswith("xop.vfrcz.ss") && F->arg_size() == 2) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000376 rename(F);
Craig Topper71dc02d2012-06-13 07:18:53 +0000377 NewFn = Intrinsic::getDeclaration(F->getParent(),
378 Intrinsic::x86_xop_vfrcz_ss);
379 return true;
380 }
Craig Topper5aebb862016-07-04 20:56:38 +0000381 if (IsX86 && Name.startswith("xop.vfrcz.sd") && F->arg_size() == 2) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000382 rename(F);
Craig Topper71dc02d2012-06-13 07:18:53 +0000383 NewFn = Intrinsic::getDeclaration(F->getParent(),
384 Intrinsic::x86_xop_vfrcz_sd);
385 return true;
386 }
Craig Topperf7bf6de2016-07-08 06:14:47 +0000387 if (IsX86 && (Name.startswith("avx512.mask.pslli.") ||
388 Name.startswith("avx512.mask.psrai.") ||
389 Name.startswith("avx512.mask.psrli."))) {
Craig Topperf7bf6de2016-07-08 06:14:47 +0000390 Intrinsic::ID ShiftID;
391 if (Name.slice(12, 16) == "psll")
392 ShiftID = Name[18] == 'd' ? Intrinsic::x86_avx512_mask_psll_di_512
393 : Intrinsic::x86_avx512_mask_psll_qi_512;
394 else if (Name.slice(12, 16) == "psra")
395 ShiftID = Name[18] == 'd' ? Intrinsic::x86_avx512_mask_psra_di_512
396 : Intrinsic::x86_avx512_mask_psra_qi_512;
397 else
398 ShiftID = Name[18] == 'd' ? Intrinsic::x86_avx512_mask_psrl_di_512
399 : Intrinsic::x86_avx512_mask_psrl_qi_512;
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000400 rename(F);
Craig Topperf7bf6de2016-07-08 06:14:47 +0000401 NewFn = Intrinsic::getDeclaration(F->getParent(), ShiftID);
402 return true;
403 }
Craig Topper720c7bd2012-06-03 08:07:25 +0000404 // Fix the FMA4 intrinsics to remove the 4
Craig Topper5aebb862016-07-04 20:56:38 +0000405 if (IsX86 && Name.startswith("fma4.")) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000406 rename(F);
Craig Topper2c5ccd82012-06-03 16:48:52 +0000407 NewFn = F;
408 return true;
Craig Topper720c7bd2012-06-03 08:07:25 +0000409 }
Simon Pilgrime85506b2016-06-03 08:06:03 +0000410 // Upgrade any XOP PERMIL2 index operand still using a float/double vector.
Craig Topper5aebb862016-07-04 20:56:38 +0000411 if (IsX86 && Name.startswith("xop.vpermil2")) {
Simon Pilgrime85506b2016-06-03 08:06:03 +0000412 auto Params = F->getFunctionType()->params();
413 auto Idx = Params[2];
414 if (Idx->getScalarType()->isFloatingPointTy()) {
Rafael Espindolad7325ee2016-10-03 15:51:42 +0000415 rename(F);
Simon Pilgrime85506b2016-06-03 08:06:03 +0000416 unsigned IdxSize = Idx->getPrimitiveSizeInBits();
417 unsigned EltSize = Idx->getScalarSizeInBits();
418 Intrinsic::ID Permil2ID;
419 if (EltSize == 64 && IdxSize == 128)
420 Permil2ID = Intrinsic::x86_xop_vpermil2pd;
421 else if (EltSize == 32 && IdxSize == 128)
422 Permil2ID = Intrinsic::x86_xop_vpermil2ps;
423 else if (EltSize == 64 && IdxSize == 256)
424 Permil2ID = Intrinsic::x86_xop_vpermil2pd_256;
425 else
426 Permil2ID = Intrinsic::x86_xop_vpermil2ps_256;
427 NewFn = Intrinsic::getDeclaration(F->getParent(), Permil2ID);
428 return true;
429 }
430 }
Craig Topper3b1817d2012-02-03 06:10:55 +0000431 break;
432 }
Chris Lattnerb372f662011-06-18 18:56:39 +0000433 }
Chandler Carruth7132e002007-08-04 01:51:18 +0000434
Nadav Rotem17ee58a2012-06-10 18:42:51 +0000435 // This may not belong here. This function is effectively being overloaded
436 // to both detect an intrinsic which needs upgrading, and to provide the
437 // upgraded form of the intrinsic. We should perhaps have two separate
Chandler Carruth7132e002007-08-04 01:51:18 +0000438 // functions for this.
Evan Cheng0e179d02007-12-17 22:33:23 +0000439 return false;
Chandler Carruth7132e002007-08-04 01:51:18 +0000440}
441
Evan Cheng0e179d02007-12-17 22:33:23 +0000442bool llvm::UpgradeIntrinsicFunction(Function *F, Function *&NewFn) {
Craig Topperc6207612014-04-09 06:08:46 +0000443 NewFn = nullptr;
Evan Cheng0e179d02007-12-17 22:33:23 +0000444 bool Upgraded = UpgradeIntrinsicFunction1(F, NewFn);
Filipe Cabecinhas0011c582015-07-03 20:12:01 +0000445 assert(F != NewFn && "Intrinsic function upgraded to the same function");
Duncan Sands38ef3a82007-12-03 20:06:50 +0000446
447 // Upgrade intrinsic attributes. This does not change the function.
Evan Cheng0e179d02007-12-17 22:33:23 +0000448 if (NewFn)
449 F = NewFn;
Pete Cooper9e1d3352015-05-20 17:16:39 +0000450 if (Intrinsic::ID id = F->getIntrinsicID())
451 F->setAttributes(Intrinsic::getAttributes(F->getContext(), id));
Duncan Sands38ef3a82007-12-03 20:06:50 +0000452 return Upgraded;
453}
454
Bill Wendlinge26fffc2010-09-10 18:51:56 +0000455bool llvm::UpgradeGlobalVariable(GlobalVariable *GV) {
Chris Lattner80ed9dc2011-06-18 06:05:24 +0000456 // Nothing to do yet.
Bill Wendlinge26fffc2010-09-10 18:51:56 +0000457 return false;
458}
459
Simon Pilgrimf7186822016-06-09 21:09:03 +0000460// Handles upgrading SSE2/AVX2/AVX512BW PSLLDQ intrinsics by converting them
Craig Topperb324e432015-02-18 06:24:44 +0000461// to byte shuffles.
Craig Topper46b34fe2016-07-12 01:42:33 +0000462static Value *UpgradeX86PSLLDQIntrinsics(IRBuilder<> &Builder,
Craig Topper7355ac32016-05-29 06:37:33 +0000463 Value *Op, unsigned Shift) {
464 Type *ResultTy = Op->getType();
465 unsigned NumElts = ResultTy->getVectorNumElements() * 8;
Craig Topperb324e432015-02-18 06:24:44 +0000466
467 // Bitcast from a 64-bit element type to a byte element type.
Craig Topper46b34fe2016-07-12 01:42:33 +0000468 Type *VecTy = VectorType::get(Builder.getInt8Ty(), NumElts);
Craig Topper7355ac32016-05-29 06:37:33 +0000469 Op = Builder.CreateBitCast(Op, VecTy, "cast");
470
Craig Topperb324e432015-02-18 06:24:44 +0000471 // We'll be shuffling in zeroes.
Craig Topper7355ac32016-05-29 06:37:33 +0000472 Value *Res = Constant::getNullValue(VecTy);
Craig Topperb324e432015-02-18 06:24:44 +0000473
474 // If shift is less than 16, emit a shuffle to move the bytes. Otherwise,
475 // we'll just return the zero vector.
476 if (Shift < 16) {
Craig Topper99d1eab2016-06-12 00:41:19 +0000477 uint32_t Idxs[64];
Simon Pilgrimf7186822016-06-09 21:09:03 +0000478 // 256/512-bit version is split into 2/4 16-byte lanes.
Craig Topperb324e432015-02-18 06:24:44 +0000479 for (unsigned l = 0; l != NumElts; l += 16)
480 for (unsigned i = 0; i != 16; ++i) {
481 unsigned Idx = NumElts + i - Shift;
482 if (Idx < NumElts)
483 Idx -= NumElts - 16; // end of lane, switch operand.
Craig Topper7355ac32016-05-29 06:37:33 +0000484 Idxs[l + i] = Idx + l;
Craig Topperb324e432015-02-18 06:24:44 +0000485 }
486
Craig Topper7355ac32016-05-29 06:37:33 +0000487 Res = Builder.CreateShuffleVector(Res, Op, makeArrayRef(Idxs, NumElts));
Craig Topperb324e432015-02-18 06:24:44 +0000488 }
489
490 // Bitcast back to a 64-bit element type.
Craig Topper7355ac32016-05-29 06:37:33 +0000491 return Builder.CreateBitCast(Res, ResultTy, "cast");
Craig Topperb324e432015-02-18 06:24:44 +0000492}
493
Craig Topperea703ae2016-06-13 02:36:42 +0000494// Handles upgrading SSE2/AVX2/AVX512BW PSRLDQ intrinsics by converting them
495// to byte shuffles.
Craig Topper46b34fe2016-07-12 01:42:33 +0000496static Value *UpgradeX86PSRLDQIntrinsics(IRBuilder<> &Builder, Value *Op,
Craig Topperea703ae2016-06-13 02:36:42 +0000497 unsigned Shift) {
498 Type *ResultTy = Op->getType();
499 unsigned NumElts = ResultTy->getVectorNumElements() * 8;
500
501 // Bitcast from a 64-bit element type to a byte element type.
Craig Topper46b34fe2016-07-12 01:42:33 +0000502 Type *VecTy = VectorType::get(Builder.getInt8Ty(), NumElts);
Craig Topperea703ae2016-06-13 02:36:42 +0000503 Op = Builder.CreateBitCast(Op, VecTy, "cast");
504
505 // We'll be shuffling in zeroes.
506 Value *Res = Constant::getNullValue(VecTy);
507
508 // If shift is less than 16, emit a shuffle to move the bytes. Otherwise,
509 // we'll just return the zero vector.
510 if (Shift < 16) {
511 uint32_t Idxs[64];
512 // 256/512-bit version is split into 2/4 16-byte lanes.
513 for (unsigned l = 0; l != NumElts; l += 16)
514 for (unsigned i = 0; i != 16; ++i) {
515 unsigned Idx = i + Shift;
516 if (Idx >= 16)
517 Idx += NumElts - 16; // end of lane, switch operand.
518 Idxs[l + i] = Idx + l;
519 }
520
521 Res = Builder.CreateShuffleVector(Op, Res, makeArrayRef(Idxs, NumElts));
522 }
523
524 // Bitcast back to a 64-bit element type.
525 return Builder.CreateBitCast(Res, ResultTy, "cast");
526}
527
528static Value *getX86MaskVec(IRBuilder<> &Builder, Value *Mask,
529 unsigned NumElts) {
530 llvm::VectorType *MaskTy = llvm::VectorType::get(Builder.getInt1Ty(),
531 cast<IntegerType>(Mask->getType())->getBitWidth());
532 Mask = Builder.CreateBitCast(Mask, MaskTy);
533
534 // If we have less than 8 elements, then the starting mask was an i8 and
535 // we need to extract down to the right number of elements.
536 if (NumElts < 8) {
537 uint32_t Indices[4];
538 for (unsigned i = 0; i != NumElts; ++i)
539 Indices[i] = i;
540 Mask = Builder.CreateShuffleVector(Mask, Mask,
541 makeArrayRef(Indices, NumElts),
542 "extract");
543 }
544
545 return Mask;
546}
547
548static Value *EmitX86Select(IRBuilder<> &Builder, Value *Mask,
549 Value *Op0, Value *Op1) {
550 // If the mask is all ones just emit the align operation.
551 if (const auto *C = dyn_cast<Constant>(Mask))
552 if (C->isAllOnesValue())
553 return Op0;
554
555 Mask = getX86MaskVec(Builder, Mask, Op0->getType()->getVectorNumElements());
556 return Builder.CreateSelect(Mask, Op0, Op1);
557}
558
Craig Topper46b34fe2016-07-12 01:42:33 +0000559static Value *UpgradeX86PALIGNRIntrinsics(IRBuilder<> &Builder,
Craig Topper33350cc2016-06-06 06:12:54 +0000560 Value *Op0, Value *Op1, Value *Shift,
561 Value *Passthru, Value *Mask) {
562 unsigned ShiftVal = cast<llvm::ConstantInt>(Shift)->getZExtValue();
563
564 unsigned NumElts = Op0->getType()->getVectorNumElements();
565 assert(NumElts % 16 == 0);
566
567 // If palignr is shifting the pair of vectors more than the size of two
568 // lanes, emit zero.
569 if (ShiftVal >= 32)
570 return llvm::Constant::getNullValue(Op0->getType());
571
572 // If palignr is shifting the pair of input vectors more than one lane,
573 // but less than two lanes, convert to shifting in zeroes.
574 if (ShiftVal > 16) {
575 ShiftVal -= 16;
576 Op1 = Op0;
577 Op0 = llvm::Constant::getNullValue(Op0->getType());
578 }
579
Craig Topper99d1eab2016-06-12 00:41:19 +0000580 uint32_t Indices[64];
Craig Topper33350cc2016-06-06 06:12:54 +0000581 // 256-bit palignr operates on 128-bit lanes so we need to handle that
582 for (unsigned l = 0; l != NumElts; l += 16) {
583 for (unsigned i = 0; i != 16; ++i) {
584 unsigned Idx = ShiftVal + i;
585 if (Idx >= 16)
586 Idx += NumElts - 16; // End of lane, switch operand.
587 Indices[l + i] = Idx + l;
588 }
589 }
590
591 Value *Align = Builder.CreateShuffleVector(Op1, Op0,
592 makeArrayRef(Indices, NumElts),
593 "palignr");
594
Craig Topperea703ae2016-06-13 02:36:42 +0000595 return EmitX86Select(Builder, Mask, Align, Passthru);
Craig Topperb324e432015-02-18 06:24:44 +0000596}
597
Craig Topper46b34fe2016-07-12 01:42:33 +0000598static Value *UpgradeMaskedStore(IRBuilder<> &Builder,
Craig Topper50f85c22016-05-31 01:50:02 +0000599 Value *Ptr, Value *Data, Value *Mask,
600 bool Aligned) {
601 // Cast the pointer to the right type.
602 Ptr = Builder.CreateBitCast(Ptr,
603 llvm::PointerType::getUnqual(Data->getType()));
604 unsigned Align =
605 Aligned ? cast<VectorType>(Data->getType())->getBitWidth() / 8 : 1;
606
607 // If the mask is all ones just emit a regular store.
608 if (const auto *C = dyn_cast<Constant>(Mask))
609 if (C->isAllOnesValue())
610 return Builder.CreateAlignedStore(Data, Ptr, Align);
611
612 // Convert the mask from an integer type to a vector of i1.
613 unsigned NumElts = Data->getType()->getVectorNumElements();
Craig Topperea703ae2016-06-13 02:36:42 +0000614 Mask = getX86MaskVec(Builder, Mask, NumElts);
Craig Topper50f85c22016-05-31 01:50:02 +0000615 return Builder.CreateMaskedStore(Data, Ptr, Align, Mask);
616}
617
Craig Topper46b34fe2016-07-12 01:42:33 +0000618static Value *UpgradeMaskedLoad(IRBuilder<> &Builder,
Craig Topperf10fbfa2016-06-02 04:19:36 +0000619 Value *Ptr, Value *Passthru, Value *Mask,
620 bool Aligned) {
621 // Cast the pointer to the right type.
622 Ptr = Builder.CreateBitCast(Ptr,
623 llvm::PointerType::getUnqual(Passthru->getType()));
624 unsigned Align =
625 Aligned ? cast<VectorType>(Passthru->getType())->getBitWidth() / 8 : 1;
626
627 // If the mask is all ones just emit a regular store.
628 if (const auto *C = dyn_cast<Constant>(Mask))
629 if (C->isAllOnesValue())
630 return Builder.CreateAlignedLoad(Ptr, Align);
631
632 // Convert the mask from an integer type to a vector of i1.
633 unsigned NumElts = Passthru->getType()->getVectorNumElements();
Craig Topperea703ae2016-06-13 02:36:42 +0000634 Mask = getX86MaskVec(Builder, Mask, NumElts);
Craig Topperf10fbfa2016-06-02 04:19:36 +0000635 return Builder.CreateMaskedLoad(Ptr, Align, Mask, Passthru);
636}
637
Sanjay Patel51ab7572016-06-16 15:48:30 +0000638static Value *upgradeIntMinMax(IRBuilder<> &Builder, CallInst &CI,
639 ICmpInst::Predicate Pred) {
640 Value *Op0 = CI.getArgOperand(0);
641 Value *Op1 = CI.getArgOperand(1);
642 Value *Cmp = Builder.CreateICmp(Pred, Op0, Op1);
643 return Builder.CreateSelect(Cmp, Op0, Op1);
644}
645
Craig Topper0a0fb0f2016-06-21 03:53:24 +0000646static Value *upgradeMaskedCompare(IRBuilder<> &Builder, CallInst &CI,
647 ICmpInst::Predicate Pred) {
648 Value *Op0 = CI.getArgOperand(0);
649 unsigned NumElts = Op0->getType()->getVectorNumElements();
650 Value *Cmp = Builder.CreateICmp(Pred, Op0, CI.getArgOperand(1));
651
652 Value *Mask = CI.getArgOperand(2);
653 const auto *C = dyn_cast<Constant>(Mask);
654 if (!C || !C->isAllOnesValue())
655 Cmp = Builder.CreateAnd(Cmp, getX86MaskVec(Builder, Mask, NumElts));
656
657 if (NumElts < 8) {
658 uint32_t Indices[8];
659 for (unsigned i = 0; i != NumElts; ++i)
660 Indices[i] = i;
661 for (unsigned i = NumElts; i != 8; ++i)
Craig Topperd5d2a352016-07-07 06:11:07 +0000662 Indices[i] = NumElts + i % NumElts;
663 Cmp = Builder.CreateShuffleVector(Cmp,
664 Constant::getNullValue(Cmp->getType()),
Craig Topper0a0fb0f2016-06-21 03:53:24 +0000665 Indices);
666 }
667 return Builder.CreateBitCast(Cmp, IntegerType::get(CI.getContext(),
668 std::max(NumElts, 8U)));
669}
670
Sanjay Patel595098f2016-06-15 22:01:28 +0000671/// Upgrade a call to an old intrinsic. All argument and return casting must be
672/// provided to seamlessly integrate with existing context.
Chandler Carruth7132e002007-08-04 01:51:18 +0000673void llvm::UpgradeIntrinsicCall(CallInst *CI, Function *NewFn) {
Craig Topper3b1817d2012-02-03 06:10:55 +0000674 Function *F = CI->getCalledFunction();
Nick Lewycky2eb3ade2011-12-12 22:59:34 +0000675 LLVMContext &C = CI->getContext();
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000676 IRBuilder<> Builder(C);
Duncan P. N. Exon Smith52888a62015-10-08 23:49:46 +0000677 Builder.SetInsertPoint(CI->getParent(), CI->getIterator());
Chandler Carruth58a71ed2011-12-12 04:26:04 +0000678
Craig Topper3b1817d2012-02-03 06:10:55 +0000679 assert(F && "Intrinsic call is not direct?");
680
681 if (!NewFn) {
682 // Get the Function's name.
683 StringRef Name = F->getName();
684
Craig Topper5aebb862016-07-04 20:56:38 +0000685 assert(Name.startswith("llvm.") && "Intrinsic doesn't start with 'llvm.'");
686 Name = Name.substr(5);
687
688 bool IsX86 = Name.startswith("x86.");
689 if (IsX86)
690 Name = Name.substr(4);
691
Craig Topper3b1817d2012-02-03 06:10:55 +0000692 Value *Rep;
Sanjay Patel595098f2016-06-15 22:01:28 +0000693 // Upgrade packed integer vector compare intrinsics to compare instructions.
Craig Topper5aebb862016-07-04 20:56:38 +0000694 if (IsX86 && (Name.startswith("sse2.pcmpeq.") ||
695 Name.startswith("avx2.pcmpeq."))) {
Craig Topper3b1817d2012-02-03 06:10:55 +0000696 Rep = Builder.CreateICmpEQ(CI->getArgOperand(0), CI->getArgOperand(1),
697 "pcmpeq");
Craig Topper3b1817d2012-02-03 06:10:55 +0000698 Rep = Builder.CreateSExt(Rep, CI->getType(), "");
Craig Topper5aebb862016-07-04 20:56:38 +0000699 } else if (IsX86 && (Name.startswith("sse2.pcmpgt.") ||
700 Name.startswith("avx2.pcmpgt."))) {
Craig Topper3b1817d2012-02-03 06:10:55 +0000701 Rep = Builder.CreateICmpSGT(CI->getArgOperand(0), CI->getArgOperand(1),
702 "pcmpgt");
Craig Topper3b1817d2012-02-03 06:10:55 +0000703 Rep = Builder.CreateSExt(Rep, CI->getType(), "");
Craig Topper5aebb862016-07-04 20:56:38 +0000704 } else if (IsX86 && Name.startswith("avx512.mask.pcmpeq.")) {
Craig Topper0a0fb0f2016-06-21 03:53:24 +0000705 Rep = upgradeMaskedCompare(Builder, *CI, ICmpInst::ICMP_EQ);
Craig Topper5aebb862016-07-04 20:56:38 +0000706 } else if (IsX86 && Name.startswith("avx512.mask.pcmpgt.")) {
Craig Topper0a0fb0f2016-06-21 03:53:24 +0000707 Rep = upgradeMaskedCompare(Builder, *CI, ICmpInst::ICMP_SGT);
Craig Topper5aebb862016-07-04 20:56:38 +0000708 } else if (IsX86 && (Name == "sse41.pmaxsb" ||
709 Name == "sse2.pmaxs.w" ||
710 Name == "sse41.pmaxsd" ||
711 Name.startswith("avx2.pmaxs"))) {
Sanjay Patel51ab7572016-06-16 15:48:30 +0000712 Rep = upgradeIntMinMax(Builder, *CI, ICmpInst::ICMP_SGT);
Craig Topper5aebb862016-07-04 20:56:38 +0000713 } else if (IsX86 && (Name == "sse2.pmaxu.b" ||
714 Name == "sse41.pmaxuw" ||
715 Name == "sse41.pmaxud" ||
716 Name.startswith("avx2.pmaxu"))) {
Sanjay Patel51ab7572016-06-16 15:48:30 +0000717 Rep = upgradeIntMinMax(Builder, *CI, ICmpInst::ICMP_UGT);
Craig Topper5aebb862016-07-04 20:56:38 +0000718 } else if (IsX86 && (Name == "sse41.pminsb" ||
719 Name == "sse2.pmins.w" ||
720 Name == "sse41.pminsd" ||
721 Name.startswith("avx2.pmins"))) {
Sanjay Patel51ab7572016-06-16 15:48:30 +0000722 Rep = upgradeIntMinMax(Builder, *CI, ICmpInst::ICMP_SLT);
Craig Topper5aebb862016-07-04 20:56:38 +0000723 } else if (IsX86 && (Name == "sse2.pminu.b" ||
724 Name == "sse41.pminuw" ||
725 Name == "sse41.pminud" ||
726 Name.startswith("avx2.pminu"))) {
Sanjay Patel51ab7572016-06-16 15:48:30 +0000727 Rep = upgradeIntMinMax(Builder, *CI, ICmpInst::ICMP_ULT);
Craig Topper5aebb862016-07-04 20:56:38 +0000728 } else if (IsX86 && (Name == "sse2.cvtdq2pd" ||
729 Name == "sse2.cvtps2pd" ||
730 Name == "avx.cvtdq2.pd.256" ||
731 Name == "avx.cvt.ps2.pd.256")) {
Simon Pilgrim4298d062016-05-25 08:59:18 +0000732 // Lossless i32/float to double conversion.
733 // Extract the bottom elements if necessary and convert to double vector.
734 Value *Src = CI->getArgOperand(0);
735 VectorType *SrcTy = cast<VectorType>(Src->getType());
736 VectorType *DstTy = cast<VectorType>(CI->getType());
737 Rep = CI->getArgOperand(0);
738
739 unsigned NumDstElts = DstTy->getNumElements();
740 if (NumDstElts < SrcTy->getNumElements()) {
741 assert(NumDstElts == 2 && "Unexpected vector size");
Craig Topper99d1eab2016-06-12 00:41:19 +0000742 uint32_t ShuffleMask[2] = { 0, 1 };
743 Rep = Builder.CreateShuffleVector(Rep, UndefValue::get(SrcTy),
744 ShuffleMask);
Simon Pilgrim4298d062016-05-25 08:59:18 +0000745 }
746
747 bool Int2Double = (StringRef::npos != Name.find("cvtdq2"));
748 if (Int2Double)
749 Rep = Builder.CreateSIToFP(Rep, DstTy, "cvtdq2pd");
750 else
751 Rep = Builder.CreateFPExt(Rep, DstTy, "cvtps2pd");
Craig Topper5aebb862016-07-04 20:56:38 +0000752 } else if (IsX86 && Name.startswith("sse4a.movnt.")) {
Simon Pilgrimf4b2af12016-06-18 02:38:26 +0000753 Module *M = F->getParent();
754 SmallVector<Metadata *, 1> Elts;
755 Elts.push_back(
756 ConstantAsMetadata::get(ConstantInt::get(Type::getInt32Ty(C), 1)));
757 MDNode *Node = MDNode::get(C, Elts);
758
759 Value *Arg0 = CI->getArgOperand(0);
760 Value *Arg1 = CI->getArgOperand(1);
761
762 // Nontemporal (unaligned) store of the 0'th element of the float/double
763 // vector.
764 Type *SrcEltTy = cast<VectorType>(Arg1->getType())->getElementType();
765 PointerType *EltPtrTy = PointerType::getUnqual(SrcEltTy);
766 Value *Addr = Builder.CreateBitCast(Arg0, EltPtrTy, "cast");
767 Value *Extract =
768 Builder.CreateExtractElement(Arg1, (uint64_t)0, "extractelement");
769
770 StoreInst *SI = Builder.CreateAlignedStore(Extract, Addr, 1);
771 SI->setMetadata(M->getMDKindID("nontemporal"), Node);
772
773 // Remove intrinsic.
774 CI->eraseFromParent();
775 return;
Craig Topper70610cf2016-07-09 04:38:27 +0000776 } else if (IsX86 && (Name.startswith("avx.movnt.") ||
777 Name.startswith("avx512.storent."))) {
Craig Topper7daf8972012-05-08 06:58:15 +0000778 Module *M = F->getParent();
Duncan P. N. Exon Smith5bf8fef2014-12-09 18:38:53 +0000779 SmallVector<Metadata *, 1> Elts;
780 Elts.push_back(
781 ConstantAsMetadata::get(ConstantInt::get(Type::getInt32Ty(C), 1)));
Craig Topper7daf8972012-05-08 06:58:15 +0000782 MDNode *Node = MDNode::get(C, Elts);
783
784 Value *Arg0 = CI->getArgOperand(0);
785 Value *Arg1 = CI->getArgOperand(1);
786
787 // Convert the type of the pointer to a pointer to the stored type.
788 Value *BC = Builder.CreateBitCast(Arg0,
789 PointerType::getUnqual(Arg1->getType()),
790 "cast");
Craig Topper70610cf2016-07-09 04:38:27 +0000791 VectorType *VTy = cast<VectorType>(Arg1->getType());
792 StoreInst *SI = Builder.CreateAlignedStore(Arg1, BC,
793 VTy->getBitWidth() / 8);
Craig Topper7daf8972012-05-08 06:58:15 +0000794 SI->setMetadata(M->getMDKindID("nontemporal"), Node);
Craig Topper7daf8972012-05-08 06:58:15 +0000795
796 // Remove intrinsic.
797 CI->eraseFromParent();
798 return;
Craig Topper5aebb862016-07-04 20:56:38 +0000799 } else if (IsX86 && Name == "sse2.storel.dq") {
Craig Topper12e322a2016-05-25 06:56:32 +0000800 Value *Arg0 = CI->getArgOperand(0);
801 Value *Arg1 = CI->getArgOperand(1);
802
803 Type *NewVecTy = VectorType::get(Type::getInt64Ty(C), 2);
804 Value *BC0 = Builder.CreateBitCast(Arg1, NewVecTy, "cast");
805 Value *Elt = Builder.CreateExtractElement(BC0, (uint64_t)0);
806 Value *BC = Builder.CreateBitCast(Arg0,
807 PointerType::getUnqual(Elt->getType()),
808 "cast");
Craig Topper29ce55d2016-05-30 22:54:12 +0000809 Builder.CreateAlignedStore(Elt, BC, 1);
Craig Topper12e322a2016-05-25 06:56:32 +0000810
811 // Remove intrinsic.
812 CI->eraseFromParent();
813 return;
Craig Topper5aebb862016-07-04 20:56:38 +0000814 } else if (IsX86 && (Name.startswith("sse.storeu.") ||
815 Name.startswith("sse2.storeu.") ||
816 Name.startswith("avx.storeu."))) {
Craig Topper8287fd82016-05-30 23:15:56 +0000817 Value *Arg0 = CI->getArgOperand(0);
818 Value *Arg1 = CI->getArgOperand(1);
819
820 Arg0 = Builder.CreateBitCast(Arg0,
821 PointerType::getUnqual(Arg1->getType()),
822 "cast");
823 Builder.CreateAlignedStore(Arg1, Arg0, 1);
824
825 // Remove intrinsic.
826 CI->eraseFromParent();
827 return;
Craig Toppera57d2ca2016-09-03 23:55:13 +0000828 } else if (IsX86 && (Name.startswith("avx512.mask.storeu."))) {
Craig Topper46b34fe2016-07-12 01:42:33 +0000829 UpgradeMaskedStore(Builder, CI->getArgOperand(0), CI->getArgOperand(1),
Craig Topper50f85c22016-05-31 01:50:02 +0000830 CI->getArgOperand(2), /*Aligned*/false);
831
832 // Remove intrinsic.
833 CI->eraseFromParent();
834 return;
Craig Toppera57d2ca2016-09-03 23:55:13 +0000835 } else if (IsX86 && (Name.startswith("avx512.mask.store."))) {
Craig Topper46b34fe2016-07-12 01:42:33 +0000836 UpgradeMaskedStore(Builder, CI->getArgOperand(0), CI->getArgOperand(1),
Craig Topper50f85c22016-05-31 01:50:02 +0000837 CI->getArgOperand(2), /*Aligned*/true);
838
839 // Remove intrinsic.
840 CI->eraseFromParent();
841 return;
Craig Toppera57d2ca2016-09-03 23:55:13 +0000842 } else if (IsX86 && (Name.startswith("avx512.mask.loadu."))) {
Craig Topper46b34fe2016-07-12 01:42:33 +0000843 Rep = UpgradeMaskedLoad(Builder, CI->getArgOperand(0),
Craig Topperf10fbfa2016-06-02 04:19:36 +0000844 CI->getArgOperand(1), CI->getArgOperand(2),
845 /*Aligned*/false);
Craig Toppera57d2ca2016-09-03 23:55:13 +0000846 } else if (IsX86 && (Name.startswith("avx512.mask.load."))) {
Craig Topper46b34fe2016-07-12 01:42:33 +0000847 Rep = UpgradeMaskedLoad(Builder, CI->getArgOperand(0),
Craig Topperf10fbfa2016-06-02 04:19:36 +0000848 CI->getArgOperand(1),CI->getArgOperand(2),
849 /*Aligned*/true);
Craig Topper5aebb862016-07-04 20:56:38 +0000850 } else if (IsX86 && Name.startswith("xop.vpcom")) {
Craig Topper3352ba52012-06-09 16:46:13 +0000851 Intrinsic::ID intID;
852 if (Name.endswith("ub"))
853 intID = Intrinsic::x86_xop_vpcomub;
854 else if (Name.endswith("uw"))
855 intID = Intrinsic::x86_xop_vpcomuw;
856 else if (Name.endswith("ud"))
857 intID = Intrinsic::x86_xop_vpcomud;
858 else if (Name.endswith("uq"))
859 intID = Intrinsic::x86_xop_vpcomuq;
860 else if (Name.endswith("b"))
861 intID = Intrinsic::x86_xop_vpcomb;
862 else if (Name.endswith("w"))
863 intID = Intrinsic::x86_xop_vpcomw;
864 else if (Name.endswith("d"))
865 intID = Intrinsic::x86_xop_vpcomd;
866 else if (Name.endswith("q"))
867 intID = Intrinsic::x86_xop_vpcomq;
868 else
869 llvm_unreachable("Unknown suffix");
870
Craig Topper5aebb862016-07-04 20:56:38 +0000871 Name = Name.substr(9); // strip off "xop.vpcom"
Craig Topper3352ba52012-06-09 16:46:13 +0000872 unsigned Imm;
873 if (Name.startswith("lt"))
874 Imm = 0;
875 else if (Name.startswith("le"))
876 Imm = 1;
877 else if (Name.startswith("gt"))
878 Imm = 2;
879 else if (Name.startswith("ge"))
880 Imm = 3;
881 else if (Name.startswith("eq"))
882 Imm = 4;
883 else if (Name.startswith("ne"))
884 Imm = 5;
Craig Topper3352ba52012-06-09 16:46:13 +0000885 else if (Name.startswith("false"))
Craig Toppere32546d2015-02-13 07:42:15 +0000886 Imm = 6;
887 else if (Name.startswith("true"))
Craig Topper3352ba52012-06-09 16:46:13 +0000888 Imm = 7;
889 else
890 llvm_unreachable("Unknown condition");
891
892 Function *VPCOM = Intrinsic::getDeclaration(F->getParent(), intID);
David Blaikieff6409d2015-05-18 22:13:54 +0000893 Rep =
894 Builder.CreateCall(VPCOM, {CI->getArgOperand(0), CI->getArgOperand(1),
895 Builder.getInt8(Imm)});
Craig Topper5aebb862016-07-04 20:56:38 +0000896 } else if (IsX86 && Name == "xop.vpcmov") {
Simon Pilgrime88dc042015-11-03 20:27:01 +0000897 Value *Arg0 = CI->getArgOperand(0);
898 Value *Arg1 = CI->getArgOperand(1);
899 Value *Sel = CI->getArgOperand(2);
900 unsigned NumElts = CI->getType()->getVectorNumElements();
901 Constant *MinusOne = ConstantVector::getSplat(NumElts, Builder.getInt64(-1));
902 Value *NotSel = Builder.CreateXor(Sel, MinusOne);
903 Value *Sel0 = Builder.CreateAnd(Arg0, Sel);
904 Value *Sel1 = Builder.CreateAnd(Arg1, NotSel);
905 Rep = Builder.CreateOr(Sel0, Sel1);
Craig Topper5aebb862016-07-04 20:56:38 +0000906 } else if (IsX86 && Name == "sse42.crc32.64.8") {
Craig Topperef9e9932013-10-15 05:20:47 +0000907 Function *CRC32 = Intrinsic::getDeclaration(F->getParent(),
908 Intrinsic::x86_sse42_crc32_32_8);
909 Value *Trunc0 = Builder.CreateTrunc(CI->getArgOperand(0), Type::getInt32Ty(C));
David Blaikieff6409d2015-05-18 22:13:54 +0000910 Rep = Builder.CreateCall(CRC32, {Trunc0, CI->getArgOperand(1)});
Craig Topperef9e9932013-10-15 05:20:47 +0000911 Rep = Builder.CreateZExt(Rep, CI->getType(), "");
Simon Pilgrimea0d4f92016-07-22 13:58:44 +0000912 } else if (IsX86 && Name.startswith("avx.vbroadcast.s")) {
Adam Nemet39066802014-05-29 23:35:33 +0000913 // Replace broadcasts with a series of insertelements.
914 Type *VecTy = CI->getType();
915 Type *EltTy = VecTy->getVectorElementType();
916 unsigned EltNum = VecTy->getVectorNumElements();
917 Value *Cast = Builder.CreateBitCast(CI->getArgOperand(0),
918 EltTy->getPointerTo());
David Blaikie0c28fd72015-05-20 21:46:30 +0000919 Value *Load = Builder.CreateLoad(EltTy, Cast);
Adam Nemet39066802014-05-29 23:35:33 +0000920 Type *I32Ty = Type::getInt32Ty(C);
921 Rep = UndefValue::get(VecTy);
922 for (unsigned I = 0; I < EltNum; ++I)
923 Rep = Builder.CreateInsertElement(Rep, Load,
924 ConstantInt::get(I32Ty, I));
Craig Topper5aebb862016-07-04 20:56:38 +0000925 } else if (IsX86 && (Name.startswith("sse41.pmovsx") ||
926 Name.startswith("sse41.pmovzx") ||
927 Name.startswith("avx2.pmovsx") ||
928 Name.startswith("avx2.pmovzx"))) {
Simon Pilgrim9cb018b2015-09-23 08:48:33 +0000929 VectorType *SrcTy = cast<VectorType>(CI->getArgOperand(0)->getType());
930 VectorType *DstTy = cast<VectorType>(CI->getType());
931 unsigned NumDstElts = DstTy->getNumElements();
932
Simon Pilgrim9602d672016-05-28 18:03:41 +0000933 // Extract a subvector of the first NumDstElts lanes and sign/zero extend.
Craig Topperc0a5fa02016-06-12 04:48:00 +0000934 SmallVector<uint32_t, 8> ShuffleMask(NumDstElts);
Craig Topper99d1eab2016-06-12 00:41:19 +0000935 for (unsigned i = 0; i != NumDstElts; ++i)
Craig Topperc0a5fa02016-06-12 04:48:00 +0000936 ShuffleMask[i] = i;
Simon Pilgrim9cb018b2015-09-23 08:48:33 +0000937
938 Value *SV = Builder.CreateShuffleVector(
939 CI->getArgOperand(0), UndefValue::get(SrcTy), ShuffleMask);
Simon Pilgrim9602d672016-05-28 18:03:41 +0000940
941 bool DoSext = (StringRef::npos != Name.find("pmovsx"));
942 Rep = DoSext ? Builder.CreateSExt(SV, DstTy)
943 : Builder.CreateZExt(SV, DstTy);
Simon Pilgrimea0d4f92016-07-22 13:58:44 +0000944 } else if (IsX86 && (Name.startswith("avx.vbroadcastf128") ||
945 Name == "avx2.vbroadcasti128")) {
946 // Replace vbroadcastf128/vbroadcasti128 with a vector load+shuffle.
947 Type *EltTy = CI->getType()->getVectorElementType();
948 unsigned NumSrcElts = 128 / EltTy->getPrimitiveSizeInBits();
949 Type *VT = VectorType::get(EltTy, NumSrcElts);
David Blaikie0c28fd72015-05-20 21:46:30 +0000950 Value *Op = Builder.CreatePointerCast(CI->getArgOperand(0),
951 PointerType::getUnqual(VT));
Chandler Carruth0215e762016-08-10 07:41:26 +0000952 Value *Load = Builder.CreateAlignedLoad(Op, 1);
Simon Pilgrimea0d4f92016-07-22 13:58:44 +0000953 if (NumSrcElts == 2)
954 Rep = Builder.CreateShuffleVector(Load, UndefValue::get(Load->getType()),
955 { 0, 1, 0, 1 });
956 else
957 Rep = Builder.CreateShuffleVector(Load, UndefValue::get(Load->getType()),
958 { 0, 1, 2, 3, 0, 1, 2, 3 });
Craig Topper5aebb862016-07-04 20:56:38 +0000959 } else if (IsX86 && (Name.startswith("avx2.pbroadcast") ||
Simon Pilgrim4e96fbf2016-07-05 13:58:47 +0000960 Name.startswith("avx2.vbroadcast") ||
961 Name.startswith("avx512.pbroadcast") ||
962 Name.startswith("avx512.mask.broadcast.s"))) {
Ahmed Bougacha1a4987052015-08-20 20:36:19 +0000963 // Replace vp?broadcasts with a vector shuffle.
964 Value *Op = CI->getArgOperand(0);
965 unsigned NumElts = CI->getType()->getVectorNumElements();
966 Type *MaskTy = VectorType::get(Type::getInt32Ty(C), NumElts);
967 Rep = Builder.CreateShuffleVector(Op, UndefValue::get(Op->getType()),
968 Constant::getNullValue(MaskTy));
Simon Pilgrim4e96fbf2016-07-05 13:58:47 +0000969
970 if (CI->getNumArgOperands() == 3)
971 Rep = EmitX86Select(Builder, CI->getArgOperand(2), Rep,
972 CI->getArgOperand(1));
Craig Topper5aebb862016-07-04 20:56:38 +0000973 } else if (IsX86 && Name.startswith("avx512.mask.palignr.")) {
Craig Topper46b34fe2016-07-12 01:42:33 +0000974 Rep = UpgradeX86PALIGNRIntrinsics(Builder, CI->getArgOperand(0),
Craig Topper33350cc2016-06-06 06:12:54 +0000975 CI->getArgOperand(1),
976 CI->getArgOperand(2),
977 CI->getArgOperand(3),
978 CI->getArgOperand(4));
Craig Topper5aebb862016-07-04 20:56:38 +0000979 } else if (IsX86 && (Name == "sse2.psll.dq" ||
980 Name == "avx2.psll.dq")) {
Craig Topper7355ac32016-05-29 06:37:33 +0000981 // 128/256-bit shift left specified in bits.
Craig Topperb324e432015-02-18 06:24:44 +0000982 unsigned Shift = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
Craig Topper46b34fe2016-07-12 01:42:33 +0000983 Rep = UpgradeX86PSLLDQIntrinsics(Builder, CI->getArgOperand(0),
Craig Topperb324e432015-02-18 06:24:44 +0000984 Shift / 8); // Shift is in bits.
Craig Topper5aebb862016-07-04 20:56:38 +0000985 } else if (IsX86 && (Name == "sse2.psrl.dq" ||
986 Name == "avx2.psrl.dq")) {
Craig Topper7355ac32016-05-29 06:37:33 +0000987 // 128/256-bit shift right specified in bits.
Craig Topperb324e432015-02-18 06:24:44 +0000988 unsigned Shift = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
Craig Topper46b34fe2016-07-12 01:42:33 +0000989 Rep = UpgradeX86PSRLDQIntrinsics(Builder, CI->getArgOperand(0),
Craig Topperb324e432015-02-18 06:24:44 +0000990 Shift / 8); // Shift is in bits.
Craig Topper5aebb862016-07-04 20:56:38 +0000991 } else if (IsX86 && (Name == "sse2.psll.dq.bs" ||
992 Name == "avx2.psll.dq.bs" ||
993 Name == "avx512.psll.dq.512")) {
Simon Pilgrimf7186822016-06-09 21:09:03 +0000994 // 128/256/512-bit shift left specified in bytes.
Craig Topperb324e432015-02-18 06:24:44 +0000995 unsigned Shift = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
Craig Topper46b34fe2016-07-12 01:42:33 +0000996 Rep = UpgradeX86PSLLDQIntrinsics(Builder, CI->getArgOperand(0), Shift);
Craig Topper5aebb862016-07-04 20:56:38 +0000997 } else if (IsX86 && (Name == "sse2.psrl.dq.bs" ||
998 Name == "avx2.psrl.dq.bs" ||
999 Name == "avx512.psrl.dq.512")) {
Simon Pilgrimf7186822016-06-09 21:09:03 +00001000 // 128/256/512-bit shift right specified in bytes.
Craig Topperb324e432015-02-18 06:24:44 +00001001 unsigned Shift = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
Craig Topper46b34fe2016-07-12 01:42:33 +00001002 Rep = UpgradeX86PSRLDQIntrinsics(Builder, CI->getArgOperand(0), Shift);
Craig Topper5aebb862016-07-04 20:56:38 +00001003 } else if (IsX86 && (Name == "sse41.pblendw" ||
1004 Name.startswith("sse41.blendp") ||
1005 Name.startswith("avx.blend.p") ||
1006 Name == "avx2.pblendw" ||
1007 Name.startswith("avx2.pblendd."))) {
Craig Topper782d6202015-02-28 19:33:17 +00001008 Value *Op0 = CI->getArgOperand(0);
1009 Value *Op1 = CI->getArgOperand(1);
1010 unsigned Imm = cast <ConstantInt>(CI->getArgOperand(2))->getZExtValue();
1011 VectorType *VecTy = cast<VectorType>(CI->getType());
1012 unsigned NumElts = VecTy->getNumElements();
1013
Craig Topperc0a5fa02016-06-12 04:48:00 +00001014 SmallVector<uint32_t, 16> Idxs(NumElts);
1015 for (unsigned i = 0; i != NumElts; ++i)
1016 Idxs[i] = ((Imm >> (i%8)) & 1) ? i + NumElts : i;
Craig Topper782d6202015-02-28 19:33:17 +00001017
Craig Topper2f561822016-06-12 01:05:59 +00001018 Rep = Builder.CreateShuffleVector(Op0, Op1, Idxs);
Craig Topper5aebb862016-07-04 20:56:38 +00001019 } else if (IsX86 && (Name.startswith("avx.vinsertf128.") ||
1020 Name == "avx2.vinserti128")) {
Sanjay Patel19792fb2015-03-10 16:08:36 +00001021 Value *Op0 = CI->getArgOperand(0);
1022 Value *Op1 = CI->getArgOperand(1);
1023 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(2))->getZExtValue();
1024 VectorType *VecTy = cast<VectorType>(CI->getType());
1025 unsigned NumElts = VecTy->getNumElements();
Simon Pilgrim9cb018b2015-09-23 08:48:33 +00001026
Sanjay Patel19792fb2015-03-10 16:08:36 +00001027 // Mask off the high bits of the immediate value; hardware ignores those.
1028 Imm = Imm & 1;
Simon Pilgrim9cb018b2015-09-23 08:48:33 +00001029
Sanjay Patel19792fb2015-03-10 16:08:36 +00001030 // Extend the second operand into a vector that is twice as big.
1031 Value *UndefV = UndefValue::get(Op1->getType());
Craig Topperc0a5fa02016-06-12 04:48:00 +00001032 SmallVector<uint32_t, 8> Idxs(NumElts);
1033 for (unsigned i = 0; i != NumElts; ++i)
1034 Idxs[i] = i;
Craig Topper2f561822016-06-12 01:05:59 +00001035 Rep = Builder.CreateShuffleVector(Op1, UndefV, Idxs);
Sanjay Patel19792fb2015-03-10 16:08:36 +00001036
1037 // Insert the second operand into the first operand.
1038
1039 // Note that there is no guarantee that instruction lowering will actually
1040 // produce a vinsertf128 instruction for the created shuffles. In
1041 // particular, the 0 immediate case involves no lane changes, so it can
1042 // be handled as a blend.
1043
1044 // Example of shuffle mask for 32-bit elements:
1045 // Imm = 1 <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 10, i32 11>
1046 // Imm = 0 <i32 8, i32 9, i32 10, i32 11, i32 4, i32 5, i32 6, i32 7 >
1047
Sanjay Patel19792fb2015-03-10 16:08:36 +00001048 // The low half of the result is either the low half of the 1st operand
1049 // or the low half of the 2nd operand (the inserted vector).
Craig Topperc0a5fa02016-06-12 04:48:00 +00001050 for (unsigned i = 0; i != NumElts / 2; ++i)
1051 Idxs[i] = Imm ? i : (i + NumElts);
Sanjay Patel19792fb2015-03-10 16:08:36 +00001052 // The high half of the result is either the low half of the 2nd operand
1053 // (the inserted vector) or the high half of the 1st operand.
Craig Topperc0a5fa02016-06-12 04:48:00 +00001054 for (unsigned i = NumElts / 2; i != NumElts; ++i)
1055 Idxs[i] = Imm ? (i + NumElts / 2) : i;
Craig Topper2f561822016-06-12 01:05:59 +00001056 Rep = Builder.CreateShuffleVector(Op0, Rep, Idxs);
Craig Topper5aebb862016-07-04 20:56:38 +00001057 } else if (IsX86 && (Name.startswith("avx.vextractf128.") ||
1058 Name == "avx2.vextracti128")) {
Sanjay Patelaf1846c2015-03-12 15:15:19 +00001059 Value *Op0 = CI->getArgOperand(0);
1060 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
1061 VectorType *VecTy = cast<VectorType>(CI->getType());
1062 unsigned NumElts = VecTy->getNumElements();
Simon Pilgrim9cb018b2015-09-23 08:48:33 +00001063
Sanjay Patelaf1846c2015-03-12 15:15:19 +00001064 // Mask off the high bits of the immediate value; hardware ignores those.
1065 Imm = Imm & 1;
1066
1067 // Get indexes for either the high half or low half of the input vector.
Craig Topper2f561822016-06-12 01:05:59 +00001068 SmallVector<uint32_t, 4> Idxs(NumElts);
Sanjay Patelaf1846c2015-03-12 15:15:19 +00001069 for (unsigned i = 0; i != NumElts; ++i) {
Craig Topper2f561822016-06-12 01:05:59 +00001070 Idxs[i] = Imm ? (i + NumElts) : i;
Sanjay Patelaf1846c2015-03-12 15:15:19 +00001071 }
1072
1073 Value *UndefV = UndefValue::get(Op0->getType());
Craig Topper2f561822016-06-12 01:05:59 +00001074 Rep = Builder.CreateShuffleVector(Op0, UndefV, Idxs);
Craig Topper5aebb862016-07-04 20:56:38 +00001075 } else if (!IsX86 && Name == "stackprotectorcheck") {
Tim Shen00127562016-04-08 21:26:31 +00001076 Rep = nullptr;
Craig Topper5aebb862016-07-04 20:56:38 +00001077 } else if (IsX86 && (Name.startswith("avx512.mask.perm.df.") ||
1078 Name.startswith("avx512.mask.perm.di."))) {
Simon Pilgrim02d435d2016-07-04 14:19:05 +00001079 Value *Op0 = CI->getArgOperand(0);
1080 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
1081 VectorType *VecTy = cast<VectorType>(CI->getType());
1082 unsigned NumElts = VecTy->getNumElements();
1083
1084 SmallVector<uint32_t, 8> Idxs(NumElts);
1085 for (unsigned i = 0; i != NumElts; ++i)
1086 Idxs[i] = (i & ~0x3) + ((Imm >> (2 * (i & 0x3))) & 3);
1087
1088 Rep = Builder.CreateShuffleVector(Op0, Op0, Idxs);
1089
1090 if (CI->getNumArgOperands() == 4)
1091 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1092 CI->getArgOperand(2));
Craig Topper5aebb862016-07-04 20:56:38 +00001093 } else if (IsX86 && (Name.startswith("avx.vpermil.") ||
1094 Name == "sse2.pshuf.d" ||
1095 Name.startswith("avx512.mask.vpermil.p") ||
1096 Name.startswith("avx512.mask.pshuf.d."))) {
Craig Topper8a105052016-06-12 03:10:47 +00001097 Value *Op0 = CI->getArgOperand(0);
1098 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
1099 VectorType *VecTy = cast<VectorType>(CI->getType());
1100 unsigned NumElts = VecTy->getNumElements();
Simon Pilgrim9fca3002016-07-04 12:40:54 +00001101 // Calculate the size of each index in the immediate.
Craig Topper8a105052016-06-12 03:10:47 +00001102 unsigned IdxSize = 64 / VecTy->getScalarSizeInBits();
1103 unsigned IdxMask = ((1 << IdxSize) - 1);
1104
1105 SmallVector<uint32_t, 8> Idxs(NumElts);
1106 // Lookup the bits for this element, wrapping around the immediate every
1107 // 8-bits. Elements are grouped into sets of 2 or 4 elements so we need
1108 // to offset by the first index of each group.
1109 for (unsigned i = 0; i != NumElts; ++i)
1110 Idxs[i] = ((Imm >> ((i * IdxSize) % 8)) & IdxMask) | (i & ~IdxMask);
1111
1112 Rep = Builder.CreateShuffleVector(Op0, Op0, Idxs);
Craig Topper13cf7ca2016-06-13 02:36:48 +00001113
1114 if (CI->getNumArgOperands() == 4)
1115 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1116 CI->getArgOperand(2));
Craig Topper5aebb862016-07-04 20:56:38 +00001117 } else if (IsX86 && (Name == "sse2.pshufl.w" ||
1118 Name.startswith("avx512.mask.pshufl.w."))) {
Craig Topper10679862016-06-12 14:11:32 +00001119 Value *Op0 = CI->getArgOperand(0);
1120 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
1121 unsigned NumElts = CI->getType()->getVectorNumElements();
1122
1123 SmallVector<uint32_t, 16> Idxs(NumElts);
1124 for (unsigned l = 0; l != NumElts; l += 8) {
1125 for (unsigned i = 0; i != 4; ++i)
1126 Idxs[i + l] = ((Imm >> (2 * i)) & 0x3) + l;
1127 for (unsigned i = 4; i != 8; ++i)
1128 Idxs[i + l] = i + l;
1129 }
1130
1131 Rep = Builder.CreateShuffleVector(Op0, Op0, Idxs);
Craig Topper13cf7ca2016-06-13 02:36:48 +00001132
1133 if (CI->getNumArgOperands() == 4)
1134 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1135 CI->getArgOperand(2));
Craig Topper5aebb862016-07-04 20:56:38 +00001136 } else if (IsX86 && (Name == "sse2.pshufh.w" ||
1137 Name.startswith("avx512.mask.pshufh.w."))) {
Craig Topper10679862016-06-12 14:11:32 +00001138 Value *Op0 = CI->getArgOperand(0);
1139 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(1))->getZExtValue();
1140 unsigned NumElts = CI->getType()->getVectorNumElements();
1141
1142 SmallVector<uint32_t, 16> Idxs(NumElts);
1143 for (unsigned l = 0; l != NumElts; l += 8) {
1144 for (unsigned i = 0; i != 4; ++i)
1145 Idxs[i + l] = i + l;
1146 for (unsigned i = 0; i != 4; ++i)
1147 Idxs[i + l + 4] = ((Imm >> (2 * i)) & 0x3) + 4 + l;
1148 }
1149
1150 Rep = Builder.CreateShuffleVector(Op0, Op0, Idxs);
Craig Topper13cf7ca2016-06-13 02:36:48 +00001151
1152 if (CI->getNumArgOperands() == 4)
1153 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1154 CI->getArgOperand(2));
Craig Topper4619c9e2016-09-13 07:40:53 +00001155 } else if (IsX86 && Name.startswith("avx512.mask.shuf.p")) {
1156 Value *Op0 = CI->getArgOperand(0);
1157 Value *Op1 = CI->getArgOperand(1);
1158 unsigned Imm = cast<ConstantInt>(CI->getArgOperand(2))->getZExtValue();
1159 unsigned NumElts = CI->getType()->getVectorNumElements();
1160
1161 unsigned NumLaneElts = 128/CI->getType()->getScalarSizeInBits();
1162 unsigned HalfLaneElts = NumLaneElts / 2;
1163
1164 SmallVector<uint32_t, 16> Idxs(NumElts);
1165 for (unsigned i = 0; i != NumElts; ++i) {
1166 // Base index is the starting element of the lane.
1167 Idxs[i] = i - (i % NumLaneElts);
1168 // If we are half way through the lane switch to the other source.
1169 if ((i % NumLaneElts) >= HalfLaneElts)
1170 Idxs[i] += NumElts;
1171 // Now select the specific element. By adding HalfLaneElts bits from
1172 // the immediate. Wrapping around the immediate every 8-bits.
1173 Idxs[i] += (Imm >> ((i * HalfLaneElts) % 8)) & ((1 << HalfLaneElts) - 1);
1174 }
1175
1176 Rep = Builder.CreateShuffleVector(Op0, Op1, Idxs);
1177
1178 Rep = EmitX86Select(Builder, CI->getArgOperand(4), Rep,
1179 CI->getArgOperand(3));
Craig Topper5aebb862016-07-04 20:56:38 +00001180 } else if (IsX86 && (Name.startswith("avx512.mask.movddup") ||
1181 Name.startswith("avx512.mask.movshdup") ||
1182 Name.startswith("avx512.mask.movsldup"))) {
Simon Pilgrim19adee92016-07-02 14:42:35 +00001183 Value *Op0 = CI->getArgOperand(0);
1184 unsigned NumElts = CI->getType()->getVectorNumElements();
1185 unsigned NumLaneElts = 128/CI->getType()->getScalarSizeInBits();
1186
1187 unsigned Offset = 0;
Craig Topper5aebb862016-07-04 20:56:38 +00001188 if (Name.startswith("avx512.mask.movshdup."))
Simon Pilgrim19adee92016-07-02 14:42:35 +00001189 Offset = 1;
1190
1191 SmallVector<uint32_t, 16> Idxs(NumElts);
1192 for (unsigned l = 0; l != NumElts; l += NumLaneElts)
1193 for (unsigned i = 0; i != NumLaneElts; i += 2) {
1194 Idxs[i + l + 0] = i + l + Offset;
1195 Idxs[i + l + 1] = i + l + Offset;
1196 }
1197
1198 Rep = Builder.CreateShuffleVector(Op0, Op0, Idxs);
1199
1200 Rep = EmitX86Select(Builder, CI->getArgOperand(2), Rep,
1201 CI->getArgOperand(1));
Craig Topper5aebb862016-07-04 20:56:38 +00001202 } else if (IsX86 && (Name.startswith("avx512.mask.punpckl") ||
1203 Name.startswith("avx512.mask.unpckl."))) {
Craig Topper597aa422016-06-23 07:37:33 +00001204 Value *Op0 = CI->getArgOperand(0);
1205 Value *Op1 = CI->getArgOperand(1);
1206 int NumElts = CI->getType()->getVectorNumElements();
1207 int NumLaneElts = 128/CI->getType()->getScalarSizeInBits();
1208
1209 SmallVector<uint32_t, 64> Idxs(NumElts);
1210 for (int l = 0; l != NumElts; l += NumLaneElts)
1211 for (int i = 0; i != NumLaneElts; ++i)
1212 Idxs[i + l] = l + (i / 2) + NumElts * (i % 2);
1213
1214 Rep = Builder.CreateShuffleVector(Op0, Op1, Idxs);
1215
1216 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1217 CI->getArgOperand(2));
Craig Topper5aebb862016-07-04 20:56:38 +00001218 } else if (IsX86 && (Name.startswith("avx512.mask.punpckh") ||
1219 Name.startswith("avx512.mask.unpckh."))) {
Craig Topper597aa422016-06-23 07:37:33 +00001220 Value *Op0 = CI->getArgOperand(0);
1221 Value *Op1 = CI->getArgOperand(1);
1222 int NumElts = CI->getType()->getVectorNumElements();
1223 int NumLaneElts = 128/CI->getType()->getScalarSizeInBits();
1224
1225 SmallVector<uint32_t, 64> Idxs(NumElts);
1226 for (int l = 0; l != NumElts; l += NumLaneElts)
1227 for (int i = 0; i != NumLaneElts; ++i)
1228 Idxs[i + l] = (NumLaneElts / 2) + l + (i / 2) + NumElts * (i % 2);
1229
1230 Rep = Builder.CreateShuffleVector(Op0, Op1, Idxs);
1231
1232 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1233 CI->getArgOperand(2));
Craig Toppera6e6feb2016-07-12 05:27:53 +00001234 } else if (IsX86 && Name.startswith("avx512.mask.pand.")) {
1235 Rep = Builder.CreateAnd(CI->getArgOperand(0), CI->getArgOperand(1));
1236 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1237 CI->getArgOperand(2));
1238 } else if (IsX86 && Name.startswith("avx512.mask.pandn.")) {
1239 Rep = Builder.CreateAnd(Builder.CreateNot(CI->getArgOperand(0)),
1240 CI->getArgOperand(1));
1241 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1242 CI->getArgOperand(2));
1243 } else if (IsX86 && Name.startswith("avx512.mask.por.")) {
1244 Rep = Builder.CreateOr(CI->getArgOperand(0), CI->getArgOperand(1));
1245 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1246 CI->getArgOperand(2));
1247 } else if (IsX86 && Name.startswith("avx512.mask.pxor.")) {
1248 Rep = Builder.CreateXor(CI->getArgOperand(0), CI->getArgOperand(1));
1249 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1250 CI->getArgOperand(2));
Craig Toppere75c4952016-09-02 05:29:17 +00001251 } else if (IsX86 && Name.startswith("avx512.mask.and.")) {
1252 VectorType *FTy = cast<VectorType>(CI->getType());
1253 VectorType *ITy = VectorType::getInteger(FTy);
1254 Rep = Builder.CreateAnd(Builder.CreateBitCast(CI->getArgOperand(0), ITy),
1255 Builder.CreateBitCast(CI->getArgOperand(1), ITy));
1256 Rep = Builder.CreateBitCast(Rep, FTy);
1257 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1258 CI->getArgOperand(2));
1259 } else if (IsX86 && Name.startswith("avx512.mask.andn.")) {
1260 VectorType *FTy = cast<VectorType>(CI->getType());
1261 VectorType *ITy = VectorType::getInteger(FTy);
1262 Rep = Builder.CreateNot(Builder.CreateBitCast(CI->getArgOperand(0), ITy));
1263 Rep = Builder.CreateAnd(Rep,
1264 Builder.CreateBitCast(CI->getArgOperand(1), ITy));
1265 Rep = Builder.CreateBitCast(Rep, FTy);
1266 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1267 CI->getArgOperand(2));
1268 } else if (IsX86 && Name.startswith("avx512.mask.or.")) {
1269 VectorType *FTy = cast<VectorType>(CI->getType());
1270 VectorType *ITy = VectorType::getInteger(FTy);
1271 Rep = Builder.CreateOr(Builder.CreateBitCast(CI->getArgOperand(0), ITy),
1272 Builder.CreateBitCast(CI->getArgOperand(1), ITy));
1273 Rep = Builder.CreateBitCast(Rep, FTy);
1274 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1275 CI->getArgOperand(2));
1276 } else if (IsX86 && Name.startswith("avx512.mask.xor.")) {
1277 VectorType *FTy = cast<VectorType>(CI->getType());
1278 VectorType *ITy = VectorType::getInteger(FTy);
1279 Rep = Builder.CreateXor(Builder.CreateBitCast(CI->getArgOperand(0), ITy),
1280 Builder.CreateBitCast(CI->getArgOperand(1), ITy));
1281 Rep = Builder.CreateBitCast(Rep, FTy);
1282 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1283 CI->getArgOperand(2));
Craig Topperaf0d63d2016-09-04 02:09:53 +00001284 } else if (IsX86 && Name.startswith("avx512.mask.padd.")) {
1285 Rep = Builder.CreateAdd(CI->getArgOperand(0), CI->getArgOperand(1));
1286 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1287 CI->getArgOperand(2));
1288 } else if (IsX86 && Name.startswith("avx512.mask.psub.")) {
1289 Rep = Builder.CreateSub(CI->getArgOperand(0), CI->getArgOperand(1));
1290 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1291 CI->getArgOperand(2));
1292 } else if (IsX86 && Name.startswith("avx512.mask.pmull.")) {
1293 Rep = Builder.CreateMul(CI->getArgOperand(0), CI->getArgOperand(1));
1294 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1295 CI->getArgOperand(2));
Craig Topper41773452016-09-04 18:13:33 +00001296 } else if (IsX86 && (Name.startswith("avx512.mask.add.pd.128") ||
1297 Name.startswith("avx512.mask.add.pd.256") ||
1298 Name.startswith("avx512.mask.add.ps.128") ||
1299 Name.startswith("avx512.mask.add.ps.256"))) {
1300 Rep = Builder.CreateFAdd(CI->getArgOperand(0), CI->getArgOperand(1));
1301 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1302 CI->getArgOperand(2));
1303 } else if (IsX86 && (Name.startswith("avx512.mask.div.pd.128") ||
1304 Name.startswith("avx512.mask.div.pd.256") ||
1305 Name.startswith("avx512.mask.div.ps.128") ||
1306 Name.startswith("avx512.mask.div.ps.256"))) {
1307 Rep = Builder.CreateFDiv(CI->getArgOperand(0), CI->getArgOperand(1));
1308 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1309 CI->getArgOperand(2));
1310 } else if (IsX86 && (Name.startswith("avx512.mask.mul.pd.128") ||
1311 Name.startswith("avx512.mask.mul.pd.256") ||
1312 Name.startswith("avx512.mask.mul.ps.128") ||
1313 Name.startswith("avx512.mask.mul.ps.256"))) {
1314 Rep = Builder.CreateFMul(CI->getArgOperand(0), CI->getArgOperand(1));
1315 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1316 CI->getArgOperand(2));
1317 } else if (IsX86 && (Name.startswith("avx512.mask.sub.pd.128") ||
1318 Name.startswith("avx512.mask.sub.pd.256") ||
1319 Name.startswith("avx512.mask.sub.ps.128") ||
1320 Name.startswith("avx512.mask.sub.ps.256"))) {
1321 Rep = Builder.CreateFSub(CI->getArgOperand(0), CI->getArgOperand(1));
1322 Rep = EmitX86Select(Builder, CI->getArgOperand(3), Rep,
1323 CI->getArgOperand(2));
Craig Topper3b1817d2012-02-03 06:10:55 +00001324 } else {
Craig Topper8a105052016-06-12 03:10:47 +00001325 llvm_unreachable("Unknown function for CallInst upgrade.");
Craig Topper3b1817d2012-02-03 06:10:55 +00001326 }
1327
Tim Shen00127562016-04-08 21:26:31 +00001328 if (Rep)
1329 CI->replaceAllUsesWith(Rep);
Craig Topper3b1817d2012-02-03 06:10:55 +00001330 CI->eraseFromParent();
1331 return;
1332 }
1333
Yaron Kerend1fdbe72015-03-30 16:10:39 +00001334 std::string Name = CI->getName();
Adrian Prantl87b7eb92014-10-01 18:55:02 +00001335 if (!Name.empty())
1336 CI->setName(Name + ".old");
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001337
Chandler Carruth58a71ed2011-12-12 04:26:04 +00001338 switch (NewFn->getIntrinsicID()) {
1339 default:
Chris Lattner0bcbde42011-11-27 08:42:07 +00001340 llvm_unreachable("Unknown function for CallInst upgrade.");
Chandler Carruth58a71ed2011-12-12 04:26:04 +00001341
Craig Topperf7bf6de2016-07-08 06:14:47 +00001342 case Intrinsic::x86_avx512_mask_psll_di_512:
1343 case Intrinsic::x86_avx512_mask_psra_di_512:
1344 case Intrinsic::x86_avx512_mask_psrl_di_512:
1345 case Intrinsic::x86_avx512_mask_psll_qi_512:
1346 case Intrinsic::x86_avx512_mask_psra_qi_512:
1347 case Intrinsic::x86_avx512_mask_psrl_qi_512:
Jeroen Ketemaab99b592015-09-30 10:56:37 +00001348 case Intrinsic::arm_neon_vld1:
1349 case Intrinsic::arm_neon_vld2:
1350 case Intrinsic::arm_neon_vld3:
1351 case Intrinsic::arm_neon_vld4:
1352 case Intrinsic::arm_neon_vld2lane:
1353 case Intrinsic::arm_neon_vld3lane:
1354 case Intrinsic::arm_neon_vld4lane:
1355 case Intrinsic::arm_neon_vst1:
1356 case Intrinsic::arm_neon_vst2:
1357 case Intrinsic::arm_neon_vst3:
1358 case Intrinsic::arm_neon_vst4:
1359 case Intrinsic::arm_neon_vst2lane:
1360 case Intrinsic::arm_neon_vst3lane:
1361 case Intrinsic::arm_neon_vst4lane: {
1362 SmallVector<Value *, 4> Args(CI->arg_operands().begin(),
1363 CI->arg_operands().end());
1364 CI->replaceAllUsesWith(Builder.CreateCall(NewFn, Args));
1365 CI->eraseFromParent();
1366 return;
1367 }
1368
Chandler Carruth58a71ed2011-12-12 04:26:04 +00001369 case Intrinsic::ctlz:
Nuno Lopesad40c0a2012-05-22 15:25:31 +00001370 case Intrinsic::cttz:
Chandler Carruth58a71ed2011-12-12 04:26:04 +00001371 assert(CI->getNumArgOperands() == 1 &&
1372 "Mismatch between function args and call args");
David Blaikieff6409d2015-05-18 22:13:54 +00001373 CI->replaceAllUsesWith(Builder.CreateCall(
1374 NewFn, {CI->getArgOperand(0), Builder.getFalse()}, Name));
Chandler Carruth58a71ed2011-12-12 04:26:04 +00001375 CI->eraseFromParent();
1376 return;
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001377
Matt Arsenaultfbcbce42013-10-07 18:06:48 +00001378 case Intrinsic::objectsize:
David Blaikieff6409d2015-05-18 22:13:54 +00001379 CI->replaceAllUsesWith(Builder.CreateCall(
1380 NewFn, {CI->getArgOperand(0), CI->getArgOperand(1)}, Name));
Matt Arsenaultfbcbce42013-10-07 18:06:48 +00001381 CI->eraseFromParent();
1382 return;
1383
Joel Jonesb84f7be2012-07-18 00:02:16 +00001384 case Intrinsic::ctpop: {
David Blaikieff6409d2015-05-18 22:13:54 +00001385 CI->replaceAllUsesWith(Builder.CreateCall(NewFn, {CI->getArgOperand(0)}));
Joel Jonesb84f7be2012-07-18 00:02:16 +00001386 CI->eraseFromParent();
1387 return;
1388 }
Joel Jones43cb8782012-07-13 23:25:25 +00001389
Craig Topper71dc02d2012-06-13 07:18:53 +00001390 case Intrinsic::x86_xop_vfrcz_ss:
1391 case Intrinsic::x86_xop_vfrcz_sd:
David Blaikieff6409d2015-05-18 22:13:54 +00001392 CI->replaceAllUsesWith(
1393 Builder.CreateCall(NewFn, {CI->getArgOperand(1)}, Name));
Craig Topper71dc02d2012-06-13 07:18:53 +00001394 CI->eraseFromParent();
1395 return;
1396
Simon Pilgrime85506b2016-06-03 08:06:03 +00001397 case Intrinsic::x86_xop_vpermil2pd:
1398 case Intrinsic::x86_xop_vpermil2ps:
1399 case Intrinsic::x86_xop_vpermil2pd_256:
1400 case Intrinsic::x86_xop_vpermil2ps_256: {
1401 SmallVector<Value *, 4> Args(CI->arg_operands().begin(),
1402 CI->arg_operands().end());
1403 VectorType *FltIdxTy = cast<VectorType>(Args[2]->getType());
1404 VectorType *IntIdxTy = VectorType::getInteger(FltIdxTy);
1405 Args[2] = Builder.CreateBitCast(Args[2], IntIdxTy);
1406 CI->replaceAllUsesWith(Builder.CreateCall(NewFn, Args, Name));
1407 CI->eraseFromParent();
1408 return;
1409 }
1410
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001411 case Intrinsic::x86_sse41_ptestc:
1412 case Intrinsic::x86_sse41_ptestz:
Craig Topper71dc02d2012-06-13 07:18:53 +00001413 case Intrinsic::x86_sse41_ptestnzc: {
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001414 // The arguments for these intrinsics used to be v4f32, and changed
1415 // to v2i64. This is purely a nop, since those are bitwise intrinsics.
1416 // So, the only thing required is a bitcast for both arguments.
1417 // First, check the arguments have the old type.
1418 Value *Arg0 = CI->getArgOperand(0);
1419 if (Arg0->getType() != VectorType::get(Type::getFloatTy(C), 4))
1420 return;
1421
1422 // Old intrinsic, add bitcasts
1423 Value *Arg1 = CI->getArgOperand(1);
1424
David Blaikie5bacf372015-04-24 21:16:07 +00001425 Type *NewVecTy = VectorType::get(Type::getInt64Ty(C), 2);
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001426
David Blaikie5bacf372015-04-24 21:16:07 +00001427 Value *BC0 = Builder.CreateBitCast(Arg0, NewVecTy, "cast");
1428 Value *BC1 = Builder.CreateBitCast(Arg1, NewVecTy, "cast");
1429
David Blaikieff6409d2015-05-18 22:13:54 +00001430 CallInst *NewCall = Builder.CreateCall(NewFn, {BC0, BC1}, Name);
Nadav Rotem17ee58a2012-06-10 18:42:51 +00001431 CI->replaceAllUsesWith(NewCall);
1432 CI->eraseFromParent();
1433 return;
Evan Cheng0e179d02007-12-17 22:33:23 +00001434 }
Chandler Carruth373b2b12014-09-06 10:00:01 +00001435
Chandler Carruth373b2b12014-09-06 10:00:01 +00001436 case Intrinsic::x86_sse41_insertps:
1437 case Intrinsic::x86_sse41_dppd:
1438 case Intrinsic::x86_sse41_dpps:
1439 case Intrinsic::x86_sse41_mpsadbw:
Chandler Carruth373b2b12014-09-06 10:00:01 +00001440 case Intrinsic::x86_avx_dp_ps_256:
Chandler Carruth373b2b12014-09-06 10:00:01 +00001441 case Intrinsic::x86_avx2_mpsadbw: {
1442 // Need to truncate the last argument from i32 to i8 -- this argument models
1443 // an inherently 8-bit immediate operand to these x86 instructions.
1444 SmallVector<Value *, 4> Args(CI->arg_operands().begin(),
1445 CI->arg_operands().end());
1446
1447 // Replace the last argument with a trunc.
1448 Args.back() = Builder.CreateTrunc(Args.back(), Type::getInt8Ty(C), "trunc");
1449
1450 CallInst *NewCall = Builder.CreateCall(NewFn, Args);
1451 CI->replaceAllUsesWith(NewCall);
1452 CI->eraseFromParent();
1453 return;
1454 }
Marcin Koscielnicki3fdc2572016-04-19 20:51:05 +00001455
1456 case Intrinsic::thread_pointer: {
1457 CI->replaceAllUsesWith(Builder.CreateCall(NewFn, {}));
1458 CI->eraseFromParent();
1459 return;
1460 }
Artur Pilipenko7ad95ec2016-06-28 18:27:25 +00001461
Mehdi Amini8c629ec2016-08-13 23:31:24 +00001462 case Intrinsic::invariant_start:
1463 case Intrinsic::invariant_end:
Artur Pilipenko7ad95ec2016-06-28 18:27:25 +00001464 case Intrinsic::masked_load:
1465 case Intrinsic::masked_store: {
1466 SmallVector<Value *, 4> Args(CI->arg_operands().begin(),
1467 CI->arg_operands().end());
1468 CI->replaceAllUsesWith(Builder.CreateCall(NewFn, Args));
1469 CI->eraseFromParent();
1470 return;
1471 }
Craig Topper71dc02d2012-06-13 07:18:53 +00001472 }
Chandler Carruth7132e002007-08-04 01:51:18 +00001473}
1474
Sanjay Patelfdf0d5f2016-04-18 19:11:57 +00001475void llvm::UpgradeCallsToIntrinsic(Function *F) {
Chandler Carruth7132e002007-08-04 01:51:18 +00001476 assert(F && "Illegal attempt to upgrade a non-existent intrinsic.");
1477
Sanjay Patelfdf0d5f2016-04-18 19:11:57 +00001478 // Check if this function should be upgraded and get the replacement function
1479 // if there is one.
Chris Lattner80ed9dc2011-06-18 06:05:24 +00001480 Function *NewFn;
Evan Cheng0e179d02007-12-17 22:33:23 +00001481 if (UpgradeIntrinsicFunction(F, NewFn)) {
Sanjay Patelfdf0d5f2016-04-18 19:11:57 +00001482 // Replace all users of the old function with the new function or new
1483 // instructions. This is not a range loop because the call is deleted.
1484 for (auto UI = F->user_begin(), UE = F->user_end(); UI != UE; )
Duncan P. N. Exon Smith93f53c42016-04-17 03:59:37 +00001485 if (CallInst *CI = dyn_cast<CallInst>(*UI++))
Filipe Cabecinhas0011c582015-07-03 20:12:01 +00001486 UpgradeIntrinsicCall(CI, NewFn);
Sanjay Patelfdf0d5f2016-04-18 19:11:57 +00001487
Filipe Cabecinhas0011c582015-07-03 20:12:01 +00001488 // Remove old function, no longer used, from the module.
1489 F->eraseFromParent();
Chandler Carruth7132e002007-08-04 01:51:18 +00001490 }
1491}
Devang Patel80ae3492009-08-28 23:24:31 +00001492
Mehdi Aminie4709272016-09-14 22:29:59 +00001493MDNode *llvm::UpgradeTBAANode(MDNode &MD) {
Manman Ren209b17c2013-09-28 00:22:27 +00001494 // Check if the tag uses struct-path aware TBAA format.
Mehdi Aminie4709272016-09-14 22:29:59 +00001495 if (isa<MDNode>(MD.getOperand(0)) && MD.getNumOperands() >= 3)
1496 return &MD;
Manman Ren209b17c2013-09-28 00:22:27 +00001497
Mehdi Aminie4709272016-09-14 22:29:59 +00001498 auto &Context = MD.getContext();
1499 if (MD.getNumOperands() == 3) {
1500 Metadata *Elts[] = {MD.getOperand(0), MD.getOperand(1)};
1501 MDNode *ScalarType = MDNode::get(Context, Elts);
Manman Ren209b17c2013-09-28 00:22:27 +00001502 // Create a MDNode <ScalarType, ScalarType, offset 0, const>
Duncan P. N. Exon Smith5bf8fef2014-12-09 18:38:53 +00001503 Metadata *Elts2[] = {ScalarType, ScalarType,
Mehdi Aminie4709272016-09-14 22:29:59 +00001504 ConstantAsMetadata::get(
1505 Constant::getNullValue(Type::getInt64Ty(Context))),
1506 MD.getOperand(2)};
1507 return MDNode::get(Context, Elts2);
Manman Ren209b17c2013-09-28 00:22:27 +00001508 }
Mehdi Aminie4709272016-09-14 22:29:59 +00001509 // Create a MDNode <MD, MD, offset 0>
1510 Metadata *Elts[] = {&MD, &MD, ConstantAsMetadata::get(Constant::getNullValue(
1511 Type::getInt64Ty(Context)))};
1512 return MDNode::get(Context, Elts);
Manman Ren209b17c2013-09-28 00:22:27 +00001513}
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001514
1515Instruction *llvm::UpgradeBitCastInst(unsigned Opc, Value *V, Type *DestTy,
1516 Instruction *&Temp) {
1517 if (Opc != Instruction::BitCast)
Craig Topperc6207612014-04-09 06:08:46 +00001518 return nullptr;
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001519
Craig Topperc6207612014-04-09 06:08:46 +00001520 Temp = nullptr;
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001521 Type *SrcTy = V->getType();
1522 if (SrcTy->isPtrOrPtrVectorTy() && DestTy->isPtrOrPtrVectorTy() &&
1523 SrcTy->getPointerAddressSpace() != DestTy->getPointerAddressSpace()) {
1524 LLVMContext &Context = V->getContext();
1525
1526 // We have no information about target data layout, so we assume that
1527 // the maximum pointer size is 64bit.
1528 Type *MidTy = Type::getInt64Ty(Context);
1529 Temp = CastInst::Create(Instruction::PtrToInt, V, MidTy);
1530
1531 return CastInst::Create(Instruction::IntToPtr, Temp, DestTy);
1532 }
1533
Craig Topperc6207612014-04-09 06:08:46 +00001534 return nullptr;
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001535}
1536
1537Value *llvm::UpgradeBitCastExpr(unsigned Opc, Constant *C, Type *DestTy) {
1538 if (Opc != Instruction::BitCast)
Craig Topperc6207612014-04-09 06:08:46 +00001539 return nullptr;
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001540
1541 Type *SrcTy = C->getType();
1542 if (SrcTy->isPtrOrPtrVectorTy() && DestTy->isPtrOrPtrVectorTy() &&
1543 SrcTy->getPointerAddressSpace() != DestTy->getPointerAddressSpace()) {
1544 LLVMContext &Context = C->getContext();
1545
1546 // We have no information about target data layout, so we assume that
1547 // the maximum pointer size is 64bit.
1548 Type *MidTy = Type::getInt64Ty(Context);
1549
1550 return ConstantExpr::getIntToPtr(ConstantExpr::getPtrToInt(C, MidTy),
1551 DestTy);
1552 }
1553
Craig Topperc6207612014-04-09 06:08:46 +00001554 return nullptr;
Matt Arsenaultb03bd4d2013-11-15 01:34:59 +00001555}
Manman Ren8b4306c2013-12-02 21:29:56 +00001556
1557/// Check the debug info version number, if it is out-dated, drop the debug
1558/// info. Return true if module is modified.
1559bool llvm::UpgradeDebugInfo(Module &M) {
Manman Ren2ebfb422014-01-16 01:51:12 +00001560 unsigned Version = getDebugMetadataVersionFromModule(M);
1561 if (Version == DEBUG_METADATA_VERSION)
Manman Ren8b4306c2013-12-02 21:29:56 +00001562 return false;
1563
Manman Ren2ebfb422014-01-16 01:51:12 +00001564 bool RetCode = StripDebugInfo(M);
1565 if (RetCode) {
1566 DiagnosticInfoDebugMetadataVersion DiagVersion(M, Version);
1567 M.getContext().diagnose(DiagVersion);
1568 }
1569 return RetCode;
Manman Ren8b4306c2013-12-02 21:29:56 +00001570}
Eli Bendersky5d5e18d2014-06-25 15:41:00 +00001571
Manman Renb5d7ff42016-05-25 23:14:48 +00001572bool llvm::UpgradeModuleFlags(Module &M) {
1573 const NamedMDNode *ModFlags = M.getModuleFlagsMetadata();
1574 if (!ModFlags)
1575 return false;
1576
1577 bool HasObjCFlag = false, HasClassProperties = false;
1578 for (unsigned I = 0, E = ModFlags->getNumOperands(); I != E; ++I) {
1579 MDNode *Op = ModFlags->getOperand(I);
1580 if (Op->getNumOperands() < 2)
1581 continue;
1582 MDString *ID = dyn_cast_or_null<MDString>(Op->getOperand(1));
1583 if (!ID)
1584 continue;
1585 if (ID->getString() == "Objective-C Image Info Version")
1586 HasObjCFlag = true;
1587 if (ID->getString() == "Objective-C Class Properties")
1588 HasClassProperties = true;
1589 }
1590 // "Objective-C Class Properties" is recently added for Objective-C. We
1591 // upgrade ObjC bitcodes to contain a "Objective-C Class Properties" module
Mehdi Aminib53b62e2016-09-16 00:38:18 +00001592 // flag of value 0, so we can correclty downgrade this flag when trying to
1593 // link an ObjC bitcode without this module flag with an ObjC bitcode with
1594 // this module flag.
Manman Renb5d7ff42016-05-25 23:14:48 +00001595 if (HasObjCFlag && !HasClassProperties) {
Mehdi Aminib53b62e2016-09-16 00:38:18 +00001596 M.addModuleFlag(llvm::Module::Override, "Objective-C Class Properties",
Manman Renb5d7ff42016-05-25 23:14:48 +00001597 (uint32_t)0);
1598 return true;
1599 }
1600 return false;
1601}
1602
Duncan P. N. Exon Smithefe16c82016-03-25 00:56:13 +00001603static bool isOldLoopArgument(Metadata *MD) {
1604 auto *T = dyn_cast_or_null<MDTuple>(MD);
1605 if (!T)
1606 return false;
1607 if (T->getNumOperands() < 1)
1608 return false;
1609 auto *S = dyn_cast_or_null<MDString>(T->getOperand(0));
1610 if (!S)
1611 return false;
1612 return S->getString().startswith("llvm.vectorizer.");
1613}
1614
1615static MDString *upgradeLoopTag(LLVMContext &C, StringRef OldTag) {
1616 StringRef OldPrefix = "llvm.vectorizer.";
1617 assert(OldTag.startswith(OldPrefix) && "Expected old prefix");
1618
1619 if (OldTag == "llvm.vectorizer.unroll")
1620 return MDString::get(C, "llvm.loop.interleave.count");
1621
1622 return MDString::get(
1623 C, (Twine("llvm.loop.vectorize.") + OldTag.drop_front(OldPrefix.size()))
1624 .str());
1625}
1626
1627static Metadata *upgradeLoopArgument(Metadata *MD) {
1628 auto *T = dyn_cast_or_null<MDTuple>(MD);
1629 if (!T)
1630 return MD;
1631 if (T->getNumOperands() < 1)
1632 return MD;
1633 auto *OldTag = dyn_cast_or_null<MDString>(T->getOperand(0));
1634 if (!OldTag)
1635 return MD;
1636 if (!OldTag->getString().startswith("llvm.vectorizer."))
1637 return MD;
1638
1639 // This has an old tag. Upgrade it.
1640 SmallVector<Metadata *, 8> Ops;
1641 Ops.reserve(T->getNumOperands());
1642 Ops.push_back(upgradeLoopTag(T->getContext(), OldTag->getString()));
1643 for (unsigned I = 1, E = T->getNumOperands(); I != E; ++I)
1644 Ops.push_back(T->getOperand(I));
1645
1646 return MDTuple::get(T->getContext(), Ops);
1647}
1648
1649MDNode *llvm::upgradeInstructionLoopAttachment(MDNode &N) {
1650 auto *T = dyn_cast<MDTuple>(&N);
1651 if (!T)
1652 return &N;
1653
David Majnemer0a16c222016-08-11 21:15:00 +00001654 if (none_of(T->operands(), isOldLoopArgument))
Duncan P. N. Exon Smithefe16c82016-03-25 00:56:13 +00001655 return &N;
1656
1657 SmallVector<Metadata *, 8> Ops;
1658 Ops.reserve(T->getNumOperands());
1659 for (Metadata *MD : T->operands())
1660 Ops.push_back(upgradeLoopArgument(MD));
1661
1662 return MDTuple::get(T->getContext(), Ops);
Eli Bendersky5d5e18d2014-06-25 15:41:00 +00001663}