blob: 2c8fb8b89697bb3437d319b28d6f2c07a047de1a [file] [log] [blame]
Meador Inge5e890452012-10-13 16:45:24 +00001//===------ SimplifyLibCalls.cpp - Library calls simplifier ---------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This is a utility pass used for testing the InstructionSimplify analysis.
11// The analysis is applied to every instruction, and if it simplifies then the
12// instruction is replaced by the simplification. If you are looking for a pass
13// that performs serious instruction folding, use the instcombine pass instead.
14//
15//===----------------------------------------------------------------------===//
16
17#include "llvm/Transforms/Utils/SimplifyLibCalls.h"
18#include "llvm/DataLayout.h"
19#include "llvm/ADT/StringMap.h"
20#include "llvm/Analysis/ValueTracking.h"
21#include "llvm/Function.h"
22#include "llvm/IRBuilder.h"
23#include "llvm/LLVMContext.h"
24#include "llvm/Target/TargetLibraryInfo.h"
25#include "llvm/Transforms/Utils/BuildLibCalls.h"
26
27using namespace llvm;
28
29/// This class is the abstract base class for the set of optimizations that
30/// corresponds to one library call.
31namespace {
32class LibCallOptimization {
33protected:
34 Function *Caller;
35 const DataLayout *TD;
36 const TargetLibraryInfo *TLI;
37 LLVMContext* Context;
38public:
39 LibCallOptimization() { }
40 virtual ~LibCallOptimization() {}
41
42 /// callOptimizer - This pure virtual method is implemented by base classes to
43 /// do various optimizations. If this returns null then no transformation was
44 /// performed. If it returns CI, then it transformed the call and CI is to be
45 /// deleted. If it returns something else, replace CI with the new value and
46 /// delete CI.
47 virtual Value *callOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B)
48 =0;
49
50 Value *optimizeCall(CallInst *CI, const DataLayout *TD,
51 const TargetLibraryInfo *TLI, IRBuilder<> &B) {
52 Caller = CI->getParent()->getParent();
53 this->TD = TD;
54 this->TLI = TLI;
55 if (CI->getCalledFunction())
56 Context = &CI->getCalledFunction()->getContext();
57
58 // We never change the calling convention.
59 if (CI->getCallingConv() != llvm::CallingConv::C)
60 return NULL;
61
62 return callOptimizer(CI->getCalledFunction(), CI, B);
63 }
64};
65
66//===----------------------------------------------------------------------===//
67// Fortified Library Call Optimizations
68//===----------------------------------------------------------------------===//
69
70struct FortifiedLibCallOptimization : public LibCallOptimization {
71protected:
72 virtual bool isFoldable(unsigned SizeCIOp, unsigned SizeArgOp,
73 bool isString) const = 0;
74};
75
76struct InstFortifiedLibCallOptimization : public FortifiedLibCallOptimization {
77 CallInst *CI;
78
79 bool isFoldable(unsigned SizeCIOp, unsigned SizeArgOp, bool isString) const {
80 if (CI->getArgOperand(SizeCIOp) == CI->getArgOperand(SizeArgOp))
81 return true;
82 if (ConstantInt *SizeCI =
83 dyn_cast<ConstantInt>(CI->getArgOperand(SizeCIOp))) {
84 if (SizeCI->isAllOnesValue())
85 return true;
86 if (isString) {
87 uint64_t Len = GetStringLength(CI->getArgOperand(SizeArgOp));
88 // If the length is 0 we don't know how long it is and so we can't
89 // remove the check.
90 if (Len == 0) return false;
91 return SizeCI->getZExtValue() >= Len;
92 }
93 if (ConstantInt *Arg = dyn_cast<ConstantInt>(
94 CI->getArgOperand(SizeArgOp)))
95 return SizeCI->getZExtValue() >= Arg->getZExtValue();
96 }
97 return false;
98 }
99};
100
101struct MemCpyChkOpt : public InstFortifiedLibCallOptimization {
102 virtual Value *callOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
103 this->CI = CI;
104 FunctionType *FT = Callee->getFunctionType();
105 LLVMContext &Context = CI->getParent()->getContext();
106
107 // Check if this has the right signature.
108 if (FT->getNumParams() != 4 || FT->getReturnType() != FT->getParamType(0) ||
109 !FT->getParamType(0)->isPointerTy() ||
110 !FT->getParamType(1)->isPointerTy() ||
111 FT->getParamType(2) != TD->getIntPtrType(Context) ||
112 FT->getParamType(3) != TD->getIntPtrType(Context))
113 return 0;
114
115 if (isFoldable(3, 2, false)) {
116 B.CreateMemCpy(CI->getArgOperand(0), CI->getArgOperand(1),
117 CI->getArgOperand(2), 1);
118 return CI->getArgOperand(0);
119 }
120 return 0;
121 }
122};
123
124struct MemMoveChkOpt : public InstFortifiedLibCallOptimization {
125 virtual Value *callOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
126 this->CI = CI;
127 FunctionType *FT = Callee->getFunctionType();
128 LLVMContext &Context = CI->getParent()->getContext();
129
130 // Check if this has the right signature.
131 if (FT->getNumParams() != 4 || FT->getReturnType() != FT->getParamType(0) ||
132 !FT->getParamType(0)->isPointerTy() ||
133 !FT->getParamType(1)->isPointerTy() ||
134 FT->getParamType(2) != TD->getIntPtrType(Context) ||
135 FT->getParamType(3) != TD->getIntPtrType(Context))
136 return 0;
137
138 if (isFoldable(3, 2, false)) {
139 B.CreateMemMove(CI->getArgOperand(0), CI->getArgOperand(1),
140 CI->getArgOperand(2), 1);
141 return CI->getArgOperand(0);
142 }
143 return 0;
144 }
145};
146
147struct MemSetChkOpt : public InstFortifiedLibCallOptimization {
148 virtual Value *callOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
149 this->CI = CI;
150 FunctionType *FT = Callee->getFunctionType();
151 LLVMContext &Context = CI->getParent()->getContext();
152
153 // Check if this has the right signature.
154 if (FT->getNumParams() != 4 || FT->getReturnType() != FT->getParamType(0) ||
155 !FT->getParamType(0)->isPointerTy() ||
156 !FT->getParamType(1)->isIntegerTy() ||
157 FT->getParamType(2) != TD->getIntPtrType(Context) ||
158 FT->getParamType(3) != TD->getIntPtrType(Context))
159 return 0;
160
161 if (isFoldable(3, 2, false)) {
162 Value *Val = B.CreateIntCast(CI->getArgOperand(1), B.getInt8Ty(),
163 false);
164 B.CreateMemSet(CI->getArgOperand(0), Val, CI->getArgOperand(2), 1);
165 return CI->getArgOperand(0);
166 }
167 return 0;
168 }
169};
170
171struct StrCpyChkOpt : public InstFortifiedLibCallOptimization {
172 virtual Value *callOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
173 this->CI = CI;
174 StringRef Name = Callee->getName();
175 FunctionType *FT = Callee->getFunctionType();
176 LLVMContext &Context = CI->getParent()->getContext();
177
178 // Check if this has the right signature.
179 if (FT->getNumParams() != 3 ||
180 FT->getReturnType() != FT->getParamType(0) ||
181 FT->getParamType(0) != FT->getParamType(1) ||
182 FT->getParamType(0) != Type::getInt8PtrTy(Context) ||
183 FT->getParamType(2) != TD->getIntPtrType(Context))
184 return 0;
185
186 // If a) we don't have any length information, or b) we know this will
187 // fit then just lower to a plain st[rp]cpy. Otherwise we'll keep our
188 // st[rp]cpy_chk call which may fail at runtime if the size is too long.
189 // TODO: It might be nice to get a maximum length out of the possible
190 // string lengths for varying.
191 if (isFoldable(2, 1, true)) {
192 Value *Ret = EmitStrCpy(CI->getArgOperand(0), CI->getArgOperand(1), B, TD,
193 TLI, Name.substr(2, 6));
194 return Ret;
195 }
196 return 0;
197 }
198};
199
200struct StrNCpyChkOpt : public InstFortifiedLibCallOptimization {
201 virtual Value *callOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
202 this->CI = CI;
203 StringRef Name = Callee->getName();
204 FunctionType *FT = Callee->getFunctionType();
205 LLVMContext &Context = CI->getParent()->getContext();
206
207 // Check if this has the right signature.
208 if (FT->getNumParams() != 4 || FT->getReturnType() != FT->getParamType(0) ||
209 FT->getParamType(0) != FT->getParamType(1) ||
210 FT->getParamType(0) != Type::getInt8PtrTy(Context) ||
211 !FT->getParamType(2)->isIntegerTy() ||
212 FT->getParamType(3) != TD->getIntPtrType(Context))
213 return 0;
214
215 if (isFoldable(3, 2, false)) {
216 Value *Ret = EmitStrNCpy(CI->getArgOperand(0), CI->getArgOperand(1),
217 CI->getArgOperand(2), B, TD, TLI,
218 Name.substr(2, 7));
219 return Ret;
220 }
221 return 0;
222 }
223};
224
Meador Inge73d8a582012-10-13 16:45:32 +0000225//===----------------------------------------------------------------------===//
226// String and Memory Library Call Optimizations
227//===----------------------------------------------------------------------===//
228
229struct StrCatOpt : public LibCallOptimization {
230 virtual Value *callOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
231 // Verify the "strcat" function prototype.
232 FunctionType *FT = Callee->getFunctionType();
233 if (FT->getNumParams() != 2 ||
234 FT->getReturnType() != B.getInt8PtrTy() ||
235 FT->getParamType(0) != FT->getReturnType() ||
236 FT->getParamType(1) != FT->getReturnType())
237 return 0;
238
239 // Extract some information from the instruction
240 Value *Dst = CI->getArgOperand(0);
241 Value *Src = CI->getArgOperand(1);
242
243 // See if we can get the length of the input string.
244 uint64_t Len = GetStringLength(Src);
245 if (Len == 0) return 0;
246 --Len; // Unbias length.
247
248 // Handle the simple, do-nothing case: strcat(x, "") -> x
249 if (Len == 0)
250 return Dst;
251
252 // These optimizations require DataLayout.
253 if (!TD) return 0;
254
255 return emitStrLenMemCpy(Src, Dst, Len, B);
256 }
257
258 Value *emitStrLenMemCpy(Value *Src, Value *Dst, uint64_t Len,
259 IRBuilder<> &B) {
260 // We need to find the end of the destination string. That's where the
261 // memory is to be moved to. We just generate a call to strlen.
262 Value *DstLen = EmitStrLen(Dst, B, TD, TLI);
263 if (!DstLen)
264 return 0;
265
266 // Now that we have the destination's length, we must index into the
267 // destination's pointer to get the actual memcpy destination (end of
268 // the string .. we're concatenating).
269 Value *CpyDst = B.CreateGEP(Dst, DstLen, "endptr");
270
271 // We have enough information to now generate the memcpy call to do the
272 // concatenation for us. Make a memcpy to copy the nul byte with align = 1.
273 B.CreateMemCpy(CpyDst, Src,
274 ConstantInt::get(TD->getIntPtrType(*Context), Len + 1), 1);
275 return Dst;
276 }
277};
278
279struct StrNCatOpt : public StrCatOpt {
280 virtual Value *callOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
281 // Verify the "strncat" function prototype.
282 FunctionType *FT = Callee->getFunctionType();
283 if (FT->getNumParams() != 3 ||
284 FT->getReturnType() != B.getInt8PtrTy() ||
285 FT->getParamType(0) != FT->getReturnType() ||
286 FT->getParamType(1) != FT->getReturnType() ||
287 !FT->getParamType(2)->isIntegerTy())
288 return 0;
289
290 // Extract some information from the instruction
291 Value *Dst = CI->getArgOperand(0);
292 Value *Src = CI->getArgOperand(1);
293 uint64_t Len;
294
295 // We don't do anything if length is not constant
296 if (ConstantInt *LengthArg = dyn_cast<ConstantInt>(CI->getArgOperand(2)))
297 Len = LengthArg->getZExtValue();
298 else
299 return 0;
300
301 // See if we can get the length of the input string.
302 uint64_t SrcLen = GetStringLength(Src);
303 if (SrcLen == 0) return 0;
304 --SrcLen; // Unbias length.
305
306 // Handle the simple, do-nothing cases:
307 // strncat(x, "", c) -> x
308 // strncat(x, c, 0) -> x
309 if (SrcLen == 0 || Len == 0) return Dst;
310
311 // These optimizations require DataLayout.
312 if (!TD) return 0;
313
314 // We don't optimize this case
315 if (Len < SrcLen) return 0;
316
317 // strncat(x, s, c) -> strcat(x, s)
318 // s is constant so the strcat can be optimized further
319 return emitStrLenMemCpy(Src, Dst, SrcLen, B);
320 }
321};
322
Meador Inge5e890452012-10-13 16:45:24 +0000323} // End anonymous namespace.
324
325namespace llvm {
326
327class LibCallSimplifierImpl {
328 LibCallSimplifier *Simplifier;
329 const DataLayout *TD;
330 const TargetLibraryInfo *TLI;
331 StringMap<LibCallOptimization*> Optimizations;
332
333 // Fortified library call optimizations.
334 MemCpyChkOpt MemCpyChk;
335 MemMoveChkOpt MemMoveChk;
336 MemSetChkOpt MemSetChk;
337 StrCpyChkOpt StrCpyChk;
338 StrNCpyChkOpt StrNCpyChk;
339
Meador Inge73d8a582012-10-13 16:45:32 +0000340 // String and memory library call optimizations.
341 StrCatOpt StrCat;
342 StrNCatOpt StrNCat;
343
Meador Inge5e890452012-10-13 16:45:24 +0000344 void initOptimizations();
345public:
346 LibCallSimplifierImpl(const DataLayout *TD, const TargetLibraryInfo *TLI) {
347 this->TD = TD;
348 this->TLI = TLI;
349 }
350
351 Value *optimizeCall(CallInst *CI);
352};
353
354void LibCallSimplifierImpl::initOptimizations() {
355 // Fortified library call optimizations.
356 Optimizations["__memcpy_chk"] = &MemCpyChk;
357 Optimizations["__memmove_chk"] = &MemMoveChk;
358 Optimizations["__memset_chk"] = &MemSetChk;
359 Optimizations["__strcpy_chk"] = &StrCpyChk;
360 Optimizations["__stpcpy_chk"] = &StrCpyChk;
361 Optimizations["__strncpy_chk"] = &StrNCpyChk;
362 Optimizations["__stpncpy_chk"] = &StrNCpyChk;
Meador Inge73d8a582012-10-13 16:45:32 +0000363
364 // String and memory library call optimizations.
365 Optimizations["strcat"] = &StrCat;
366 Optimizations["strncat"] = &StrNCat;
Meador Inge5e890452012-10-13 16:45:24 +0000367}
368
369Value *LibCallSimplifierImpl::optimizeCall(CallInst *CI) {
370 if (Optimizations.empty())
371 initOptimizations();
372
373 Function *Callee = CI->getCalledFunction();
374 LibCallOptimization *LCO = Optimizations.lookup(Callee->getName());
375 if (LCO) {
376 IRBuilder<> Builder(CI);
377 return LCO->optimizeCall(CI, TD, TLI, Builder);
378 }
379 return 0;
380}
381
382LibCallSimplifier::LibCallSimplifier(const DataLayout *TD,
383 const TargetLibraryInfo *TLI) {
384 Impl = new LibCallSimplifierImpl(TD, TLI);
385}
386
387LibCallSimplifier::~LibCallSimplifier() {
388 delete Impl;
389}
390
391Value *LibCallSimplifier::optimizeCall(CallInst *CI) {
392 return Impl->optimizeCall(CI);
393}
394
395}