blob: 992c8b922f75dcf4ce0a9bb744dc0ef27ec33f1c [file] [log] [blame]
//===- Evaluator.cpp - LLVM IR evaluator ----------------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// Function evaluator for LLVM IR.
//
//===----------------------------------------------------------------------===//
13
14#include "llvm/Transforms/Utils/Evaluator.h"
Eugene Zelenko5adb96c2017-10-26 00:55:39 +000015#include "llvm/ADT/DenseMap.h"
16#include "llvm/ADT/STLExtras.h"
17#include "llvm/ADT/SmallPtrSet.h"
18#include "llvm/ADT/SmallVector.h"
Peter Collingbourne9f7ec142016-02-03 02:51:00 +000019#include "llvm/Analysis/ConstantFolding.h"
20#include "llvm/IR/BasicBlock.h"
21#include "llvm/IR/CallSite.h"
Eugene Zelenko5adb96c2017-10-26 00:55:39 +000022#include "llvm/IR/Constant.h"
Peter Collingbourne9f7ec142016-02-03 02:51:00 +000023#include "llvm/IR/Constants.h"
Craig Topperb5c2bfa2017-03-20 05:08:41 +000024#include "llvm/IR/DataLayout.h"
Peter Collingbourne9f7ec142016-02-03 02:51:00 +000025#include "llvm/IR/DerivedTypes.h"
Eugene Zelenko5adb96c2017-10-26 00:55:39 +000026#include "llvm/IR/Function.h"
Eugene Leviant6a572b82018-07-10 16:34:23 +000027#include "llvm/IR/GlobalAlias.h"
Eugene Zelenko5adb96c2017-10-26 00:55:39 +000028#include "llvm/IR/GlobalValue.h"
Peter Collingbourne9f7ec142016-02-03 02:51:00 +000029#include "llvm/IR/GlobalVariable.h"
Eugene Zelenko5adb96c2017-10-26 00:55:39 +000030#include "llvm/IR/InstrTypes.h"
31#include "llvm/IR/Instruction.h"
Peter Collingbourne9f7ec142016-02-03 02:51:00 +000032#include "llvm/IR/Instructions.h"
Chandler Carruth6bda14b2017-06-06 11:49:48 +000033#include "llvm/IR/IntrinsicInst.h"
Eugene Zelenko5adb96c2017-10-26 00:55:39 +000034#include "llvm/IR/Intrinsics.h"
Peter Collingbourne9f7ec142016-02-03 02:51:00 +000035#include "llvm/IR/Operator.h"
Eugene Zelenko5adb96c2017-10-26 00:55:39 +000036#include "llvm/IR/Type.h"
37#include "llvm/IR/User.h"
38#include "llvm/IR/Value.h"
39#include "llvm/Support/Casting.h"
Peter Collingbourne9f7ec142016-02-03 02:51:00 +000040#include "llvm/Support/Debug.h"
Peter Collingbourne83cc9812016-02-03 03:16:37 +000041#include "llvm/Support/raw_ostream.h"
Eugene Zelenko5adb96c2017-10-26 00:55:39 +000042#include <iterator>
Peter Collingbourne9f7ec142016-02-03 02:51:00 +000043
44#define DEBUG_TYPE "evaluator"
45
46using namespace llvm;
47
48static inline bool
49isSimpleEnoughValueToCommit(Constant *C,
50 SmallPtrSetImpl<Constant *> &SimpleConstants,
51 const DataLayout &DL);
52
53/// Return true if the specified constant can be handled by the code generator.
54/// We don't want to generate something like:
55/// void *X = &X/42;
56/// because the code generator doesn't have a relocation that can handle that.
57///
58/// This function should be called if C was not found (but just got inserted)
59/// in SimpleConstants to avoid having to rescan the same constants all the
60/// time.
61static bool
62isSimpleEnoughValueToCommitHelper(Constant *C,
63 SmallPtrSetImpl<Constant *> &SimpleConstants,
64 const DataLayout &DL) {
65 // Simple global addresses are supported, do not allow dllimport or
66 // thread-local globals.
67 if (auto *GV = dyn_cast<GlobalValue>(C))
68 return !GV->hasDLLImportStorageClass() && !GV->isThreadLocal();
69
70 // Simple integer, undef, constant aggregate zero, etc are all supported.
71 if (C->getNumOperands() == 0 || isa<BlockAddress>(C))
72 return true;
73
74 // Aggregate values are safe if all their elements are.
Duncan P. N. Exon Smith1de3c7e2016-04-05 21:10:45 +000075 if (isa<ConstantAggregate>(C)) {
Peter Collingbourne9f7ec142016-02-03 02:51:00 +000076 for (Value *Op : C->operands())
77 if (!isSimpleEnoughValueToCommit(cast<Constant>(Op), SimpleConstants, DL))
78 return false;
79 return true;
80 }
81
82 // We don't know exactly what relocations are allowed in constant expressions,
83 // so we allow &global+constantoffset, which is safe and uniformly supported
84 // across targets.
85 ConstantExpr *CE = cast<ConstantExpr>(C);
86 switch (CE->getOpcode()) {
87 case Instruction::BitCast:
88 // Bitcast is fine if the casted value is fine.
89 return isSimpleEnoughValueToCommit(CE->getOperand(0), SimpleConstants, DL);
90
91 case Instruction::IntToPtr:
92 case Instruction::PtrToInt:
93 // int <=> ptr is fine if the int type is the same size as the
94 // pointer type.
95 if (DL.getTypeSizeInBits(CE->getType()) !=
96 DL.getTypeSizeInBits(CE->getOperand(0)->getType()))
97 return false;
98 return isSimpleEnoughValueToCommit(CE->getOperand(0), SimpleConstants, DL);
99
100 // GEP is fine if it is simple + constant offset.
101 case Instruction::GetElementPtr:
102 for (unsigned i = 1, e = CE->getNumOperands(); i != e; ++i)
103 if (!isa<ConstantInt>(CE->getOperand(i)))
104 return false;
105 return isSimpleEnoughValueToCommit(CE->getOperand(0), SimpleConstants, DL);
106
107 case Instruction::Add:
108 // We allow simple+cst.
109 if (!isa<ConstantInt>(CE->getOperand(1)))
110 return false;
111 return isSimpleEnoughValueToCommit(CE->getOperand(0), SimpleConstants, DL);
112 }
113 return false;
114}
115
116static inline bool
117isSimpleEnoughValueToCommit(Constant *C,
118 SmallPtrSetImpl<Constant *> &SimpleConstants,
119 const DataLayout &DL) {
120 // If we already checked this constant, we win.
121 if (!SimpleConstants.insert(C).second)
122 return true;
123 // Check the constant.
124 return isSimpleEnoughValueToCommitHelper(C, SimpleConstants, DL);
125}
126
127/// Return true if this constant is simple enough for us to understand. In
128/// particular, if it is a cast to anything other than from one pointer type to
129/// another pointer type, we punt. We basically just support direct accesses to
130/// globals and GEP's of globals. This should be kept up to date with
131/// CommitValueTo.
132static bool isSimpleEnoughPointerToCommit(Constant *C) {
133 // Conservatively, avoid aggregate types. This is because we don't
134 // want to worry about them partially overlapping other stores.
135 if (!cast<PointerType>(C->getType())->getElementType()->isSingleValueType())
136 return false;
137
138 if (GlobalVariable *GV = dyn_cast<GlobalVariable>(C))
139 // Do not allow weak/*_odr/linkonce linkage or external globals.
140 return GV->hasUniqueInitializer();
141
142 if (ConstantExpr *CE = dyn_cast<ConstantExpr>(C)) {
143 // Handle a constantexpr gep.
144 if (CE->getOpcode() == Instruction::GetElementPtr &&
145 isa<GlobalVariable>(CE->getOperand(0)) &&
146 cast<GEPOperator>(CE)->isInBounds()) {
147 GlobalVariable *GV = cast<GlobalVariable>(CE->getOperand(0));
148 // Do not allow weak/*_odr/linkonce/dllimport/dllexport linkage or
149 // external globals.
150 if (!GV->hasUniqueInitializer())
151 return false;
152
153 // The first index must be zero.
154 ConstantInt *CI = dyn_cast<ConstantInt>(*std::next(CE->op_begin()));
155 if (!CI || !CI->isZero()) return false;
156
157 // The remaining indices must be compile-time known integers within the
158 // notional bounds of the corresponding static array types.
159 if (!CE->isGEPWithNoNotionalOverIndexing())
160 return false;
161
162 return ConstantFoldLoadThroughGEPConstantExpr(GV->getInitializer(), CE);
163
164 // A constantexpr bitcast from a pointer to another pointer is a no-op,
165 // and we know how to evaluate it by moving the bitcast from the pointer
166 // operand to the value operand.
167 } else if (CE->getOpcode() == Instruction::BitCast &&
168 isa<GlobalVariable>(CE->getOperand(0))) {
169 // Do not allow weak/*_odr/linkonce/dllimport/dllexport linkage or
170 // external globals.
171 return cast<GlobalVariable>(CE->getOperand(0))->hasUniqueInitializer();
172 }
173 }
174
175 return false;
176}
177
Eugene Leviant6f42a2c2018-03-13 10:19:50 +0000178static Constant *getInitializer(Constant *C) {
179 auto *GV = dyn_cast<GlobalVariable>(C);
180 return GV && GV->hasDefinitiveInitializer() ? GV->getInitializer() : nullptr;
181}
182
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000183/// Return the value that would be computed by a load from P after the stores
184/// reflected by 'memory' have been performed. If we can't decide, return null.
185Constant *Evaluator::ComputeLoadResult(Constant *P) {
186 // If this memory location has been recently stored, use the stored value: it
187 // is the most up-to-date.
188 DenseMap<Constant*, Constant*>::const_iterator I = MutatedMemory.find(P);
189 if (I != MutatedMemory.end()) return I->second;
190
191 // Access it.
192 if (GlobalVariable *GV = dyn_cast<GlobalVariable>(P)) {
193 if (GV->hasDefinitiveInitializer())
194 return GV->getInitializer();
195 return nullptr;
196 }
197
Eugene Leviant6f42a2c2018-03-13 10:19:50 +0000198 if (ConstantExpr *CE = dyn_cast<ConstantExpr>(P)) {
199 switch (CE->getOpcode()) {
200 // Handle a constantexpr getelementptr.
201 case Instruction::GetElementPtr:
202 if (auto *I = getInitializer(CE->getOperand(0)))
203 return ConstantFoldLoadThroughGEPConstantExpr(I, CE);
204 break;
205 // Handle a constantexpr bitcast.
206 case Instruction::BitCast:
Mircea Trofinaa3fea6c2018-04-06 15:54:47 +0000207 Constant *Val = getVal(CE->getOperand(0));
208 auto MM = MutatedMemory.find(Val);
209 auto *I = (MM != MutatedMemory.end()) ? MM->second
210 : getInitializer(CE->getOperand(0));
211 if (I)
Eugene Leviant6f42a2c2018-03-13 10:19:50 +0000212 return ConstantFoldLoadThroughBitcast(
213 I, P->getType()->getPointerElementType(), DL);
214 break;
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000215 }
Eugene Leviant6f42a2c2018-03-13 10:19:50 +0000216 }
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000217
218 return nullptr; // don't know how to evaluate.
219}
220
Eugene Leviant6a572b82018-07-10 16:34:23 +0000221static Function *getFunction(Constant *C) {
222 if (auto *Fn = dyn_cast<Function>(C))
223 return Fn;
224
225 if (auto *Alias = dyn_cast<GlobalAlias>(C))
226 if (auto *Fn = dyn_cast<Function>(Alias->getAliasee()))
227 return Fn;
228 return nullptr;
229}
230
Eugene Leviant6e413442018-07-01 11:02:07 +0000231Function *
232Evaluator::getCalleeWithFormalArgs(CallSite &CS,
233 SmallVector<Constant *, 8> &Formals) {
234 auto *V = CS.getCalledValue();
Eugene Leviant6a572b82018-07-10 16:34:23 +0000235 if (auto *Fn = getFunction(getVal(V)))
Eugene Leviant6e413442018-07-01 11:02:07 +0000236 return getFormalParams(CS, Fn, Formals) ? Fn : nullptr;
237
238 auto *CE = dyn_cast<ConstantExpr>(V);
239 if (!CE || CE->getOpcode() != Instruction::BitCast ||
Eugene Leviant6a572b82018-07-10 16:34:23 +0000240 !getFormalParams(CS, getFunction(CE->getOperand(0)), Formals))
Eugene Leviant6e413442018-07-01 11:02:07 +0000241 return nullptr;
242
243 return dyn_cast<Function>(
244 ConstantFoldLoadThroughBitcast(CE, CE->getOperand(0)->getType(), DL));
245}
246
247bool Evaluator::getFormalParams(CallSite &CS, Function *F,
248 SmallVector<Constant *, 8> &Formals) {
Eugene Leviant6a572b82018-07-10 16:34:23 +0000249 if (!F)
250 return false;
251
Eugene Leviant6e413442018-07-01 11:02:07 +0000252 auto *FTy = F->getFunctionType();
253 if (FTy->getNumParams() > CS.getNumArgOperands()) {
254 LLVM_DEBUG(dbgs() << "Too few arguments for function.\n");
255 return false;
256 }
257
258 auto ArgI = CS.arg_begin();
259 for (auto ParI = FTy->param_begin(), ParE = FTy->param_end(); ParI != ParE;
260 ++ParI) {
261 auto *ArgC = ConstantFoldLoadThroughBitcast(getVal(*ArgI), *ParI, DL);
262 if (!ArgC) {
263 LLVM_DEBUG(dbgs() << "Can not convert function argument.\n");
264 return false;
265 }
266 Formals.push_back(ArgC);
267 ++ArgI;
268 }
269 return true;
270}
271
272/// If call expression contains bitcast then we may need to cast
273/// evaluated return value to a type of the call expression.
274Constant *Evaluator::castCallResultIfNeeded(Value *CallExpr, Constant *RV) {
275 ConstantExpr *CE = dyn_cast<ConstantExpr>(CallExpr);
276 if (!RV || !CE || CE->getOpcode() != Instruction::BitCast)
277 return RV;
278
279 if (auto *FT =
280 dyn_cast<FunctionType>(CE->getType()->getPointerElementType())) {
281 RV = ConstantFoldLoadThroughBitcast(RV, FT->getReturnType(), DL);
282 if (!RV)
283 LLVM_DEBUG(dbgs() << "Failed to fold bitcast call expr\n");
284 }
285 return RV;
286}
287
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000288/// Evaluate all instructions in block BB, returning true if successful, false
289/// if we can't evaluate it. NewBB returns the next BB that control flows into,
290/// or null upon return.
291bool Evaluator::EvaluateBlock(BasicBlock::iterator CurInst,
292 BasicBlock *&NextBB) {
293 // This is the main evaluation loop.
Eugene Zelenko5adb96c2017-10-26 00:55:39 +0000294 while (true) {
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000295 Constant *InstResult = nullptr;
296
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000297 LLVM_DEBUG(dbgs() << "Evaluating Instruction: " << *CurInst << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000298
299 if (StoreInst *SI = dyn_cast<StoreInst>(CurInst)) {
300 if (!SI->isSimple()) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000301 LLVM_DEBUG(dbgs() << "Store is not simple! Can not evaluate.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000302 return false; // no volatile/atomic accesses.
303 }
304 Constant *Ptr = getVal(SI->getOperand(1));
David Majnemerd536f232016-07-29 03:27:26 +0000305 if (auto *FoldedPtr = ConstantFoldConstant(Ptr, DL, TLI)) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000306 LLVM_DEBUG(dbgs() << "Folding constant ptr expression: " << *Ptr);
David Majnemerd536f232016-07-29 03:27:26 +0000307 Ptr = FoldedPtr;
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000308 LLVM_DEBUG(dbgs() << "; To: " << *Ptr << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000309 }
310 if (!isSimpleEnoughPointerToCommit(Ptr)) {
311 // If this is too complex for us to commit, reject it.
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000312 LLVM_DEBUG(
313 dbgs() << "Pointer is too complex for us to evaluate store.");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000314 return false;
315 }
316
317 Constant *Val = getVal(SI->getOperand(0));
318
319 // If this might be too difficult for the backend to handle (e.g. the addr
320 // of one global variable divided by another) then we can't commit it.
321 if (!isSimpleEnoughValueToCommit(Val, SimpleConstants, DL)) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000322 LLVM_DEBUG(dbgs() << "Store value is too complex to evaluate store. "
323 << *Val << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000324 return false;
325 }
326
327 if (ConstantExpr *CE = dyn_cast<ConstantExpr>(Ptr)) {
328 if (CE->getOpcode() == Instruction::BitCast) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000329 LLVM_DEBUG(dbgs()
330 << "Attempting to resolve bitcast on constant ptr.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000331 // If we're evaluating a store through a bitcast, then we need
332 // to pull the bitcast off the pointer type and push it onto the
333 // stored value.
334 Ptr = CE->getOperand(0);
335
336 Type *NewTy = cast<PointerType>(Ptr->getType())->getElementType();
337
338 // In order to push the bitcast onto the stored value, a bitcast
339 // from NewTy to Val's type must be legal. If it's not, we can try
340 // introspecting NewTy to find a legal conversion.
Eugene Leviant6f42a2c2018-03-13 10:19:50 +0000341 Constant *NewVal;
342 while (!(NewVal = ConstantFoldLoadThroughBitcast(Val, NewTy, DL))) {
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000343 // If NewTy is a struct, we can convert the pointer to the struct
344 // into a pointer to its first member.
345 // FIXME: This could be extended to support arrays as well.
346 if (StructType *STy = dyn_cast<StructType>(NewTy)) {
347 NewTy = STy->getTypeAtIndex(0U);
348
349 IntegerType *IdxTy = IntegerType::get(NewTy->getContext(), 32);
350 Constant *IdxZero = ConstantInt::get(IdxTy, 0, false);
351 Constant * const IdxList[] = {IdxZero, IdxZero};
352
353 Ptr = ConstantExpr::getGetElementPtr(nullptr, Ptr, IdxList);
David Majnemerd536f232016-07-29 03:27:26 +0000354 if (auto *FoldedPtr = ConstantFoldConstant(Ptr, DL, TLI))
355 Ptr = FoldedPtr;
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000356
357 // If we can't improve the situation by introspecting NewTy,
358 // we have to give up.
359 } else {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000360 LLVM_DEBUG(dbgs() << "Failed to bitcast constant ptr, can not "
361 "evaluate.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000362 return false;
363 }
364 }
365
Eugene Leviant6f42a2c2018-03-13 10:19:50 +0000366 Val = NewVal;
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000367 LLVM_DEBUG(dbgs() << "Evaluated bitcast: " << *Val << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000368 }
369 }
370
371 MutatedMemory[Ptr] = Val;
372 } else if (BinaryOperator *BO = dyn_cast<BinaryOperator>(CurInst)) {
373 InstResult = ConstantExpr::get(BO->getOpcode(),
374 getVal(BO->getOperand(0)),
375 getVal(BO->getOperand(1)));
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000376 LLVM_DEBUG(dbgs() << "Found a BinaryOperator! Simplifying: "
377 << *InstResult << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000378 } else if (CmpInst *CI = dyn_cast<CmpInst>(CurInst)) {
379 InstResult = ConstantExpr::getCompare(CI->getPredicate(),
380 getVal(CI->getOperand(0)),
381 getVal(CI->getOperand(1)));
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000382 LLVM_DEBUG(dbgs() << "Found a CmpInst! Simplifying: " << *InstResult
383 << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000384 } else if (CastInst *CI = dyn_cast<CastInst>(CurInst)) {
385 InstResult = ConstantExpr::getCast(CI->getOpcode(),
386 getVal(CI->getOperand(0)),
387 CI->getType());
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000388 LLVM_DEBUG(dbgs() << "Found a Cast! Simplifying: " << *InstResult
389 << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000390 } else if (SelectInst *SI = dyn_cast<SelectInst>(CurInst)) {
391 InstResult = ConstantExpr::getSelect(getVal(SI->getOperand(0)),
392 getVal(SI->getOperand(1)),
393 getVal(SI->getOperand(2)));
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000394 LLVM_DEBUG(dbgs() << "Found a Select! Simplifying: " << *InstResult
395 << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000396 } else if (auto *EVI = dyn_cast<ExtractValueInst>(CurInst)) {
397 InstResult = ConstantExpr::getExtractValue(
398 getVal(EVI->getAggregateOperand()), EVI->getIndices());
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000399 LLVM_DEBUG(dbgs() << "Found an ExtractValueInst! Simplifying: "
400 << *InstResult << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000401 } else if (auto *IVI = dyn_cast<InsertValueInst>(CurInst)) {
402 InstResult = ConstantExpr::getInsertValue(
403 getVal(IVI->getAggregateOperand()),
404 getVal(IVI->getInsertedValueOperand()), IVI->getIndices());
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000405 LLVM_DEBUG(dbgs() << "Found an InsertValueInst! Simplifying: "
406 << *InstResult << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000407 } else if (GetElementPtrInst *GEP = dyn_cast<GetElementPtrInst>(CurInst)) {
408 Constant *P = getVal(GEP->getOperand(0));
409 SmallVector<Constant*, 8> GEPOps;
410 for (User::op_iterator i = GEP->op_begin() + 1, e = GEP->op_end();
411 i != e; ++i)
412 GEPOps.push_back(getVal(*i));
413 InstResult =
414 ConstantExpr::getGetElementPtr(GEP->getSourceElementType(), P, GEPOps,
415 cast<GEPOperator>(GEP)->isInBounds());
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000416 LLVM_DEBUG(dbgs() << "Found a GEP! Simplifying: " << *InstResult << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000417 } else if (LoadInst *LI = dyn_cast<LoadInst>(CurInst)) {
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000418 if (!LI->isSimple()) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000419 LLVM_DEBUG(
420 dbgs() << "Found a Load! Not a simple load, can not evaluate.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000421 return false; // no volatile/atomic accesses.
422 }
423
424 Constant *Ptr = getVal(LI->getOperand(0));
David Majnemerd536f232016-07-29 03:27:26 +0000425 if (auto *FoldedPtr = ConstantFoldConstant(Ptr, DL, TLI)) {
426 Ptr = FoldedPtr;
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000427 LLVM_DEBUG(dbgs() << "Found a constant pointer expression, constant "
428 "folding: "
429 << *Ptr << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000430 }
431 InstResult = ComputeLoadResult(Ptr);
432 if (!InstResult) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000433 LLVM_DEBUG(
434 dbgs() << "Failed to compute load result. Can not evaluate load."
435 "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000436 return false; // Could not evaluate load.
437 }
438
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000439 LLVM_DEBUG(dbgs() << "Evaluated load: " << *InstResult << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000440 } else if (AllocaInst *AI = dyn_cast<AllocaInst>(CurInst)) {
441 if (AI->isArrayAllocation()) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000442 LLVM_DEBUG(dbgs() << "Found an array alloca. Can not evaluate.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000443 return false; // Cannot handle array allocs.
444 }
445 Type *Ty = AI->getAllocatedType();
Eugene Zelenko5adb96c2017-10-26 00:55:39 +0000446 AllocaTmps.push_back(llvm::make_unique<GlobalVariable>(
447 Ty, false, GlobalValue::InternalLinkage, UndefValue::get(Ty),
Yaxun Liuea988f12018-05-19 02:58:16 +0000448 AI->getName(), /*TLMode=*/GlobalValue::NotThreadLocal,
449 AI->getType()->getPointerAddressSpace()));
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000450 InstResult = AllocaTmps.back().get();
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000451 LLVM_DEBUG(dbgs() << "Found an alloca. Result: " << *InstResult << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000452 } else if (isa<CallInst>(CurInst) || isa<InvokeInst>(CurInst)) {
453 CallSite CS(&*CurInst);
454
455 // Debug info can safely be ignored here.
456 if (isa<DbgInfoIntrinsic>(CS.getInstruction())) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000457 LLVM_DEBUG(dbgs() << "Ignoring debug info.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000458 ++CurInst;
459 continue;
460 }
461
462 // Cannot handle inline asm.
463 if (isa<InlineAsm>(CS.getCalledValue())) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000464 LLVM_DEBUG(dbgs() << "Found inline asm, can not evaluate.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000465 return false;
466 }
467
468 if (IntrinsicInst *II = dyn_cast<IntrinsicInst>(CS.getInstruction())) {
469 if (MemSetInst *MSI = dyn_cast<MemSetInst>(II)) {
470 if (MSI->isVolatile()) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000471 LLVM_DEBUG(dbgs() << "Can not optimize a volatile memset "
472 << "intrinsic.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000473 return false;
474 }
475 Constant *Ptr = getVal(MSI->getDest());
476 Constant *Val = getVal(MSI->getValue());
477 Constant *DestVal = ComputeLoadResult(getVal(Ptr));
478 if (Val->isNullValue() && DestVal && DestVal->isNullValue()) {
479 // This memset is a no-op.
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000480 LLVM_DEBUG(dbgs() << "Ignoring no-op memset.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000481 ++CurInst;
482 continue;
483 }
484 }
485
486 if (II->getIntrinsicID() == Intrinsic::lifetime_start ||
487 II->getIntrinsicID() == Intrinsic::lifetime_end) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000488 LLVM_DEBUG(dbgs() << "Ignoring lifetime intrinsic.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000489 ++CurInst;
490 continue;
491 }
492
493 if (II->getIntrinsicID() == Intrinsic::invariant_start) {
494 // We don't insert an entry into Values, as it doesn't have a
495 // meaningful return value.
496 if (!II->use_empty()) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000497 LLVM_DEBUG(dbgs()
498 << "Found unused invariant_start. Can't evaluate.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000499 return false;
500 }
501 ConstantInt *Size = cast<ConstantInt>(II->getArgOperand(0));
502 Value *PtrArg = getVal(II->getArgOperand(1));
503 Value *Ptr = PtrArg->stripPointerCasts();
504 if (GlobalVariable *GV = dyn_cast<GlobalVariable>(Ptr)) {
505 Type *ElemTy = GV->getValueType();
Craig Topper79ab6432017-07-06 18:39:47 +0000506 if (!Size->isMinusOne() &&
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000507 Size->getValue().getLimitedValue() >=
508 DL.getTypeStoreSize(ElemTy)) {
509 Invariants.insert(GV);
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000510 LLVM_DEBUG(dbgs() << "Found a global var that is an invariant: "
511 << *GV << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000512 } else {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000513 LLVM_DEBUG(dbgs()
514 << "Found a global var, but can not treat it as an "
515 "invariant.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000516 }
517 }
518 // Continue even if we do nothing.
519 ++CurInst;
520 continue;
521 } else if (II->getIntrinsicID() == Intrinsic::assume) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000522 LLVM_DEBUG(dbgs() << "Skipping assume intrinsic.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000523 ++CurInst;
524 continue;
Dan Gohman2c74fe92017-11-08 21:59:51 +0000525 } else if (II->getIntrinsicID() == Intrinsic::sideeffect) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000526 LLVM_DEBUG(dbgs() << "Skipping sideeffect intrinsic.\n");
Dan Gohman2c74fe92017-11-08 21:59:51 +0000527 ++CurInst;
528 continue;
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000529 }
530
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000531 LLVM_DEBUG(dbgs() << "Unknown intrinsic. Can not evaluate.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000532 return false;
533 }
534
535 // Resolve function pointers.
Eugene Leviant6e413442018-07-01 11:02:07 +0000536 SmallVector<Constant *, 8> Formals;
537 Function *Callee = getCalleeWithFormalArgs(CS, Formals);
Sanjoy Das5ce32722016-04-08 00:48:30 +0000538 if (!Callee || Callee->isInterposable()) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000539 LLVM_DEBUG(dbgs() << "Can not resolve function pointer.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000540 return false; // Cannot resolve.
541 }
542
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000543 if (Callee->isDeclaration()) {
544 // If this is a function we can constant fold, do it.
Andrew Kaylor647025f2017-06-09 23:18:11 +0000545 if (Constant *C = ConstantFoldCall(CS, Callee, Formals, TLI)) {
Eugene Leviant6e413442018-07-01 11:02:07 +0000546 InstResult = castCallResultIfNeeded(CS.getCalledValue(), C);
547 if (!InstResult)
548 return false;
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000549 LLVM_DEBUG(dbgs() << "Constant folded function call. Result: "
550 << *InstResult << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000551 } else {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000552 LLVM_DEBUG(dbgs() << "Can not constant fold function call.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000553 return false;
554 }
555 } else {
556 if (Callee->getFunctionType()->isVarArg()) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000557 LLVM_DEBUG(dbgs() << "Can not constant fold vararg function call.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000558 return false;
559 }
560
561 Constant *RetVal = nullptr;
562 // Execute the call, if successful, use the return value.
563 ValueStack.emplace_back();
564 if (!EvaluateFunction(Callee, RetVal, Formals)) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000565 LLVM_DEBUG(dbgs() << "Failed to evaluate function.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000566 return false;
567 }
568 ValueStack.pop_back();
Eugene Leviant6e413442018-07-01 11:02:07 +0000569 InstResult = castCallResultIfNeeded(CS.getCalledValue(), RetVal);
570 if (RetVal && !InstResult)
571 return false;
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000572
573 if (InstResult) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000574 LLVM_DEBUG(dbgs() << "Successfully evaluated function. Result: "
575 << *InstResult << "\n\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000576 } else {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000577 LLVM_DEBUG(dbgs()
578 << "Successfully evaluated function. Result: 0\n\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000579 }
580 }
Chandler Carruth9ae926b2018-08-26 09:51:22 +0000581 } else if (CurInst->isTerminator()) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000582 LLVM_DEBUG(dbgs() << "Found a terminator instruction.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000583
584 if (BranchInst *BI = dyn_cast<BranchInst>(CurInst)) {
585 if (BI->isUnconditional()) {
586 NextBB = BI->getSuccessor(0);
587 } else {
588 ConstantInt *Cond =
589 dyn_cast<ConstantInt>(getVal(BI->getCondition()));
590 if (!Cond) return false; // Cannot determine.
591
592 NextBB = BI->getSuccessor(!Cond->getZExtValue());
593 }
594 } else if (SwitchInst *SI = dyn_cast<SwitchInst>(CurInst)) {
595 ConstantInt *Val =
596 dyn_cast<ConstantInt>(getVal(SI->getCondition()));
597 if (!Val) return false; // Cannot determine.
Chandler Carruth927d8e62017-04-12 07:27:28 +0000598 NextBB = SI->findCaseValue(Val)->getCaseSuccessor();
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000599 } else if (IndirectBrInst *IBI = dyn_cast<IndirectBrInst>(CurInst)) {
600 Value *Val = getVal(IBI->getAddress())->stripPointerCasts();
601 if (BlockAddress *BA = dyn_cast<BlockAddress>(Val))
602 NextBB = BA->getBasicBlock();
603 else
604 return false; // Cannot determine.
605 } else if (isa<ReturnInst>(CurInst)) {
606 NextBB = nullptr;
607 } else {
608 // invoke, unwind, resume, unreachable.
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000609 LLVM_DEBUG(dbgs() << "Can not handle terminator.");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000610 return false; // Cannot handle this terminator.
611 }
612
613 // We succeeded at evaluating this block!
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000614 LLVM_DEBUG(dbgs() << "Successfully evaluated block.\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000615 return true;
616 } else {
617 // Did not know how to evaluate this!
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000618 LLVM_DEBUG(
619 dbgs() << "Failed to evaluate block due to unhandled instruction."
620 "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000621 return false;
622 }
623
624 if (!CurInst->use_empty()) {
David Majnemerd536f232016-07-29 03:27:26 +0000625 if (auto *FoldedInstResult = ConstantFoldConstant(InstResult, DL, TLI))
626 InstResult = FoldedInstResult;
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000627
628 setVal(&*CurInst, InstResult);
629 }
630
631 // If we just processed an invoke, we finished evaluating the block.
632 if (InvokeInst *II = dyn_cast<InvokeInst>(CurInst)) {
633 NextBB = II->getNormalDest();
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000634 LLVM_DEBUG(dbgs() << "Found an invoke instruction. Finished Block.\n\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000635 return true;
636 }
637
638 // Advance program counter.
639 ++CurInst;
640 }
641}
642
643/// Evaluate a call to function F, returning true if successful, false if we
644/// can't evaluate it. ActualArgs contains the formal arguments for the
645/// function.
646bool Evaluator::EvaluateFunction(Function *F, Constant *&RetVal,
647 const SmallVectorImpl<Constant*> &ActualArgs) {
648 // Check to see if this function is already executing (recursion). If so,
649 // bail out. TODO: we might want to accept limited recursion.
David Majnemer0d955d02016-08-11 22:21:41 +0000650 if (is_contained(CallStack, F))
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000651 return false;
652
653 CallStack.push_back(F);
654
655 // Initialize arguments to the incoming values specified.
656 unsigned ArgNo = 0;
657 for (Function::arg_iterator AI = F->arg_begin(), E = F->arg_end(); AI != E;
658 ++AI, ++ArgNo)
659 setVal(&*AI, ActualArgs[ArgNo]);
660
661 // ExecutedBlocks - We only handle non-looping, non-recursive code. As such,
662 // we can only evaluate any one basic block at most once. This set keeps
663 // track of what we have executed so we can detect recursive cases etc.
664 SmallPtrSet<BasicBlock*, 32> ExecutedBlocks;
665
666 // CurBB - The current basic block we're evaluating.
667 BasicBlock *CurBB = &F->front();
668
669 BasicBlock::iterator CurInst = CurBB->begin();
670
Eugene Zelenko5adb96c2017-10-26 00:55:39 +0000671 while (true) {
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000672 BasicBlock *NextBB = nullptr; // Initialized to avoid compiler warnings.
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000673 LLVM_DEBUG(dbgs() << "Trying to evaluate BB: " << *CurBB << "\n");
Peter Collingbourne9f7ec142016-02-03 02:51:00 +0000674
675 if (!EvaluateBlock(CurInst, NextBB))
676 return false;
677
678 if (!NextBB) {
679 // Successfully running until there's no next block means that we found
680 // the return. Fill it the return value and pop the call stack.
681 ReturnInst *RI = cast<ReturnInst>(CurBB->getTerminator());
682 if (RI->getNumOperands())
683 RetVal = getVal(RI->getOperand(0));
684 CallStack.pop_back();
685 return true;
686 }
687
688 // Okay, we succeeded in evaluating this control flow. See if we have
689 // executed the new block before. If so, we have a looping function,
690 // which we cannot evaluate in reasonable time.
691 if (!ExecutedBlocks.insert(NextBB).second)
692 return false; // looped!
693
694 // Okay, we have never been in this block before. Check to see if there
695 // are any PHI nodes. If so, evaluate them with information about where
696 // we came from.
697 PHINode *PN = nullptr;
698 for (CurInst = NextBB->begin();
699 (PN = dyn_cast<PHINode>(CurInst)); ++CurInst)
700 setVal(PN, getVal(PN->getIncomingValueForBlock(CurBB)));
701
702 // Advance to the next block.
703 CurBB = NextBB;
704 }
705}