blob: 6f166b8ee7fae628b1df39f2de7e21dc26bab9f5 [file] [log] [blame]
Chris Lattner704541b2011-01-02 21:47:05 +00001//===- EarlyCSE.cpp - Simple and fast CSE pass ----------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This pass performs a simple dominator tree walk that eliminates trivially
11// redundant instructions.
12//
13//===----------------------------------------------------------------------===//
14
Chris Lattner704541b2011-01-02 21:47:05 +000015#include "llvm/Transforms/Scalar.h"
Michael Ilseman336cb792012-10-09 16:57:38 +000016#include "llvm/ADT/Hashing.h"
Chris Lattner18ae5432011-01-02 23:04:14 +000017#include "llvm/ADT/ScopedHashTable.h"
Chris Lattner8fac5db2011-01-02 23:19:45 +000018#include "llvm/ADT/Statistic.h"
Hal Finkel60db0582014-09-07 18:57:58 +000019#include "llvm/Analysis/AssumptionTracker.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000020#include "llvm/Analysis/InstructionSimplify.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000021#include "llvm/IR/DataLayout.h"
Chandler Carruth5ad5f152014-01-13 09:26:24 +000022#include "llvm/IR/Dominators.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000023#include "llvm/IR/Instructions.h"
Hal Finkel1e16fa32014-11-03 20:21:32 +000024#include "llvm/IR/IntrinsicInst.h"
25#include "llvm/IR/PatternMatch.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000026#include "llvm/Pass.h"
27#include "llvm/Support/Debug.h"
28#include "llvm/Support/RecyclingAllocator.h"
29#include "llvm/Target/TargetLibraryInfo.h"
30#include "llvm/Transforms/Utils/Local.h"
Lenny Maiorani9eefc812014-09-20 13:29:20 +000031#include <deque>
Chris Lattner704541b2011-01-02 21:47:05 +000032using namespace llvm;
Hal Finkel1e16fa32014-11-03 20:21:32 +000033using namespace llvm::PatternMatch;
Chris Lattner704541b2011-01-02 21:47:05 +000034
Chandler Carruth964daaa2014-04-22 02:55:47 +000035#define DEBUG_TYPE "early-cse"
36
Chris Lattner4cb36542011-01-03 03:28:23 +000037STATISTIC(NumSimplify, "Number of instructions simplified or DCE'd");
38STATISTIC(NumCSE, "Number of instructions CSE'd");
Chris Lattner92bb0f92011-01-03 03:41:27 +000039STATISTIC(NumCSELoad, "Number of load instructions CSE'd");
40STATISTIC(NumCSECall, "Number of call instructions CSE'd");
Chris Lattner9e5e9ed2011-01-03 04:17:24 +000041STATISTIC(NumDSE, "Number of trivial dead stores removed");
Chris Lattnerb9a8efc2011-01-03 03:18:43 +000042
43static unsigned getHash(const void *V) {
44 return DenseMapInfo<const void*>::getHashValue(V);
45}
Chris Lattner8fac5db2011-01-02 23:19:45 +000046
Chris Lattner79d83062011-01-03 02:20:48 +000047//===----------------------------------------------------------------------===//
Nadav Rotem465834c2012-07-24 10:51:42 +000048// SimpleValue
Chris Lattner79d83062011-01-03 02:20:48 +000049//===----------------------------------------------------------------------===//
50
Chris Lattner704541b2011-01-02 21:47:05 +000051namespace {
Chris Lattner79d83062011-01-03 02:20:48 +000052 /// SimpleValue - Instances of this struct represent available values in the
Chris Lattner18ae5432011-01-02 23:04:14 +000053 /// scoped hash table.
Chris Lattner79d83062011-01-03 02:20:48 +000054 struct SimpleValue {
Chris Lattner18ae5432011-01-02 23:04:14 +000055 Instruction *Inst;
Nadav Rotem465834c2012-07-24 10:51:42 +000056
Chris Lattner4cb36542011-01-03 03:28:23 +000057 SimpleValue(Instruction *I) : Inst(I) {
58 assert((isSentinel() || canHandle(I)) && "Inst can't be handled!");
59 }
Nadav Rotem465834c2012-07-24 10:51:42 +000060
Chris Lattner18ae5432011-01-02 23:04:14 +000061 bool isSentinel() const {
62 return Inst == DenseMapInfo<Instruction*>::getEmptyKey() ||
63 Inst == DenseMapInfo<Instruction*>::getTombstoneKey();
64 }
Nadav Rotem465834c2012-07-24 10:51:42 +000065
Chris Lattner18ae5432011-01-02 23:04:14 +000066 static bool canHandle(Instruction *Inst) {
Chris Lattnerbde6ec12011-01-03 23:38:13 +000067 // This can only handle non-void readnone functions.
68 if (CallInst *CI = dyn_cast<CallInst>(Inst))
69 return CI->doesNotAccessMemory() && !CI->getType()->isVoidTy();
Chris Lattner8fac5db2011-01-02 23:19:45 +000070 return isa<CastInst>(Inst) || isa<BinaryOperator>(Inst) ||
71 isa<GetElementPtrInst>(Inst) || isa<CmpInst>(Inst) ||
72 isa<SelectInst>(Inst) || isa<ExtractElementInst>(Inst) ||
73 isa<InsertElementInst>(Inst) || isa<ShuffleVectorInst>(Inst) ||
74 isa<ExtractValueInst>(Inst) || isa<InsertValueInst>(Inst);
Chris Lattner18ae5432011-01-02 23:04:14 +000075 }
Chris Lattner18ae5432011-01-02 23:04:14 +000076 };
77}
78
79namespace llvm {
Chris Lattner79d83062011-01-03 02:20:48 +000080template<> struct DenseMapInfo<SimpleValue> {
81 static inline SimpleValue getEmptyKey() {
Chris Lattner4cb36542011-01-03 03:28:23 +000082 return DenseMapInfo<Instruction*>::getEmptyKey();
Chris Lattner18ae5432011-01-02 23:04:14 +000083 }
Chris Lattner79d83062011-01-03 02:20:48 +000084 static inline SimpleValue getTombstoneKey() {
Chris Lattner4cb36542011-01-03 03:28:23 +000085 return DenseMapInfo<Instruction*>::getTombstoneKey();
Chris Lattner18ae5432011-01-02 23:04:14 +000086 }
Chris Lattner79d83062011-01-03 02:20:48 +000087 static unsigned getHashValue(SimpleValue Val);
88 static bool isEqual(SimpleValue LHS, SimpleValue RHS);
Chris Lattner18ae5432011-01-02 23:04:14 +000089};
90}
91
Chris Lattner79d83062011-01-03 02:20:48 +000092unsigned DenseMapInfo<SimpleValue>::getHashValue(SimpleValue Val) {
Chris Lattner18ae5432011-01-02 23:04:14 +000093 Instruction *Inst = Val.Inst;
Chris Lattner02a97762011-01-03 01:10:08 +000094 // Hash in all of the operands as pointers.
Michael Ilseman336cb792012-10-09 16:57:38 +000095 if (BinaryOperator* BinOp = dyn_cast<BinaryOperator>(Inst)) {
96 Value *LHS = BinOp->getOperand(0);
97 Value *RHS = BinOp->getOperand(1);
98 if (BinOp->isCommutative() && BinOp->getOperand(0) > BinOp->getOperand(1))
99 std::swap(LHS, RHS);
Chris Lattner02a97762011-01-03 01:10:08 +0000100
Michael Ilseman336cb792012-10-09 16:57:38 +0000101 if (isa<OverflowingBinaryOperator>(BinOp)) {
102 // Hash the overflow behavior
103 unsigned Overflow =
104 BinOp->hasNoSignedWrap() * OverflowingBinaryOperator::NoSignedWrap |
105 BinOp->hasNoUnsignedWrap() * OverflowingBinaryOperator::NoUnsignedWrap;
106 return hash_combine(BinOp->getOpcode(), Overflow, LHS, RHS);
107 }
108
109 return hash_combine(BinOp->getOpcode(), LHS, RHS);
Chris Lattner02a97762011-01-03 01:10:08 +0000110 }
111
Michael Ilseman336cb792012-10-09 16:57:38 +0000112 if (CmpInst *CI = dyn_cast<CmpInst>(Inst)) {
113 Value *LHS = CI->getOperand(0);
114 Value *RHS = CI->getOperand(1);
115 CmpInst::Predicate Pred = CI->getPredicate();
116 if (Inst->getOperand(0) > Inst->getOperand(1)) {
117 std::swap(LHS, RHS);
118 Pred = CI->getSwappedPredicate();
119 }
120 return hash_combine(Inst->getOpcode(), Pred, LHS, RHS);
121 }
122
123 if (CastInst *CI = dyn_cast<CastInst>(Inst))
124 return hash_combine(CI->getOpcode(), CI->getType(), CI->getOperand(0));
125
126 if (const ExtractValueInst *EVI = dyn_cast<ExtractValueInst>(Inst))
127 return hash_combine(EVI->getOpcode(), EVI->getOperand(0),
128 hash_combine_range(EVI->idx_begin(), EVI->idx_end()));
129
130 if (const InsertValueInst *IVI = dyn_cast<InsertValueInst>(Inst))
131 return hash_combine(IVI->getOpcode(), IVI->getOperand(0),
132 IVI->getOperand(1),
133 hash_combine_range(IVI->idx_begin(), IVI->idx_end()));
134
135 assert((isa<CallInst>(Inst) || isa<BinaryOperator>(Inst) ||
136 isa<GetElementPtrInst>(Inst) || isa<SelectInst>(Inst) ||
137 isa<ExtractElementInst>(Inst) || isa<InsertElementInst>(Inst) ||
138 isa<ShuffleVectorInst>(Inst)) && "Invalid/unknown instruction");
139
Chris Lattner02a97762011-01-03 01:10:08 +0000140 // Mix in the opcode.
Michael Ilseman336cb792012-10-09 16:57:38 +0000141 return hash_combine(Inst->getOpcode(),
142 hash_combine_range(Inst->value_op_begin(),
143 Inst->value_op_end()));
Chris Lattner18ae5432011-01-02 23:04:14 +0000144}
145
Chris Lattner79d83062011-01-03 02:20:48 +0000146bool DenseMapInfo<SimpleValue>::isEqual(SimpleValue LHS, SimpleValue RHS) {
Chris Lattner18ae5432011-01-02 23:04:14 +0000147 Instruction *LHSI = LHS.Inst, *RHSI = RHS.Inst;
148
149 if (LHS.isSentinel() || RHS.isSentinel())
150 return LHSI == RHSI;
Nadav Rotem465834c2012-07-24 10:51:42 +0000151
Chris Lattner18ae5432011-01-02 23:04:14 +0000152 if (LHSI->getOpcode() != RHSI->getOpcode()) return false;
Michael Ilseman336cb792012-10-09 16:57:38 +0000153 if (LHSI->isIdenticalTo(RHSI)) return true;
154
155 // If we're not strictly identical, we still might be a commutable instruction
156 if (BinaryOperator *LHSBinOp = dyn_cast<BinaryOperator>(LHSI)) {
157 if (!LHSBinOp->isCommutative())
158 return false;
159
160 assert(isa<BinaryOperator>(RHSI)
161 && "same opcode, but different instruction type?");
162 BinaryOperator *RHSBinOp = cast<BinaryOperator>(RHSI);
163
164 // Check overflow attributes
165 if (isa<OverflowingBinaryOperator>(LHSBinOp)) {
166 assert(isa<OverflowingBinaryOperator>(RHSBinOp)
167 && "same opcode, but different operator type?");
168 if (LHSBinOp->hasNoUnsignedWrap() != RHSBinOp->hasNoUnsignedWrap() ||
169 LHSBinOp->hasNoSignedWrap() != RHSBinOp->hasNoSignedWrap())
170 return false;
171 }
172
173 // Commuted equality
174 return LHSBinOp->getOperand(0) == RHSBinOp->getOperand(1) &&
175 LHSBinOp->getOperand(1) == RHSBinOp->getOperand(0);
176 }
177 if (CmpInst *LHSCmp = dyn_cast<CmpInst>(LHSI)) {
178 assert(isa<CmpInst>(RHSI)
179 && "same opcode, but different instruction type?");
180 CmpInst *RHSCmp = cast<CmpInst>(RHSI);
181 // Commuted equality
182 return LHSCmp->getOperand(0) == RHSCmp->getOperand(1) &&
183 LHSCmp->getOperand(1) == RHSCmp->getOperand(0) &&
184 LHSCmp->getSwappedPredicate() == RHSCmp->getPredicate();
185 }
186
187 return false;
Chris Lattner18ae5432011-01-02 23:04:14 +0000188}
189
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000190//===----------------------------------------------------------------------===//
Nadav Rotem465834c2012-07-24 10:51:42 +0000191// CallValue
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000192//===----------------------------------------------------------------------===//
193
194namespace {
Chris Lattner92bb0f92011-01-03 03:41:27 +0000195 /// CallValue - Instances of this struct represent available call values in
196 /// the scoped hash table.
197 struct CallValue {
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000198 Instruction *Inst;
Nadav Rotem465834c2012-07-24 10:51:42 +0000199
Chris Lattner92bb0f92011-01-03 03:41:27 +0000200 CallValue(Instruction *I) : Inst(I) {
Chris Lattner4cb36542011-01-03 03:28:23 +0000201 assert((isSentinel() || canHandle(I)) && "Inst can't be handled!");
202 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000203
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000204 bool isSentinel() const {
205 return Inst == DenseMapInfo<Instruction*>::getEmptyKey() ||
206 Inst == DenseMapInfo<Instruction*>::getTombstoneKey();
207 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000208
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000209 static bool canHandle(Instruction *Inst) {
Chris Lattner16ca19f2011-01-03 18:43:03 +0000210 // Don't value number anything that returns void.
211 if (Inst->getType()->isVoidTy())
212 return false;
Nadav Rotem465834c2012-07-24 10:51:42 +0000213
Chris Lattner142f1cd2011-01-03 18:28:15 +0000214 CallInst *CI = dyn_cast<CallInst>(Inst);
Craig Topperf40110f2014-04-25 05:29:35 +0000215 if (!CI || !CI->onlyReadsMemory())
Chris Lattner142f1cd2011-01-03 18:28:15 +0000216 return false;
Chris Lattner142f1cd2011-01-03 18:28:15 +0000217 return true;
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000218 }
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000219 };
220}
221
222namespace llvm {
Chris Lattner92bb0f92011-01-03 03:41:27 +0000223 template<> struct DenseMapInfo<CallValue> {
224 static inline CallValue getEmptyKey() {
Chris Lattner4cb36542011-01-03 03:28:23 +0000225 return DenseMapInfo<Instruction*>::getEmptyKey();
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000226 }
Chris Lattner92bb0f92011-01-03 03:41:27 +0000227 static inline CallValue getTombstoneKey() {
Chris Lattner4cb36542011-01-03 03:28:23 +0000228 return DenseMapInfo<Instruction*>::getTombstoneKey();
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000229 }
Chris Lattner92bb0f92011-01-03 03:41:27 +0000230 static unsigned getHashValue(CallValue Val);
231 static bool isEqual(CallValue LHS, CallValue RHS);
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000232 };
233}
Chris Lattner92bb0f92011-01-03 03:41:27 +0000234unsigned DenseMapInfo<CallValue>::getHashValue(CallValue Val) {
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000235 Instruction *Inst = Val.Inst;
236 // Hash in all of the operands as pointers.
237 unsigned Res = 0;
Chris Lattner16ca19f2011-01-03 18:43:03 +0000238 for (unsigned i = 0, e = Inst->getNumOperands(); i != e; ++i) {
239 assert(!Inst->getOperand(i)->getType()->isMetadataTy() &&
240 "Cannot value number calls with metadata operands");
Eli Friedman154a9672011-10-12 22:00:26 +0000241 Res ^= getHash(Inst->getOperand(i)) << (i & 0xF);
Chris Lattner16ca19f2011-01-03 18:43:03 +0000242 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000243
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000244 // Mix in the opcode.
245 return (Res << 1) ^ Inst->getOpcode();
246}
247
Chris Lattner92bb0f92011-01-03 03:41:27 +0000248bool DenseMapInfo<CallValue>::isEqual(CallValue LHS, CallValue RHS) {
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000249 Instruction *LHSI = LHS.Inst, *RHSI = RHS.Inst;
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000250 if (LHS.isSentinel() || RHS.isSentinel())
251 return LHSI == RHSI;
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000252 return LHSI->isIdenticalTo(RHSI);
253}
254
Chris Lattner18ae5432011-01-02 23:04:14 +0000255
Chris Lattner79d83062011-01-03 02:20:48 +0000256//===----------------------------------------------------------------------===//
Nadav Rotem465834c2012-07-24 10:51:42 +0000257// EarlyCSE pass.
Chris Lattner79d83062011-01-03 02:20:48 +0000258//===----------------------------------------------------------------------===//
259
Chris Lattner18ae5432011-01-02 23:04:14 +0000260namespace {
Nadav Rotem465834c2012-07-24 10:51:42 +0000261
Chris Lattner704541b2011-01-02 21:47:05 +0000262/// EarlyCSE - This pass does a simple depth-first walk over the dominator
263/// tree, eliminating trivially redundant instructions and using instsimplify
264/// to canonicalize things as it goes. It is intended to be fast and catch
265/// obvious cases so that instcombine and other passes are more effective. It
266/// is expected that a later pass of GVN will catch the interesting/hard
267/// cases.
268class EarlyCSE : public FunctionPass {
269public:
Rafael Espindola37dc9e12014-02-21 00:06:31 +0000270 const DataLayout *DL;
Chad Rosierc24b86f2011-12-01 03:08:23 +0000271 const TargetLibraryInfo *TLI;
Chris Lattner18ae5432011-01-02 23:04:14 +0000272 DominatorTree *DT;
Hal Finkel60db0582014-09-07 18:57:58 +0000273 AssumptionTracker *AT;
Chris Lattnerd815f692011-01-03 01:42:46 +0000274 typedef RecyclingAllocator<BumpPtrAllocator,
Chris Lattner79d83062011-01-03 02:20:48 +0000275 ScopedHashTableVal<SimpleValue, Value*> > AllocatorTy;
276 typedef ScopedHashTable<SimpleValue, Value*, DenseMapInfo<SimpleValue>,
Chris Lattnerd815f692011-01-03 01:42:46 +0000277 AllocatorTy> ScopedHTType;
Nadav Rotem465834c2012-07-24 10:51:42 +0000278
Chris Lattner79d83062011-01-03 02:20:48 +0000279 /// AvailableValues - This scoped hash table contains the current values of
280 /// all of our simple scalar expressions. As we walk down the domtree, we
281 /// look to see if instructions are in this: if so, we replace them with what
282 /// we find, otherwise we insert them so that dominated values can succeed in
283 /// their lookup.
284 ScopedHTType *AvailableValues;
Nadav Rotem465834c2012-07-24 10:51:42 +0000285
Chris Lattner92bb0f92011-01-03 03:41:27 +0000286 /// AvailableLoads - This scoped hash table contains the current values
287 /// of loads. This allows us to get efficient access to dominating loads when
288 /// we have a fully redundant load. In addition to the most recent load, we
289 /// keep track of a generation count of the read, which is compared against
290 /// the current generation count. The current generation count is
291 /// incremented after every possibly writing memory operation, which ensures
292 /// that we only CSE loads with other loads that have no intervening store.
Chris Lattner4b9a5252011-01-03 03:53:50 +0000293 typedef RecyclingAllocator<BumpPtrAllocator,
294 ScopedHashTableVal<Value*, std::pair<Value*, unsigned> > > LoadMapAllocator;
295 typedef ScopedHashTable<Value*, std::pair<Value*, unsigned>,
296 DenseMapInfo<Value*>, LoadMapAllocator> LoadHTType;
Chris Lattner92bb0f92011-01-03 03:41:27 +0000297 LoadHTType *AvailableLoads;
Nadav Rotem465834c2012-07-24 10:51:42 +0000298
Chris Lattner92bb0f92011-01-03 03:41:27 +0000299 /// AvailableCalls - This scoped hash table contains the current values
300 /// of read-only call values. It uses the same generation count as loads.
301 typedef ScopedHashTable<CallValue, std::pair<Value*, unsigned> > CallHTType;
302 CallHTType *AvailableCalls;
Nadav Rotem465834c2012-07-24 10:51:42 +0000303
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000304 /// CurrentGeneration - This is the current generation of the memory value.
305 unsigned CurrentGeneration;
Nadav Rotem465834c2012-07-24 10:51:42 +0000306
Chris Lattner704541b2011-01-02 21:47:05 +0000307 static char ID;
Chris Lattner79d83062011-01-03 02:20:48 +0000308 explicit EarlyCSE() : FunctionPass(ID) {
Chris Lattner704541b2011-01-02 21:47:05 +0000309 initializeEarlyCSEPass(*PassRegistry::getPassRegistry());
310 }
311
Craig Topper3e4c6972014-03-05 09:10:37 +0000312 bool runOnFunction(Function &F) override;
Chris Lattner704541b2011-01-02 21:47:05 +0000313
314private:
Lenny Maiorani8d670b82012-01-31 23:14:41 +0000315
316 // NodeScope - almost a POD, but needs to call the constructors for the
317 // scoped hash tables so that a new scope gets pushed on. These are RAII so
318 // that the scope gets popped when the NodeScope is destroyed.
319 class NodeScope {
320 public:
321 NodeScope(ScopedHTType *availableValues,
322 LoadHTType *availableLoads,
323 CallHTType *availableCalls) :
324 Scope(*availableValues),
325 LoadScope(*availableLoads),
326 CallScope(*availableCalls) {}
327
328 private:
Craig Toppera60c0f12012-09-15 17:09:36 +0000329 NodeScope(const NodeScope&) LLVM_DELETED_FUNCTION;
330 void operator=(const NodeScope&) LLVM_DELETED_FUNCTION;
Lenny Maiorani8d670b82012-01-31 23:14:41 +0000331
332 ScopedHTType::ScopeTy Scope;
333 LoadHTType::ScopeTy LoadScope;
334 CallHTType::ScopeTy CallScope;
335 };
336
337 // StackNode - contains all the needed information to create a stack for
338 // doing a depth first tranversal of the tree. This includes scopes for
339 // values, loads, and calls as well as the generation. There is a child
340 // iterator so that the children do not need to be store spearately.
341 class StackNode {
342 public:
343 StackNode(ScopedHTType *availableValues,
344 LoadHTType *availableLoads,
345 CallHTType *availableCalls,
346 unsigned cg, DomTreeNode *n,
347 DomTreeNode::iterator child, DomTreeNode::iterator end) :
348 CurrentGeneration(cg), ChildGeneration(cg), Node(n),
349 ChildIter(child), EndIter(end),
350 Scopes(availableValues, availableLoads, availableCalls),
351 Processed(false) {}
352
353 // Accessors.
354 unsigned currentGeneration() { return CurrentGeneration; }
355 unsigned childGeneration() { return ChildGeneration; }
356 void childGeneration(unsigned generation) { ChildGeneration = generation; }
357 DomTreeNode *node() { return Node; }
358 DomTreeNode::iterator childIter() { return ChildIter; }
359 DomTreeNode *nextChild() {
360 DomTreeNode *child = *ChildIter;
361 ++ChildIter;
362 return child;
363 }
364 DomTreeNode::iterator end() { return EndIter; }
365 bool isProcessed() { return Processed; }
366 void process() { Processed = true; }
367
368 private:
Craig Toppera60c0f12012-09-15 17:09:36 +0000369 StackNode(const StackNode&) LLVM_DELETED_FUNCTION;
370 void operator=(const StackNode&) LLVM_DELETED_FUNCTION;
Lenny Maiorani8d670b82012-01-31 23:14:41 +0000371
372 // Members.
373 unsigned CurrentGeneration;
374 unsigned ChildGeneration;
375 DomTreeNode *Node;
376 DomTreeNode::iterator ChildIter;
377 DomTreeNode::iterator EndIter;
378 NodeScope Scopes;
379 bool Processed;
380 };
381
Chris Lattner18ae5432011-01-02 23:04:14 +0000382 bool processNode(DomTreeNode *Node);
Nadav Rotem465834c2012-07-24 10:51:42 +0000383
Chris Lattner704541b2011-01-02 21:47:05 +0000384 // This transformation requires dominator postdominator info
Craig Topper3e4c6972014-03-05 09:10:37 +0000385 void getAnalysisUsage(AnalysisUsage &AU) const override {
Hal Finkel60db0582014-09-07 18:57:58 +0000386 AU.addRequired<AssumptionTracker>();
Chandler Carruth73523022014-01-13 13:07:17 +0000387 AU.addRequired<DominatorTreeWrapperPass>();
Chad Rosierc24b86f2011-12-01 03:08:23 +0000388 AU.addRequired<TargetLibraryInfo>();
Chris Lattner704541b2011-01-02 21:47:05 +0000389 AU.setPreservesCFG();
390 }
391};
392}
393
394char EarlyCSE::ID = 0;
395
396// createEarlyCSEPass - The public interface to this file.
397FunctionPass *llvm::createEarlyCSEPass() {
398 return new EarlyCSE();
399}
400
401INITIALIZE_PASS_BEGIN(EarlyCSE, "early-cse", "Early CSE", false, false)
Hal Finkel60db0582014-09-07 18:57:58 +0000402INITIALIZE_PASS_DEPENDENCY(AssumptionTracker)
Chandler Carruth73523022014-01-13 13:07:17 +0000403INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
Chad Rosierc24b86f2011-12-01 03:08:23 +0000404INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfo)
Chris Lattner704541b2011-01-02 21:47:05 +0000405INITIALIZE_PASS_END(EarlyCSE, "early-cse", "Early CSE", false, false)
406
Chris Lattner18ae5432011-01-02 23:04:14 +0000407bool EarlyCSE::processNode(DomTreeNode *Node) {
Chris Lattner18ae5432011-01-02 23:04:14 +0000408 BasicBlock *BB = Node->getBlock();
Nadav Rotem465834c2012-07-24 10:51:42 +0000409
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000410 // If this block has a single predecessor, then the predecessor is the parent
411 // of the domtree node and all of the live out memory values are still current
412 // in this block. If this block has multiple predecessors, then they could
413 // have invalidated the live-out memory values of our parent value. For now,
414 // just be conservative and invalidate memory if this block has multiple
415 // predecessors.
Craig Topperf40110f2014-04-25 05:29:35 +0000416 if (!BB->getSinglePredecessor())
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000417 ++CurrentGeneration;
Nadav Rotem465834c2012-07-24 10:51:42 +0000418
Chris Lattner9e5e9ed2011-01-03 04:17:24 +0000419 /// LastStore - Keep track of the last non-volatile store that we saw... for
420 /// as long as there in no instruction that reads memory. If we see a store
421 /// to the same location, we delete the dead store. This zaps trivial dead
422 /// stores which can occur in bitfield code among other things.
Craig Topperf40110f2014-04-25 05:29:35 +0000423 StoreInst *LastStore = nullptr;
Nadav Rotem465834c2012-07-24 10:51:42 +0000424
Chris Lattner18ae5432011-01-02 23:04:14 +0000425 bool Changed = false;
426
427 // See if any instructions in the block can be eliminated. If so, do it. If
428 // not, add them to AvailableValues.
429 for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; ) {
430 Instruction *Inst = I++;
Nadav Rotem465834c2012-07-24 10:51:42 +0000431
Chris Lattner18ae5432011-01-02 23:04:14 +0000432 // Dead instructions should just be removed.
Benjamin Kramer8bcc9712012-08-29 15:32:21 +0000433 if (isInstructionTriviallyDead(Inst, TLI)) {
Chris Lattner8fac5db2011-01-02 23:19:45 +0000434 DEBUG(dbgs() << "EarlyCSE DCE: " << *Inst << '\n');
Chris Lattner18ae5432011-01-02 23:04:14 +0000435 Inst->eraseFromParent();
436 Changed = true;
Chris Lattner8fac5db2011-01-02 23:19:45 +0000437 ++NumSimplify;
Chris Lattner18ae5432011-01-02 23:04:14 +0000438 continue;
439 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000440
Hal Finkel1e16fa32014-11-03 20:21:32 +0000441 // Skip assume intrinsics, they don't really have side effects (although
442 // they're marked as such to ensure preservation of control dependencies),
443 // and this pass will not disturb any of the assumption's control
444 // dependencies.
445 if (match(Inst, m_Intrinsic<Intrinsic::assume>())) {
446 DEBUG(dbgs() << "EarlyCSE skipping assumption: " << *Inst << '\n');
447 continue;
448 }
449
Chris Lattner18ae5432011-01-02 23:04:14 +0000450 // If the instruction can be simplified (e.g. X+0 = X) then replace it with
451 // its simpler value.
Hal Finkel60db0582014-09-07 18:57:58 +0000452 if (Value *V = SimplifyInstruction(Inst, DL, TLI, DT, AT)) {
Chris Lattner8fac5db2011-01-02 23:19:45 +0000453 DEBUG(dbgs() << "EarlyCSE Simplify: " << *Inst << " to: " << *V << '\n');
Chris Lattner18ae5432011-01-02 23:04:14 +0000454 Inst->replaceAllUsesWith(V);
455 Inst->eraseFromParent();
456 Changed = true;
Chris Lattner8fac5db2011-01-02 23:19:45 +0000457 ++NumSimplify;
Chris Lattner18ae5432011-01-02 23:04:14 +0000458 continue;
459 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000460
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000461 // If this is a simple instruction that we can value number, process it.
462 if (SimpleValue::canHandle(Inst)) {
463 // See if the instruction has an available value. If so, use it.
Chris Lattner4cb36542011-01-03 03:28:23 +0000464 if (Value *V = AvailableValues->lookup(Inst)) {
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000465 DEBUG(dbgs() << "EarlyCSE CSE: " << *Inst << " to: " << *V << '\n');
466 Inst->replaceAllUsesWith(V);
467 Inst->eraseFromParent();
468 Changed = true;
469 ++NumCSE;
470 continue;
471 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000472
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000473 // Otherwise, just remember that this value is available.
Chris Lattner4cb36542011-01-03 03:28:23 +0000474 AvailableValues->insert(Inst, Inst);
Chris Lattner18ae5432011-01-02 23:04:14 +0000475 continue;
476 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000477
Chris Lattner92bb0f92011-01-03 03:41:27 +0000478 // If this is a non-volatile load, process it.
479 if (LoadInst *LI = dyn_cast<LoadInst>(Inst)) {
480 // Ignore volatile loads.
Eli Friedman7c5dc122011-09-12 20:23:13 +0000481 if (!LI->isSimple()) {
Craig Topperf40110f2014-04-25 05:29:35 +0000482 LastStore = nullptr;
Chris Lattner9e5e9ed2011-01-03 04:17:24 +0000483 continue;
484 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000485
Chris Lattner92bb0f92011-01-03 03:41:27 +0000486 // If we have an available version of this load, and if it is the right
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000487 // generation, replace this instruction.
Chris Lattner92bb0f92011-01-03 03:41:27 +0000488 std::pair<Value*, unsigned> InVal =
489 AvailableLoads->lookup(Inst->getOperand(0));
Craig Topperf40110f2014-04-25 05:29:35 +0000490 if (InVal.first != nullptr && InVal.second == CurrentGeneration) {
Chris Lattner92bb0f92011-01-03 03:41:27 +0000491 DEBUG(dbgs() << "EarlyCSE CSE LOAD: " << *Inst << " to: "
492 << *InVal.first << '\n');
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000493 if (!Inst->use_empty()) Inst->replaceAllUsesWith(InVal.first);
494 Inst->eraseFromParent();
495 Changed = true;
Chris Lattner92bb0f92011-01-03 03:41:27 +0000496 ++NumCSELoad;
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000497 continue;
498 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000499
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000500 // Otherwise, remember that we have this instruction.
Chris Lattner92bb0f92011-01-03 03:41:27 +0000501 AvailableLoads->insert(Inst->getOperand(0),
502 std::pair<Value*, unsigned>(Inst, CurrentGeneration));
Craig Topperf40110f2014-04-25 05:29:35 +0000503 LastStore = nullptr;
Chris Lattner92bb0f92011-01-03 03:41:27 +0000504 continue;
505 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000506
Chris Lattner9e5e9ed2011-01-03 04:17:24 +0000507 // If this instruction may read from memory, forget LastStore.
508 if (Inst->mayReadFromMemory())
Craig Topperf40110f2014-04-25 05:29:35 +0000509 LastStore = nullptr;
Nadav Rotem465834c2012-07-24 10:51:42 +0000510
Chris Lattner92bb0f92011-01-03 03:41:27 +0000511 // If this is a read-only call, process it.
512 if (CallValue::canHandle(Inst)) {
513 // If we have an available version of this call, and if it is the right
514 // generation, replace this instruction.
515 std::pair<Value*, unsigned> InVal = AvailableCalls->lookup(Inst);
Craig Topperf40110f2014-04-25 05:29:35 +0000516 if (InVal.first != nullptr && InVal.second == CurrentGeneration) {
Chris Lattner92bb0f92011-01-03 03:41:27 +0000517 DEBUG(dbgs() << "EarlyCSE CSE CALL: " << *Inst << " to: "
518 << *InVal.first << '\n');
519 if (!Inst->use_empty()) Inst->replaceAllUsesWith(InVal.first);
520 Inst->eraseFromParent();
521 Changed = true;
522 ++NumCSECall;
523 continue;
524 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000525
Chris Lattner92bb0f92011-01-03 03:41:27 +0000526 // Otherwise, remember that we have this instruction.
527 AvailableCalls->insert(Inst,
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000528 std::pair<Value*, unsigned>(Inst, CurrentGeneration));
529 continue;
530 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000531
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000532 // Okay, this isn't something we can CSE at all. Check to see if it is
533 // something that could modify memory. If so, our available memory values
534 // cannot be used so bump the generation count.
Chris Lattnere0e32a92011-01-03 03:46:34 +0000535 if (Inst->mayWriteToMemory()) {
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000536 ++CurrentGeneration;
Nadav Rotem465834c2012-07-24 10:51:42 +0000537
Chris Lattnere0e32a92011-01-03 03:46:34 +0000538 if (StoreInst *SI = dyn_cast<StoreInst>(Inst)) {
Chris Lattner9e5e9ed2011-01-03 04:17:24 +0000539 // We do a trivial form of DSE if there are two stores to the same
540 // location with no intervening loads. Delete the earlier store.
541 if (LastStore &&
542 LastStore->getPointerOperand() == SI->getPointerOperand()) {
543 DEBUG(dbgs() << "EarlyCSE DEAD STORE: " << *LastStore << " due to: "
Chris Lattner142f1cd2011-01-03 18:28:15 +0000544 << *Inst << '\n');
Chris Lattner9e5e9ed2011-01-03 04:17:24 +0000545 LastStore->eraseFromParent();
546 Changed = true;
547 ++NumDSE;
Craig Topperf40110f2014-04-25 05:29:35 +0000548 LastStore = nullptr;
Chris Lattner9e5e9ed2011-01-03 04:17:24 +0000549 continue;
550 }
Nadav Rotem465834c2012-07-24 10:51:42 +0000551
Chris Lattner9e5e9ed2011-01-03 04:17:24 +0000552 // Okay, we just invalidated anything we knew about loaded values. Try
553 // to salvage *something* by remembering that the stored value is a live
554 // version of the pointer. It is safe to forward from volatile stores
555 // to non-volatile loads, so we don't have to check for volatility of
556 // the store.
Chris Lattnere0e32a92011-01-03 03:46:34 +0000557 AvailableLoads->insert(SI->getPointerOperand(),
558 std::pair<Value*, unsigned>(SI->getValueOperand(), CurrentGeneration));
Nadav Rotem465834c2012-07-24 10:51:42 +0000559
Chris Lattner9e5e9ed2011-01-03 04:17:24 +0000560 // Remember that this was the last store we saw for DSE.
Eli Friedman7c5dc122011-09-12 20:23:13 +0000561 if (SI->isSimple())
Chris Lattner9e5e9ed2011-01-03 04:17:24 +0000562 LastStore = SI;
Chris Lattnere0e32a92011-01-03 03:46:34 +0000563 }
564 }
Chris Lattner18ae5432011-01-02 23:04:14 +0000565 }
Lenny Maiorani8d670b82012-01-31 23:14:41 +0000566
Chris Lattner18ae5432011-01-02 23:04:14 +0000567 return Changed;
Chris Lattner704541b2011-01-02 21:47:05 +0000568}
Chris Lattner18ae5432011-01-02 23:04:14 +0000569
570
571bool EarlyCSE::runOnFunction(Function &F) {
Paul Robinsonaf4e64d2014-02-06 00:07:05 +0000572 if (skipOptnoneFunction(F))
573 return false;
574
Lenny Maiorani9eefc812014-09-20 13:29:20 +0000575 // Note, deque is being used here because there is significant performance gains
576 // over vector when the container becomes very large due to the specific access
577 // patterns. For more information see the mailing list discussion on this:
578 // http://lists.cs.uiuc.edu/pipermail/llvm-commits/Week-of-Mon-20120116/135228.html
579 std::deque<StackNode *> nodesToProcess;
Lenny Maiorani8d670b82012-01-31 23:14:41 +0000580
Rafael Espindola93512512014-02-25 17:30:31 +0000581 DataLayoutPass *DLP = getAnalysisIfAvailable<DataLayoutPass>();
Craig Topperf40110f2014-04-25 05:29:35 +0000582 DL = DLP ? &DLP->getDataLayout() : nullptr;
Chad Rosierc24b86f2011-12-01 03:08:23 +0000583 TLI = &getAnalysis<TargetLibraryInfo>();
Chandler Carruth73523022014-01-13 13:07:17 +0000584 DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
Hal Finkel60db0582014-09-07 18:57:58 +0000585 AT = &getAnalysis<AssumptionTracker>();
Nadav Rotem465834c2012-07-24 10:51:42 +0000586
Chris Lattner92bb0f92011-01-03 03:41:27 +0000587 // Tables that the pass uses when walking the domtree.
Chris Lattnerd815f692011-01-03 01:42:46 +0000588 ScopedHTType AVTable;
Chris Lattner18ae5432011-01-02 23:04:14 +0000589 AvailableValues = &AVTable;
Chris Lattner92bb0f92011-01-03 03:41:27 +0000590 LoadHTType LoadTable;
591 AvailableLoads = &LoadTable;
592 CallHTType CallTable;
593 AvailableCalls = &CallTable;
Nadav Rotem465834c2012-07-24 10:51:42 +0000594
Chris Lattnerb9a8efc2011-01-03 03:18:43 +0000595 CurrentGeneration = 0;
Lenny Maiorani8d670b82012-01-31 23:14:41 +0000596 bool Changed = false;
597
598 // Process the root node.
Michael Gottesman2bf01732013-12-05 18:42:12 +0000599 nodesToProcess.push_back(
Lenny Maiorani8d670b82012-01-31 23:14:41 +0000600 new StackNode(AvailableValues, AvailableLoads, AvailableCalls,
601 CurrentGeneration, DT->getRootNode(),
602 DT->getRootNode()->begin(),
603 DT->getRootNode()->end()));
604
605 // Save the current generation.
606 unsigned LiveOutGeneration = CurrentGeneration;
607
608 // Process the stack.
609 while (!nodesToProcess.empty()) {
610 // Grab the first item off the stack. Set the current generation, remove
611 // the node from the stack, and process it.
Michael Gottesman2bf01732013-12-05 18:42:12 +0000612 StackNode *NodeToProcess = nodesToProcess.back();
Lenny Maiorani8d670b82012-01-31 23:14:41 +0000613
614 // Initialize class members.
615 CurrentGeneration = NodeToProcess->currentGeneration();
616
617 // Check if the node needs to be processed.
618 if (!NodeToProcess->isProcessed()) {
619 // Process the node.
620 Changed |= processNode(NodeToProcess->node());
621 NodeToProcess->childGeneration(CurrentGeneration);
622 NodeToProcess->process();
623 } else if (NodeToProcess->childIter() != NodeToProcess->end()) {
624 // Push the next child onto the stack.
625 DomTreeNode *child = NodeToProcess->nextChild();
Michael Gottesman2bf01732013-12-05 18:42:12 +0000626 nodesToProcess.push_back(
Lenny Maiorani8d670b82012-01-31 23:14:41 +0000627 new StackNode(AvailableValues,
628 AvailableLoads,
629 AvailableCalls,
630 NodeToProcess->childGeneration(), child,
631 child->begin(), child->end()));
632 } else {
633 // It has been processed, and there are no more children to process,
634 // so delete it and pop it off the stack.
635 delete NodeToProcess;
Michael Gottesman2bf01732013-12-05 18:42:12 +0000636 nodesToProcess.pop_back();
Lenny Maiorani8d670b82012-01-31 23:14:41 +0000637 }
638 } // while (!nodes...)
639
640 // Reset the current generation.
641 CurrentGeneration = LiveOutGeneration;
642
643 return Changed;
Chris Lattner18ae5432011-01-02 23:04:14 +0000644}