blob: 5f953dfbb030d36c120be6ff4dbb5ab2f22f6882 [file] [log] [blame]
Chris Lattner159b98f2008-12-05 07:49:08 +00001//===- GVN.cpp - Eliminate redundant values and loads ---------------------===//
Owen Anderson85c40642007-07-24 17:55:58 +00002//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner081ce942007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Owen Anderson85c40642007-07-24 17:55:58 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This pass performs global value numbering to eliminate fully redundant
11// instructions. It also performs simple dead load elimination.
12//
John Criswell6e0aa282009-03-10 15:04:53 +000013// Note that this pass does the value numbering itself; it does not use the
Matthijs Kooijman9aac1db2008-06-05 07:55:49 +000014// ValueNumbering analysis passes.
15//
Owen Anderson85c40642007-07-24 17:55:58 +000016//===----------------------------------------------------------------------===//
17
18#define DEBUG_TYPE "gvn"
Owen Anderson85c40642007-07-24 17:55:58 +000019#include "llvm/Transforms/Scalar.h"
Owen Anderson5d72a422007-07-25 19:57:03 +000020#include "llvm/BasicBlock.h"
Owen Andersonacfa3ad2007-07-26 18:26:51 +000021#include "llvm/Constants.h"
Owen Anderson85c40642007-07-24 17:55:58 +000022#include "llvm/DerivedTypes.h"
Owen Andersonacfa3ad2007-07-26 18:26:51 +000023#include "llvm/Function.h"
Devang Patela7379552009-03-06 02:59:27 +000024#include "llvm/IntrinsicInst.h"
Owen Anderson24be4c12009-07-03 00:17:18 +000025#include "llvm/LLVMContext.h"
Chris Lattner0907b522009-09-21 05:57:11 +000026#include "llvm/Operator.h"
Owen Andersonacfa3ad2007-07-26 18:26:51 +000027#include "llvm/Value.h"
Owen Anderson85c40642007-07-24 17:55:58 +000028#include "llvm/ADT/DenseMap.h"
29#include "llvm/ADT/DepthFirstIterator.h"
Owen Andersona03e7862008-12-15 02:03:00 +000030#include "llvm/ADT/PostOrderIterator.h"
Owen Anderson85c40642007-07-24 17:55:58 +000031#include "llvm/ADT/SmallPtrSet.h"
32#include "llvm/ADT/SmallVector.h"
33#include "llvm/ADT/Statistic.h"
Owen Anderson5e9366f2007-10-18 19:39:33 +000034#include "llvm/Analysis/Dominators.h"
35#include "llvm/Analysis/AliasAnalysis.h"
Victor Hernandez48c3c542009-09-18 22:35:49 +000036#include "llvm/Analysis/MallocHelper.h"
Owen Anderson85c40642007-07-24 17:55:58 +000037#include "llvm/Analysis/MemoryDependenceAnalysis.h"
38#include "llvm/Support/CFG.h"
Owen Andersona2bf7662008-06-19 19:57:25 +000039#include "llvm/Support/CommandLine.h"
Chris Lattner9c5be3c2008-03-29 04:36:18 +000040#include "llvm/Support/Debug.h"
Edwin Török675d5622009-07-11 20:10:48 +000041#include "llvm/Support/ErrorHandling.h"
Chris Lattner0907b522009-09-21 05:57:11 +000042#include "llvm/Support/GetElementPtrTypeIterator.h"
Daniel Dunbar005975c2009-07-25 00:23:56 +000043#include "llvm/Support/raw_ostream.h"
Chris Lattner7741aa52009-09-20 19:03:47 +000044#include "llvm/Target/TargetData.h"
Owen Andersonec747c42008-06-19 19:54:19 +000045#include "llvm/Transforms/Utils/BasicBlockUtils.h"
Dale Johannesena19b67f2009-06-17 20:48:23 +000046#include "llvm/Transforms/Utils/Local.h"
Duncan Sands05f68372008-10-08 07:23:46 +000047#include <cstdio>
Owen Anderson85c40642007-07-24 17:55:58 +000048using namespace llvm;
49
Bill Wendling3858cae2008-12-22 22:14:07 +000050STATISTIC(NumGVNInstr, "Number of instructions deleted");
51STATISTIC(NumGVNLoad, "Number of loads deleted");
52STATISTIC(NumGVNPRE, "Number of instructions PRE'd");
Owen Anderson7558f202008-07-15 16:28:06 +000053STATISTIC(NumGVNBlocks, "Number of blocks merged");
Bill Wendling3858cae2008-12-22 22:14:07 +000054STATISTIC(NumPRELoad, "Number of loads PRE'd");
Chris Lattner1be83222008-03-22 04:13:49 +000055
Evan Cheng019a2e12008-06-20 01:01:07 +000056static cl::opt<bool> EnablePRE("enable-pre",
Owen Anderson3a053612008-07-17 19:41:00 +000057 cl::init(true), cl::Hidden);
Dan Gohman828f89f2009-06-15 18:30:15 +000058static cl::opt<bool> EnableLoadPRE("enable-load-pre", cl::init(true));
Owen Andersona2bf7662008-06-19 19:57:25 +000059
Owen Anderson85c40642007-07-24 17:55:58 +000060//===----------------------------------------------------------------------===//
61// ValueTable Class
62//===----------------------------------------------------------------------===//
63
64/// This class holds the mapping between values and value numbers. It is used
65/// as an efficient mechanism to determine the expression-wise equivalence of
66/// two values.
67namespace {
Chris Lattnerfa2d1ba2009-09-02 06:11:42 +000068 struct Expression {
Dan Gohman7ce405e2009-06-04 22:49:04 +000069 enum ExpressionOpcode { ADD, FADD, SUB, FSUB, MUL, FMUL,
70 UDIV, SDIV, FDIV, UREM, SREM,
Daniel Dunbar3be44e62009-09-20 02:20:51 +000071 FREM, SHL, LSHR, ASHR, AND, OR, XOR, ICMPEQ,
72 ICMPNE, ICMPUGT, ICMPUGE, ICMPULT, ICMPULE,
73 ICMPSGT, ICMPSGE, ICMPSLT, ICMPSLE, FCMPOEQ,
74 FCMPOGT, FCMPOGE, FCMPOLT, FCMPOLE, FCMPONE,
75 FCMPORD, FCMPUNO, FCMPUEQ, FCMPUGT, FCMPUGE,
Owen Anderson85c40642007-07-24 17:55:58 +000076 FCMPULT, FCMPULE, FCMPUNE, EXTRACT, INSERT,
77 SHUFFLE, SELECT, TRUNC, ZEXT, SEXT, FPTOUI,
Daniel Dunbar3be44e62009-09-20 02:20:51 +000078 FPTOSI, UITOFP, SITOFP, FPTRUNC, FPEXT,
Owen Anderson771d1122008-05-13 08:17:22 +000079 PTRTOINT, INTTOPTR, BITCAST, GEP, CALL, CONSTANT,
Owen Andersonb0cc5ed2008-06-19 17:25:39 +000080 EMPTY, TOMBSTONE };
Owen Anderson85c40642007-07-24 17:55:58 +000081
82 ExpressionOpcode opcode;
83 const Type* type;
84 uint32_t firstVN;
85 uint32_t secondVN;
86 uint32_t thirdVN;
87 SmallVector<uint32_t, 4> varargs;
Chris Lattnerff36c952009-09-21 02:42:51 +000088 Value *function;
Daniel Dunbar3be44e62009-09-20 02:20:51 +000089
Owen Anderson85c40642007-07-24 17:55:58 +000090 Expression() { }
91 Expression(ExpressionOpcode o) : opcode(o) { }
Daniel Dunbar3be44e62009-09-20 02:20:51 +000092
Owen Anderson85c40642007-07-24 17:55:58 +000093 bool operator==(const Expression &other) const {
94 if (opcode != other.opcode)
95 return false;
96 else if (opcode == EMPTY || opcode == TOMBSTONE)
97 return true;
98 else if (type != other.type)
99 return false;
Owen Anderson5e9366f2007-10-18 19:39:33 +0000100 else if (function != other.function)
101 return false;
Owen Anderson85c40642007-07-24 17:55:58 +0000102 else if (firstVN != other.firstVN)
103 return false;
104 else if (secondVN != other.secondVN)
105 return false;
106 else if (thirdVN != other.thirdVN)
107 return false;
108 else {
109 if (varargs.size() != other.varargs.size())
110 return false;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000111
Owen Anderson85c40642007-07-24 17:55:58 +0000112 for (size_t i = 0; i < varargs.size(); ++i)
113 if (varargs[i] != other.varargs[i])
114 return false;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000115
Owen Anderson85c40642007-07-24 17:55:58 +0000116 return true;
117 }
118 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000119
Owen Anderson85c40642007-07-24 17:55:58 +0000120 bool operator!=(const Expression &other) const {
Bill Wendling9b5d4b72008-12-22 22:16:31 +0000121 return !(*this == other);
Owen Anderson85c40642007-07-24 17:55:58 +0000122 }
123 };
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000124
Chris Lattnerfa2d1ba2009-09-02 06:11:42 +0000125 class ValueTable {
Owen Anderson85c40642007-07-24 17:55:58 +0000126 private:
127 DenseMap<Value*, uint32_t> valueNumbering;
128 DenseMap<Expression, uint32_t> expressionNumbering;
Owen Andersonbcf2bd52008-05-12 20:15:55 +0000129 AliasAnalysis* AA;
130 MemoryDependenceAnalysis* MD;
131 DominatorTree* DT;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000132
Owen Anderson85c40642007-07-24 17:55:58 +0000133 uint32_t nextValueNumber;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000134
Owen Anderson85c40642007-07-24 17:55:58 +0000135 Expression::ExpressionOpcode getOpcode(BinaryOperator* BO);
136 Expression::ExpressionOpcode getOpcode(CmpInst* C);
137 Expression::ExpressionOpcode getOpcode(CastInst* C);
138 Expression create_expression(BinaryOperator* BO);
139 Expression create_expression(CmpInst* C);
140 Expression create_expression(ShuffleVectorInst* V);
141 Expression create_expression(ExtractElementInst* C);
142 Expression create_expression(InsertElementInst* V);
143 Expression create_expression(SelectInst* V);
144 Expression create_expression(CastInst* C);
145 Expression create_expression(GetElementPtrInst* G);
Owen Anderson5e9366f2007-10-18 19:39:33 +0000146 Expression create_expression(CallInst* C);
Owen Anderson771d1122008-05-13 08:17:22 +0000147 Expression create_expression(Constant* C);
Owen Anderson85c40642007-07-24 17:55:58 +0000148 public:
Dan Gohman936a6522009-04-01 16:37:47 +0000149 ValueTable() : nextValueNumber(1) { }
Chris Lattnerff36c952009-09-21 02:42:51 +0000150 uint32_t lookup_or_add(Value *V);
151 uint32_t lookup(Value *V) const;
152 void add(Value *V, uint32_t num);
Owen Anderson85c40642007-07-24 17:55:58 +0000153 void clear();
Chris Lattnerff36c952009-09-21 02:42:51 +0000154 void erase(Value *v);
Owen Anderson85c40642007-07-24 17:55:58 +0000155 unsigned size();
Owen Andersonbcf2bd52008-05-12 20:15:55 +0000156 void setAliasAnalysis(AliasAnalysis* A) { AA = A; }
Chris Lattner02ca4422008-12-01 00:40:32 +0000157 AliasAnalysis *getAliasAnalysis() const { return AA; }
Owen Andersonbcf2bd52008-05-12 20:15:55 +0000158 void setMemDep(MemoryDependenceAnalysis* M) { MD = M; }
159 void setDomTree(DominatorTree* D) { DT = D; }
Owen Anderson8a8d13c2008-07-03 17:44:33 +0000160 uint32_t getNextUnusedValueNumber() { return nextValueNumber; }
Bill Wendling2a023742008-12-22 21:36:08 +0000161 void verifyRemoved(const Value *) const;
Owen Anderson85c40642007-07-24 17:55:58 +0000162 };
163}
164
165namespace llvm {
Chris Lattner92eea072007-09-17 18:34:04 +0000166template <> struct DenseMapInfo<Expression> {
Owen Andersonbf8a3eb2007-08-02 18:16:06 +0000167 static inline Expression getEmptyKey() {
168 return Expression(Expression::EMPTY);
169 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000170
Owen Andersonbf8a3eb2007-08-02 18:16:06 +0000171 static inline Expression getTombstoneKey() {
172 return Expression(Expression::TOMBSTONE);
173 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000174
Owen Anderson85c40642007-07-24 17:55:58 +0000175 static unsigned getHashValue(const Expression e) {
176 unsigned hash = e.opcode;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000177
Owen Anderson85c40642007-07-24 17:55:58 +0000178 hash = e.firstVN + hash * 37;
179 hash = e.secondVN + hash * 37;
180 hash = e.thirdVN + hash * 37;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000181
Anton Korobeynikov8522e1c2008-02-20 11:26:25 +0000182 hash = ((unsigned)((uintptr_t)e.type >> 4) ^
183 (unsigned)((uintptr_t)e.type >> 9)) +
184 hash * 37;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000185
Owen Andersonbf8a3eb2007-08-02 18:16:06 +0000186 for (SmallVector<uint32_t, 4>::const_iterator I = e.varargs.begin(),
187 E = e.varargs.end(); I != E; ++I)
Owen Anderson85c40642007-07-24 17:55:58 +0000188 hash = *I + hash * 37;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000189
Anton Korobeynikov8522e1c2008-02-20 11:26:25 +0000190 hash = ((unsigned)((uintptr_t)e.function >> 4) ^
191 (unsigned)((uintptr_t)e.function >> 9)) +
192 hash * 37;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000193
Owen Anderson85c40642007-07-24 17:55:58 +0000194 return hash;
195 }
Chris Lattner92eea072007-09-17 18:34:04 +0000196 static bool isEqual(const Expression &LHS, const Expression &RHS) {
197 return LHS == RHS;
198 }
Owen Anderson85c40642007-07-24 17:55:58 +0000199 static bool isPod() { return true; }
200};
201}
202
203//===----------------------------------------------------------------------===//
204// ValueTable Internal Functions
205//===----------------------------------------------------------------------===//
Chris Lattner3d7103e2008-03-21 21:14:38 +0000206Expression::ExpressionOpcode ValueTable::getOpcode(BinaryOperator* BO) {
Owen Anderson85c40642007-07-24 17:55:58 +0000207 switch(BO->getOpcode()) {
Chris Lattner3d7103e2008-03-21 21:14:38 +0000208 default: // THIS SHOULD NEVER HAPPEN
Edwin Törökbd448e32009-07-14 16:55:14 +0000209 llvm_unreachable("Binary operator with unknown opcode?");
Chris Lattner3d7103e2008-03-21 21:14:38 +0000210 case Instruction::Add: return Expression::ADD;
Dan Gohman7ce405e2009-06-04 22:49:04 +0000211 case Instruction::FAdd: return Expression::FADD;
Chris Lattner3d7103e2008-03-21 21:14:38 +0000212 case Instruction::Sub: return Expression::SUB;
Dan Gohman7ce405e2009-06-04 22:49:04 +0000213 case Instruction::FSub: return Expression::FSUB;
Chris Lattner3d7103e2008-03-21 21:14:38 +0000214 case Instruction::Mul: return Expression::MUL;
Dan Gohman7ce405e2009-06-04 22:49:04 +0000215 case Instruction::FMul: return Expression::FMUL;
Chris Lattner3d7103e2008-03-21 21:14:38 +0000216 case Instruction::UDiv: return Expression::UDIV;
217 case Instruction::SDiv: return Expression::SDIV;
218 case Instruction::FDiv: return Expression::FDIV;
219 case Instruction::URem: return Expression::UREM;
220 case Instruction::SRem: return Expression::SREM;
221 case Instruction::FRem: return Expression::FREM;
222 case Instruction::Shl: return Expression::SHL;
223 case Instruction::LShr: return Expression::LSHR;
224 case Instruction::AShr: return Expression::ASHR;
225 case Instruction::And: return Expression::AND;
226 case Instruction::Or: return Expression::OR;
227 case Instruction::Xor: return Expression::XOR;
Owen Anderson85c40642007-07-24 17:55:58 +0000228 }
229}
230
231Expression::ExpressionOpcode ValueTable::getOpcode(CmpInst* C) {
Nick Lewycky8f5253b2009-07-08 03:04:38 +0000232 if (isa<ICmpInst>(C)) {
Owen Anderson85c40642007-07-24 17:55:58 +0000233 switch (C->getPredicate()) {
Chris Lattner3d7103e2008-03-21 21:14:38 +0000234 default: // THIS SHOULD NEVER HAPPEN
Edwin Törökbd448e32009-07-14 16:55:14 +0000235 llvm_unreachable("Comparison with unknown predicate?");
Chris Lattner3d7103e2008-03-21 21:14:38 +0000236 case ICmpInst::ICMP_EQ: return Expression::ICMPEQ;
237 case ICmpInst::ICMP_NE: return Expression::ICMPNE;
238 case ICmpInst::ICMP_UGT: return Expression::ICMPUGT;
239 case ICmpInst::ICMP_UGE: return Expression::ICMPUGE;
240 case ICmpInst::ICMP_ULT: return Expression::ICMPULT;
241 case ICmpInst::ICMP_ULE: return Expression::ICMPULE;
242 case ICmpInst::ICMP_SGT: return Expression::ICMPSGT;
243 case ICmpInst::ICMP_SGE: return Expression::ICMPSGE;
244 case ICmpInst::ICMP_SLT: return Expression::ICMPSLT;
245 case ICmpInst::ICMP_SLE: return Expression::ICMPSLE;
Owen Anderson85c40642007-07-24 17:55:58 +0000246 }
Nick Lewycky8f5253b2009-07-08 03:04:38 +0000247 } else {
248 switch (C->getPredicate()) {
249 default: // THIS SHOULD NEVER HAPPEN
Edwin Törökbd448e32009-07-14 16:55:14 +0000250 llvm_unreachable("Comparison with unknown predicate?");
Nick Lewycky8f5253b2009-07-08 03:04:38 +0000251 case FCmpInst::FCMP_OEQ: return Expression::FCMPOEQ;
252 case FCmpInst::FCMP_OGT: return Expression::FCMPOGT;
253 case FCmpInst::FCMP_OGE: return Expression::FCMPOGE;
254 case FCmpInst::FCMP_OLT: return Expression::FCMPOLT;
255 case FCmpInst::FCMP_OLE: return Expression::FCMPOLE;
256 case FCmpInst::FCMP_ONE: return Expression::FCMPONE;
257 case FCmpInst::FCMP_ORD: return Expression::FCMPORD;
258 case FCmpInst::FCMP_UNO: return Expression::FCMPUNO;
259 case FCmpInst::FCMP_UEQ: return Expression::FCMPUEQ;
260 case FCmpInst::FCMP_UGT: return Expression::FCMPUGT;
261 case FCmpInst::FCMP_UGE: return Expression::FCMPUGE;
262 case FCmpInst::FCMP_ULT: return Expression::FCMPULT;
263 case FCmpInst::FCMP_ULE: return Expression::FCMPULE;
264 case FCmpInst::FCMP_UNE: return Expression::FCMPUNE;
265 }
Owen Anderson85c40642007-07-24 17:55:58 +0000266 }
267}
268
Chris Lattner3d7103e2008-03-21 21:14:38 +0000269Expression::ExpressionOpcode ValueTable::getOpcode(CastInst* C) {
Owen Anderson85c40642007-07-24 17:55:58 +0000270 switch(C->getOpcode()) {
Chris Lattner3d7103e2008-03-21 21:14:38 +0000271 default: // THIS SHOULD NEVER HAPPEN
Edwin Törökbd448e32009-07-14 16:55:14 +0000272 llvm_unreachable("Cast operator with unknown opcode?");
Chris Lattner3d7103e2008-03-21 21:14:38 +0000273 case Instruction::Trunc: return Expression::TRUNC;
274 case Instruction::ZExt: return Expression::ZEXT;
275 case Instruction::SExt: return Expression::SEXT;
276 case Instruction::FPToUI: return Expression::FPTOUI;
277 case Instruction::FPToSI: return Expression::FPTOSI;
278 case Instruction::UIToFP: return Expression::UITOFP;
279 case Instruction::SIToFP: return Expression::SITOFP;
280 case Instruction::FPTrunc: return Expression::FPTRUNC;
281 case Instruction::FPExt: return Expression::FPEXT;
282 case Instruction::PtrToInt: return Expression::PTRTOINT;
283 case Instruction::IntToPtr: return Expression::INTTOPTR;
284 case Instruction::BitCast: return Expression::BITCAST;
Owen Anderson85c40642007-07-24 17:55:58 +0000285 }
286}
287
Owen Anderson5e9366f2007-10-18 19:39:33 +0000288Expression ValueTable::create_expression(CallInst* C) {
289 Expression e;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000290
Owen Anderson5e9366f2007-10-18 19:39:33 +0000291 e.type = C->getType();
292 e.firstVN = 0;
293 e.secondVN = 0;
294 e.thirdVN = 0;
295 e.function = C->getCalledFunction();
296 e.opcode = Expression::CALL;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000297
Owen Anderson5e9366f2007-10-18 19:39:33 +0000298 for (CallInst::op_iterator I = C->op_begin()+1, E = C->op_end();
299 I != E; ++I)
Owen Anderson07f478f2008-04-11 05:11:49 +0000300 e.varargs.push_back(lookup_or_add(*I));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000301
Owen Anderson5e9366f2007-10-18 19:39:33 +0000302 return e;
303}
304
Owen Anderson85c40642007-07-24 17:55:58 +0000305Expression ValueTable::create_expression(BinaryOperator* BO) {
306 Expression e;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000307
Owen Anderson07f478f2008-04-11 05:11:49 +0000308 e.firstVN = lookup_or_add(BO->getOperand(0));
309 e.secondVN = lookup_or_add(BO->getOperand(1));
Owen Anderson85c40642007-07-24 17:55:58 +0000310 e.thirdVN = 0;
Owen Anderson5e9366f2007-10-18 19:39:33 +0000311 e.function = 0;
Owen Anderson85c40642007-07-24 17:55:58 +0000312 e.type = BO->getType();
313 e.opcode = getOpcode(BO);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000314
Owen Anderson85c40642007-07-24 17:55:58 +0000315 return e;
316}
317
318Expression ValueTable::create_expression(CmpInst* C) {
319 Expression e;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000320
Owen Anderson07f478f2008-04-11 05:11:49 +0000321 e.firstVN = lookup_or_add(C->getOperand(0));
322 e.secondVN = lookup_or_add(C->getOperand(1));
Owen Anderson85c40642007-07-24 17:55:58 +0000323 e.thirdVN = 0;
Owen Anderson5e9366f2007-10-18 19:39:33 +0000324 e.function = 0;
Owen Anderson85c40642007-07-24 17:55:58 +0000325 e.type = C->getType();
326 e.opcode = getOpcode(C);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000327
Owen Anderson85c40642007-07-24 17:55:58 +0000328 return e;
329}
330
331Expression ValueTable::create_expression(CastInst* C) {
332 Expression e;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000333
Owen Anderson07f478f2008-04-11 05:11:49 +0000334 e.firstVN = lookup_or_add(C->getOperand(0));
Owen Anderson85c40642007-07-24 17:55:58 +0000335 e.secondVN = 0;
336 e.thirdVN = 0;
Owen Anderson5e9366f2007-10-18 19:39:33 +0000337 e.function = 0;
Owen Anderson85c40642007-07-24 17:55:58 +0000338 e.type = C->getType();
339 e.opcode = getOpcode(C);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000340
Owen Anderson85c40642007-07-24 17:55:58 +0000341 return e;
342}
343
344Expression ValueTable::create_expression(ShuffleVectorInst* S) {
345 Expression e;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000346
Owen Anderson07f478f2008-04-11 05:11:49 +0000347 e.firstVN = lookup_or_add(S->getOperand(0));
348 e.secondVN = lookup_or_add(S->getOperand(1));
349 e.thirdVN = lookup_or_add(S->getOperand(2));
Owen Anderson5e9366f2007-10-18 19:39:33 +0000350 e.function = 0;
Owen Anderson85c40642007-07-24 17:55:58 +0000351 e.type = S->getType();
352 e.opcode = Expression::SHUFFLE;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000353
Owen Anderson85c40642007-07-24 17:55:58 +0000354 return e;
355}
356
357Expression ValueTable::create_expression(ExtractElementInst* E) {
358 Expression e;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000359
Owen Anderson07f478f2008-04-11 05:11:49 +0000360 e.firstVN = lookup_or_add(E->getOperand(0));
361 e.secondVN = lookup_or_add(E->getOperand(1));
Owen Anderson85c40642007-07-24 17:55:58 +0000362 e.thirdVN = 0;
Owen Anderson5e9366f2007-10-18 19:39:33 +0000363 e.function = 0;
Owen Anderson85c40642007-07-24 17:55:58 +0000364 e.type = E->getType();
365 e.opcode = Expression::EXTRACT;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000366
Owen Anderson85c40642007-07-24 17:55:58 +0000367 return e;
368}
369
370Expression ValueTable::create_expression(InsertElementInst* I) {
371 Expression e;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000372
Owen Anderson07f478f2008-04-11 05:11:49 +0000373 e.firstVN = lookup_or_add(I->getOperand(0));
374 e.secondVN = lookup_or_add(I->getOperand(1));
375 e.thirdVN = lookup_or_add(I->getOperand(2));
Owen Anderson5e9366f2007-10-18 19:39:33 +0000376 e.function = 0;
Owen Anderson85c40642007-07-24 17:55:58 +0000377 e.type = I->getType();
378 e.opcode = Expression::INSERT;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000379
Owen Anderson85c40642007-07-24 17:55:58 +0000380 return e;
381}
382
383Expression ValueTable::create_expression(SelectInst* I) {
384 Expression e;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000385
Owen Anderson07f478f2008-04-11 05:11:49 +0000386 e.firstVN = lookup_or_add(I->getCondition());
387 e.secondVN = lookup_or_add(I->getTrueValue());
388 e.thirdVN = lookup_or_add(I->getFalseValue());
Owen Anderson5e9366f2007-10-18 19:39:33 +0000389 e.function = 0;
Owen Anderson85c40642007-07-24 17:55:58 +0000390 e.type = I->getType();
391 e.opcode = Expression::SELECT;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000392
Owen Anderson85c40642007-07-24 17:55:58 +0000393 return e;
394}
395
396Expression ValueTable::create_expression(GetElementPtrInst* G) {
397 Expression e;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000398
Owen Anderson07f478f2008-04-11 05:11:49 +0000399 e.firstVN = lookup_or_add(G->getPointerOperand());
Owen Anderson85c40642007-07-24 17:55:58 +0000400 e.secondVN = 0;
401 e.thirdVN = 0;
Owen Anderson5e9366f2007-10-18 19:39:33 +0000402 e.function = 0;
Owen Anderson85c40642007-07-24 17:55:58 +0000403 e.type = G->getType();
404 e.opcode = Expression::GEP;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000405
Owen Anderson85c40642007-07-24 17:55:58 +0000406 for (GetElementPtrInst::op_iterator I = G->idx_begin(), E = G->idx_end();
407 I != E; ++I)
Owen Anderson07f478f2008-04-11 05:11:49 +0000408 e.varargs.push_back(lookup_or_add(*I));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000409
Owen Anderson85c40642007-07-24 17:55:58 +0000410 return e;
411}
412
413//===----------------------------------------------------------------------===//
414// ValueTable External Functions
415//===----------------------------------------------------------------------===//
416
Owen Andersone6b4ff82008-06-18 21:41:49 +0000417/// add - Insert a value into the table with a specified value number.
Chris Lattnerff36c952009-09-21 02:42:51 +0000418void ValueTable::add(Value *V, uint32_t num) {
Owen Andersone6b4ff82008-06-18 21:41:49 +0000419 valueNumbering.insert(std::make_pair(V, num));
420}
421
Owen Anderson85c40642007-07-24 17:55:58 +0000422/// lookup_or_add - Returns the value number for the specified value, assigning
423/// it a new number if it did not have one before.
Chris Lattnerff36c952009-09-21 02:42:51 +0000424uint32_t ValueTable::lookup_or_add(Value *V) {
Owen Anderson85c40642007-07-24 17:55:58 +0000425 DenseMap<Value*, uint32_t>::iterator VI = valueNumbering.find(V);
426 if (VI != valueNumbering.end())
427 return VI->second;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000428
Owen Anderson5e9366f2007-10-18 19:39:33 +0000429 if (CallInst* C = dyn_cast<CallInst>(V)) {
Owen Anderson07f478f2008-04-11 05:11:49 +0000430 if (AA->doesNotAccessMemory(C)) {
Owen Anderson5e9366f2007-10-18 19:39:33 +0000431 Expression e = create_expression(C);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000432
Owen Anderson5e9366f2007-10-18 19:39:33 +0000433 DenseMap<Expression, uint32_t>::iterator EI = expressionNumbering.find(e);
434 if (EI != expressionNumbering.end()) {
435 valueNumbering.insert(std::make_pair(V, EI->second));
436 return EI->second;
437 } else {
438 expressionNumbering.insert(std::make_pair(e, nextValueNumber));
439 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000440
Owen Anderson5e9366f2007-10-18 19:39:33 +0000441 return nextValueNumber++;
442 }
Owen Andersona0b2b8e2008-04-17 05:36:50 +0000443 } else if (AA->onlyReadsMemory(C)) {
444 Expression e = create_expression(C);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000445
Owen Anderson771d1122008-05-13 08:17:22 +0000446 if (expressionNumbering.find(e) == expressionNumbering.end()) {
Owen Andersona0b2b8e2008-04-17 05:36:50 +0000447 expressionNumbering.insert(std::make_pair(e, nextValueNumber));
448 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Owen Anderson771d1122008-05-13 08:17:22 +0000449 return nextValueNumber++;
450 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000451
Chris Lattner12cafbf2008-11-29 02:29:27 +0000452 MemDepResult local_dep = MD->getDependency(C);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000453
Chris Lattner4531da82008-12-05 21:04:20 +0000454 if (!local_dep.isDef() && !local_dep.isNonLocal()) {
Owen Anderson64fcc592008-05-13 23:18:30 +0000455 valueNumbering.insert(std::make_pair(V, nextValueNumber));
456 return nextValueNumber++;
Chris Lattnerd33b6662008-11-30 23:39:23 +0000457 }
Chris Lattner4531da82008-12-05 21:04:20 +0000458
459 if (local_dep.isDef()) {
460 CallInst* local_cdep = cast<CallInst>(local_dep.getInst());
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000461
Chris Lattner4531da82008-12-05 21:04:20 +0000462 if (local_cdep->getNumOperands() != C->getNumOperands()) {
Owen Anderson64fcc592008-05-13 23:18:30 +0000463 valueNumbering.insert(std::make_pair(V, nextValueNumber));
464 return nextValueNumber++;
465 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000466
Chris Lattnerd33b6662008-11-30 23:39:23 +0000467 for (unsigned i = 1; i < C->getNumOperands(); ++i) {
468 uint32_t c_vn = lookup_or_add(C->getOperand(i));
469 uint32_t cd_vn = lookup_or_add(local_cdep->getOperand(i));
470 if (c_vn != cd_vn) {
471 valueNumbering.insert(std::make_pair(V, nextValueNumber));
472 return nextValueNumber++;
473 }
474 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000475
Chris Lattnerd33b6662008-11-30 23:39:23 +0000476 uint32_t v = lookup_or_add(local_cdep);
477 valueNumbering.insert(std::make_pair(V, v));
478 return v;
Owen Anderson64fcc592008-05-13 23:18:30 +0000479 }
Chris Lattner46876282008-12-01 01:15:42 +0000480
Chris Lattner4531da82008-12-05 21:04:20 +0000481 // Non-local case.
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000482 const MemoryDependenceAnalysis::NonLocalDepInfo &deps =
Chris Lattner35d5cf52008-12-09 19:38:05 +0000483 MD->getNonLocalCallDependency(CallSite(C));
Chris Lattner4531da82008-12-05 21:04:20 +0000484 // FIXME: call/call dependencies for readonly calls should return def, not
485 // clobber! Move the checking logic to MemDep!
Owen Anderson3ebaca72008-05-13 13:41:23 +0000486 CallInst* cdep = 0;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000487
Chris Lattnerd33b6662008-11-30 23:39:23 +0000488 // Check to see if we have a single dominating call instruction that is
489 // identical to C.
Chris Lattner46876282008-12-01 01:15:42 +0000490 for (unsigned i = 0, e = deps.size(); i != e; ++i) {
491 const MemoryDependenceAnalysis::NonLocalDepEntry *I = &deps[i];
Chris Lattnerd33b6662008-11-30 23:39:23 +0000492 // Ignore non-local dependencies.
493 if (I->second.isNonLocal())
494 continue;
Owen Anderson771d1122008-05-13 08:17:22 +0000495
Chris Lattnerd33b6662008-11-30 23:39:23 +0000496 // We don't handle non-depedencies. If we already have a call, reject
497 // instruction dependencies.
Chris Lattner4531da82008-12-05 21:04:20 +0000498 if (I->second.isClobber() || cdep != 0) {
Chris Lattnerd33b6662008-11-30 23:39:23 +0000499 cdep = 0;
500 break;
Owen Anderson771d1122008-05-13 08:17:22 +0000501 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000502
Chris Lattnerd33b6662008-11-30 23:39:23 +0000503 CallInst *NonLocalDepCall = dyn_cast<CallInst>(I->second.getInst());
504 // FIXME: All duplicated with non-local case.
505 if (NonLocalDepCall && DT->properlyDominates(I->first, C->getParent())){
506 cdep = NonLocalDepCall;
507 continue;
508 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000509
Chris Lattnerd33b6662008-11-30 23:39:23 +0000510 cdep = 0;
511 break;
Owen Anderson771d1122008-05-13 08:17:22 +0000512 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000513
Owen Anderson3ebaca72008-05-13 13:41:23 +0000514 if (!cdep) {
Owen Anderson771d1122008-05-13 08:17:22 +0000515 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Owen Andersona0b2b8e2008-04-17 05:36:50 +0000516 return nextValueNumber++;
517 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000518
Chris Lattner4531da82008-12-05 21:04:20 +0000519 if (cdep->getNumOperands() != C->getNumOperands()) {
Owen Anderson771d1122008-05-13 08:17:22 +0000520 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Owen Andersona0b2b8e2008-04-17 05:36:50 +0000521 return nextValueNumber++;
Owen Andersona0b2b8e2008-04-17 05:36:50 +0000522 }
Chris Lattnerd33b6662008-11-30 23:39:23 +0000523 for (unsigned i = 1; i < C->getNumOperands(); ++i) {
524 uint32_t c_vn = lookup_or_add(C->getOperand(i));
525 uint32_t cd_vn = lookup_or_add(cdep->getOperand(i));
526 if (c_vn != cd_vn) {
527 valueNumbering.insert(std::make_pair(V, nextValueNumber));
528 return nextValueNumber++;
529 }
530 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000531
Chris Lattnerd33b6662008-11-30 23:39:23 +0000532 uint32_t v = lookup_or_add(cdep);
533 valueNumbering.insert(std::make_pair(V, v));
534 return v;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000535
Owen Anderson5e9366f2007-10-18 19:39:33 +0000536 } else {
537 valueNumbering.insert(std::make_pair(V, nextValueNumber));
538 return nextValueNumber++;
539 }
540 } else if (BinaryOperator* BO = dyn_cast<BinaryOperator>(V)) {
Owen Anderson85c40642007-07-24 17:55:58 +0000541 Expression e = create_expression(BO);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000542
Owen Anderson85c40642007-07-24 17:55:58 +0000543 DenseMap<Expression, uint32_t>::iterator EI = expressionNumbering.find(e);
544 if (EI != expressionNumbering.end()) {
545 valueNumbering.insert(std::make_pair(V, EI->second));
546 return EI->second;
547 } else {
548 expressionNumbering.insert(std::make_pair(e, nextValueNumber));
549 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000550
Owen Anderson85c40642007-07-24 17:55:58 +0000551 return nextValueNumber++;
552 }
553 } else if (CmpInst* C = dyn_cast<CmpInst>(V)) {
554 Expression e = create_expression(C);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000555
Owen Anderson85c40642007-07-24 17:55:58 +0000556 DenseMap<Expression, uint32_t>::iterator EI = expressionNumbering.find(e);
557 if (EI != expressionNumbering.end()) {
558 valueNumbering.insert(std::make_pair(V, EI->second));
559 return EI->second;
560 } else {
561 expressionNumbering.insert(std::make_pair(e, nextValueNumber));
562 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000563
Owen Anderson85c40642007-07-24 17:55:58 +0000564 return nextValueNumber++;
565 }
566 } else if (ShuffleVectorInst* U = dyn_cast<ShuffleVectorInst>(V)) {
567 Expression e = create_expression(U);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000568
Owen Anderson85c40642007-07-24 17:55:58 +0000569 DenseMap<Expression, uint32_t>::iterator EI = expressionNumbering.find(e);
570 if (EI != expressionNumbering.end()) {
571 valueNumbering.insert(std::make_pair(V, EI->second));
572 return EI->second;
573 } else {
574 expressionNumbering.insert(std::make_pair(e, nextValueNumber));
575 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000576
Owen Anderson85c40642007-07-24 17:55:58 +0000577 return nextValueNumber++;
578 }
579 } else if (ExtractElementInst* U = dyn_cast<ExtractElementInst>(V)) {
580 Expression e = create_expression(U);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000581
Owen Anderson85c40642007-07-24 17:55:58 +0000582 DenseMap<Expression, uint32_t>::iterator EI = expressionNumbering.find(e);
583 if (EI != expressionNumbering.end()) {
584 valueNumbering.insert(std::make_pair(V, EI->second));
585 return EI->second;
586 } else {
587 expressionNumbering.insert(std::make_pair(e, nextValueNumber));
588 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000589
Owen Anderson85c40642007-07-24 17:55:58 +0000590 return nextValueNumber++;
591 }
592 } else if (InsertElementInst* U = dyn_cast<InsertElementInst>(V)) {
593 Expression e = create_expression(U);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000594
Owen Anderson85c40642007-07-24 17:55:58 +0000595 DenseMap<Expression, uint32_t>::iterator EI = expressionNumbering.find(e);
596 if (EI != expressionNumbering.end()) {
597 valueNumbering.insert(std::make_pair(V, EI->second));
598 return EI->second;
599 } else {
600 expressionNumbering.insert(std::make_pair(e, nextValueNumber));
601 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000602
Owen Anderson85c40642007-07-24 17:55:58 +0000603 return nextValueNumber++;
604 }
605 } else if (SelectInst* U = dyn_cast<SelectInst>(V)) {
606 Expression e = create_expression(U);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000607
Owen Anderson85c40642007-07-24 17:55:58 +0000608 DenseMap<Expression, uint32_t>::iterator EI = expressionNumbering.find(e);
609 if (EI != expressionNumbering.end()) {
610 valueNumbering.insert(std::make_pair(V, EI->second));
611 return EI->second;
612 } else {
613 expressionNumbering.insert(std::make_pair(e, nextValueNumber));
614 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000615
Owen Anderson85c40642007-07-24 17:55:58 +0000616 return nextValueNumber++;
617 }
618 } else if (CastInst* U = dyn_cast<CastInst>(V)) {
619 Expression e = create_expression(U);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000620
Owen Anderson85c40642007-07-24 17:55:58 +0000621 DenseMap<Expression, uint32_t>::iterator EI = expressionNumbering.find(e);
622 if (EI != expressionNumbering.end()) {
623 valueNumbering.insert(std::make_pair(V, EI->second));
624 return EI->second;
625 } else {
626 expressionNumbering.insert(std::make_pair(e, nextValueNumber));
627 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000628
Owen Anderson85c40642007-07-24 17:55:58 +0000629 return nextValueNumber++;
630 }
631 } else if (GetElementPtrInst* U = dyn_cast<GetElementPtrInst>(V)) {
632 Expression e = create_expression(U);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000633
Owen Anderson85c40642007-07-24 17:55:58 +0000634 DenseMap<Expression, uint32_t>::iterator EI = expressionNumbering.find(e);
635 if (EI != expressionNumbering.end()) {
636 valueNumbering.insert(std::make_pair(V, EI->second));
637 return EI->second;
638 } else {
639 expressionNumbering.insert(std::make_pair(e, nextValueNumber));
640 valueNumbering.insert(std::make_pair(V, nextValueNumber));
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000641
Owen Anderson85c40642007-07-24 17:55:58 +0000642 return nextValueNumber++;
643 }
644 } else {
645 valueNumbering.insert(std::make_pair(V, nextValueNumber));
646 return nextValueNumber++;
647 }
648}
649
650/// lookup - Returns the value number of the specified value. Fails if
651/// the value has not yet been numbered.
Chris Lattnerff36c952009-09-21 02:42:51 +0000652uint32_t ValueTable::lookup(Value *V) const {
Owen Anderson85c40642007-07-24 17:55:58 +0000653 DenseMap<Value*, uint32_t>::iterator VI = valueNumbering.find(V);
Chris Lattner3d7103e2008-03-21 21:14:38 +0000654 assert(VI != valueNumbering.end() && "Value not numbered?");
655 return VI->second;
Owen Anderson85c40642007-07-24 17:55:58 +0000656}
657
658/// clear - Remove all entries from the ValueTable
659void ValueTable::clear() {
660 valueNumbering.clear();
661 expressionNumbering.clear();
662 nextValueNumber = 1;
663}
664
/// erase - Remove a value from the value numbering.
/// Only the valueNumbering map is modified here; expressionNumbering is left
/// untouched.
void ValueTable::erase(Value *V) {
  valueNumbering.erase(V);
}
669
Bill Wendling2a023742008-12-22 21:36:08 +0000670/// verifyRemoved - Verify that the value is removed from all internal data
671/// structures.
672void ValueTable::verifyRemoved(const Value *V) const {
673 for (DenseMap<Value*, uint32_t>::iterator
674 I = valueNumbering.begin(), E = valueNumbering.end(); I != E; ++I) {
675 assert(I->first != V && "Inst still occurs in value numbering map!");
676 }
677}
678
Owen Anderson85c40642007-07-24 17:55:58 +0000679//===----------------------------------------------------------------------===//
Bill Wendling42f17f62008-12-22 22:32:22 +0000680// GVN Pass
Owen Anderson85c40642007-07-24 17:55:58 +0000681//===----------------------------------------------------------------------===//
682
683namespace {
Chris Lattnerfa2d1ba2009-09-02 06:11:42 +0000684 struct ValueNumberScope {
Owen Anderson2a412722008-06-20 01:15:47 +0000685 ValueNumberScope* parent;
686 DenseMap<uint32_t, Value*> table;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000687
Owen Anderson2a412722008-06-20 01:15:47 +0000688 ValueNumberScope(ValueNumberScope* p) : parent(p) { }
689 };
690}
691
namespace {

  /// GVN - Function pass declared in this file.  Per the file header it
  /// performs global value numbering to eliminate fully redundant
  /// instructions and does simple dead load elimination.
  class GVN : public FunctionPass {
    // Pass entry point; declared before the 'public:' label, so it is private
    // to this class.
    bool runOnFunction(Function &F);
  public:
    static char ID; // Pass identification, replacement for typeid
    GVN() : FunctionPass(&ID) { }

  private:
    // Analyses used by the helpers below.  They are not assigned anywhere in
    // this declaration; presumably runOnFunction sets them -- confirm there.
    MemoryDependenceAnalysis *MD;
    DominatorTree *DT;

    // Value numbering table used by this pass.
    ValueTable VN;
    // One ValueNumberScope per basic block.
    DenseMap<BasicBlock*, ValueNumberScope*> localAvail;

    // Cache of PHI nodes created by GetValueForBlock.  The key is the pointer
    // operand when the original instruction is a load, otherwise the original
    // instruction itself.
    typedef DenseMap<Value*, SmallPtrSet<Instruction*, 4> > PhiMapType;
    PhiMapType phiMap;


    // This transformation requires the dominator tree, memory dependence
    // analysis and alias analysis; it preserves the dominator tree and alias
    // analysis.
    virtual void getAnalysisUsage(AnalysisUsage &AU) const {
      AU.addRequired<DominatorTree>();
      AU.addRequired<MemoryDependenceAnalysis>();
      AU.addRequired<AliasAnalysis>();

      AU.addPreserved<DominatorTree>();
      AU.addPreserved<AliasAnalysis>();
    }

    // Helper functions
    // FIXME: eliminate or document these better
    bool processLoad(LoadInst* L,
                     SmallVectorImpl<Instruction*> &toErase);
    bool processInstruction(Instruction *I,
                            SmallVectorImpl<Instruction*> &toErase);
    bool processNonLocalLoad(LoadInst* L,
                             SmallVectorImpl<Instruction*> &toErase);
    bool processBlock(BasicBlock *BB);
    Value *GetValueForBlock(BasicBlock *BB, Instruction *orig,
                            DenseMap<BasicBlock*, Value*> &Phis,
                            bool top_level = false);
    void dump(DenseMap<uint32_t, Value*>& d);
    bool iterateOnFunction(Function &F);
    Value *CollapsePhi(PHINode* p);
    bool performPRE(Function& F);
    Value *lookupNumber(BasicBlock *BB, uint32_t num);
    Value *AttemptRedundancyElimination(Instruction *orig, unsigned valno);
    void cleanupGlobalSets();
    void verifyRemoved(const Instruction *I) const;
  };

  // Storage for the pass identifier; FunctionPass is given its address.
  char GVN::ID = 0;
}
745
746// createGVNPass - The public interface to this file...
747FunctionPass *llvm::createGVNPass() { return new GVN(); }
748
// Static registration object for the GVN pass: argument string "gvn",
// descriptive name "Global Value Numbering".
static RegisterPass<GVN> X("gvn",
                           "Global Value Numbering");
751
Owen Andersone6b4ff82008-06-18 21:41:49 +0000752void GVN::dump(DenseMap<uint32_t, Value*>& d) {
Owen Anderson5d72a422007-07-25 19:57:03 +0000753 printf("{\n");
Owen Andersone6b4ff82008-06-18 21:41:49 +0000754 for (DenseMap<uint32_t, Value*>::iterator I = d.begin(),
Owen Anderson5d72a422007-07-25 19:57:03 +0000755 E = d.end(); I != E; ++I) {
Owen Andersone6b4ff82008-06-18 21:41:49 +0000756 printf("%d\n", I->first);
Owen Anderson5d72a422007-07-25 19:57:03 +0000757 I->second->dump();
758 }
759 printf("}\n");
760}
761
Chris Lattnerff36c952009-09-21 02:42:51 +0000762static bool isSafeReplacement(PHINode* p, Instruction *inst) {
Owen Andersond68b1af2009-08-26 22:55:11 +0000763 if (!isa<PHINode>(inst))
764 return true;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000765
Owen Andersond68b1af2009-08-26 22:55:11 +0000766 for (Instruction::use_iterator UI = p->use_begin(), E = p->use_end();
767 UI != E; ++UI)
768 if (PHINode* use_phi = dyn_cast<PHINode>(UI))
769 if (use_phi->getParent() == inst->getParent())
770 return false;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000771
Owen Andersond68b1af2009-08-26 22:55:11 +0000772 return true;
773}
774
Chris Lattnerff36c952009-09-21 02:42:51 +0000775Value *GVN::CollapsePhi(PHINode *PN) {
776 Value *ConstVal = PN->hasConstantValue(DT);
777 if (!ConstVal) return 0;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000778
Chris Lattnerff36c952009-09-21 02:42:51 +0000779 Instruction *Inst = dyn_cast<Instruction>(ConstVal);
780 if (!Inst)
781 return ConstVal;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000782
Chris Lattnerff36c952009-09-21 02:42:51 +0000783 if (DT->dominates(Inst, PN))
784 if (isSafeReplacement(PN, Inst))
785 return Inst;
Owen Andersone02ad522007-08-16 22:51:56 +0000786 return 0;
787}
Owen Anderson5d72a422007-07-25 19:57:03 +0000788
/// GetValueForBlock - Get the value to use within the specified basic block.
/// Available values are in Phis.
///
/// \param BB       block for which a value is requested.
/// \param Orig     instruction being replaced; supplies the type and the name
///                 stem (".rle" is appended) of any PHI created here.
/// \param Phis     per-block map of known values.  It is read as a cache and
///                 updated with every result computed by this call and its
///                 recursive calls.
/// \param TopLevel when true, an existing Phis entry for BB is not returned
///                 directly; the value is recomputed from BB's predecessors.
/// \returns the value for BB: a cached entry, undef for an unreachable block,
///          the single predecessor's value, a newly created PHI, or the value
///          that PHI was collapsed to.
Value *GVN::GetValueForBlock(BasicBlock *BB, Instruction *Orig,
                             DenseMap<BasicBlock*, Value*> &Phis,
                             bool TopLevel) {

  // If we have already computed this value, return the previously computed val.
  DenseMap<BasicBlock*, Value*>::iterator V = Phis.find(BB);
  if (V != Phis.end() && !TopLevel) return V->second;

  // If the block is unreachable, just return undef, since this path
  // can't actually occur at runtime.
  if (!DT->isReachableFromEntry(BB))
    return Phis[BB] = UndefValue::get(Orig->getType());

  // With exactly one predecessor no PHI is needed: reuse the predecessor's
  // value and remember it for this block.
  if (BasicBlock *Pred = BB->getSinglePredecessor()) {
    Value *ret = GetValueForBlock(Pred, Orig, Phis);
    Phis[BB] = ret;
    return ret;
  }

  // Get the number of predecessors of this block so we can reserve space later.
  // If there is already a PHI in it, use the #preds from it, otherwise count.
  // Getting it from the PHI is constant time.
  unsigned NumPreds;
  if (PHINode *ExistingPN = dyn_cast<PHINode>(BB->begin()))
    NumPreds = ExistingPN->getNumIncomingValues();
  else
    NumPreds = std::distance(pred_begin(BB), pred_end(BB));

  // Otherwise, the idom is the loop, so we need to insert a PHI node.  Do so
  // now, then get values to fill in the incoming values for the PHI.
  PHINode *PN = PHINode::Create(Orig->getType(), Orig->getName()+".rle",
                                BB->begin());
  PN->reserveOperandSpace(NumPreds);

  // Record the PHI before recursing so that a recursive request for BB finds
  // it in Phis and returns instead of recursing again.
  // NOTE(review): insert() does not replace an existing entry, which can only
  // be present here when TopLevel is true -- confirm that is intended.
  Phis.insert(std::make_pair(BB, PN));

  // Fill in the incoming values for the block.
  for (pred_iterator PI = pred_begin(BB), E = pred_end(BB); PI != E; ++PI) {
    Value *val = GetValueForBlock(*PI, Orig, Phis);
    PN->addIncoming(val, *PI);
  }

  // Tell alias analysis about the new PHI, using Orig as the source value.
  VN.getAliasAnalysis()->copyValue(Orig, PN);

  // Attempt to collapse PHI nodes that are trivially redundant
  Value *v = CollapsePhi(PN);
  if (!v) {
    // Cache our phi construction results.  Loads are keyed by their pointer
    // operand, everything else by the original instruction.
    if (LoadInst* L = dyn_cast<LoadInst>(Orig))
      phiMap[L->getPointerOperand()].insert(PN);
    else
      phiMap[Orig].insert(PN);

    return PN;
  }

  // The PHI collapsed to v: redirect all users of the PHI to v.
  PN->replaceAllUsesWith(v);
  if (isa<PointerType>(v->getType()))
    MD->invalidateCachedPointerInfo(v);

  // Any block whose recorded value is the doomed PHI must now refer to v.
  for (DenseMap<BasicBlock*, Value*>::iterator I = Phis.begin(),
       E = Phis.end(); I != E; ++I)
    if (I->second == PN)
      I->second = v;

  // Print before erasing; after eraseFromParent PN is only used as a pointer
  // value by verifyRemoved.
  DEBUG(errs() << "GVN removed: " << *PN << '\n');
  MD->removeInstruction(PN);
  PN->eraseFromParent();
  DEBUG(verifyRemoved(PN));

  Phis[BB] = v;
  return v;
}
864
Chris Lattnerdcded152008-12-02 08:16:11 +0000865/// IsValueFullyAvailableInBlock - Return true if we can prove that the value
866/// we're analyzing is fully available in the specified block. As we go, keep
Chris Lattner159b98f2008-12-05 07:49:08 +0000867/// track of which blocks we know are fully alive in FullyAvailableBlocks. This
868/// map is actually a tri-state map with the following values:
869/// 0) we know the block *is not* fully available.
870/// 1) we know the block *is* fully available.
871/// 2) we do not know whether the block is fully available or not, but we are
872/// currently speculating that it will be.
873/// 3) we are speculating for this block and have used that to speculate for
874/// other blocks.
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000875static bool IsValueFullyAvailableInBlock(BasicBlock *BB,
Chris Lattner159b98f2008-12-05 07:49:08 +0000876 DenseMap<BasicBlock*, char> &FullyAvailableBlocks) {
Chris Lattnerdcded152008-12-02 08:16:11 +0000877 // Optimistically assume that the block is fully available and check to see
878 // if we already know about this block in one lookup.
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000879 std::pair<DenseMap<BasicBlock*, char>::iterator, char> IV =
Chris Lattner159b98f2008-12-05 07:49:08 +0000880 FullyAvailableBlocks.insert(std::make_pair(BB, 2));
Chris Lattnerdcded152008-12-02 08:16:11 +0000881
882 // If the entry already existed for this block, return the precomputed value.
Chris Lattner159b98f2008-12-05 07:49:08 +0000883 if (!IV.second) {
884 // If this is a speculative "available" value, mark it as being used for
885 // speculation of other blocks.
886 if (IV.first->second == 2)
887 IV.first->second = 3;
888 return IV.first->second != 0;
889 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000890
Chris Lattnerdcded152008-12-02 08:16:11 +0000891 // Otherwise, see if it is fully available in all predecessors.
892 pred_iterator PI = pred_begin(BB), PE = pred_end(BB);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000893
Chris Lattnerdcded152008-12-02 08:16:11 +0000894 // If this block has no predecessors, it isn't live-in here.
895 if (PI == PE)
Chris Lattner159b98f2008-12-05 07:49:08 +0000896 goto SpeculationFailure;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000897
Chris Lattnerdcded152008-12-02 08:16:11 +0000898 for (; PI != PE; ++PI)
899 // If the value isn't fully available in one of our predecessors, then it
900 // isn't fully available in this block either. Undo our previous
901 // optimistic assumption and bail out.
902 if (!IsValueFullyAvailableInBlock(*PI, FullyAvailableBlocks))
Chris Lattner159b98f2008-12-05 07:49:08 +0000903 goto SpeculationFailure;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000904
Chris Lattnerdcded152008-12-02 08:16:11 +0000905 return true;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000906
Chris Lattner159b98f2008-12-05 07:49:08 +0000907// SpeculationFailure - If we get here, we found out that this is not, after
908// all, a fully-available block. We have a problem if we speculated on this and
909// used the speculation to mark other blocks as available.
910SpeculationFailure:
911 char &BBVal = FullyAvailableBlocks[BB];
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000912
Chris Lattner159b98f2008-12-05 07:49:08 +0000913 // If we didn't speculate on this, just return with it set to false.
914 if (BBVal == 2) {
915 BBVal = 0;
916 return false;
917 }
918
919 // If we did speculate on this value, we could have blocks set to 1 that are
920 // incorrect. Walk the (transitive) successors of this block and mark them as
921 // 0 if set to one.
922 SmallVector<BasicBlock*, 32> BBWorklist;
923 BBWorklist.push_back(BB);
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000924
Chris Lattner159b98f2008-12-05 07:49:08 +0000925 while (!BBWorklist.empty()) {
926 BasicBlock *Entry = BBWorklist.pop_back_val();
927 // Note that this sets blocks to 0 (unavailable) if they happen to not
928 // already be in FullyAvailableBlocks. This is safe.
929 char &EntryVal = FullyAvailableBlocks[Entry];
930 if (EntryVal == 0) continue; // Already unavailable.
931
932 // Mark as unavailable.
933 EntryVal = 0;
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000934
Chris Lattner159b98f2008-12-05 07:49:08 +0000935 for (succ_iterator I = succ_begin(Entry), E = succ_end(Entry); I != E; ++I)
936 BBWorklist.push_back(*I);
937 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +0000938
Chris Lattner159b98f2008-12-05 07:49:08 +0000939 return false;
Chris Lattnerdcded152008-12-02 08:16:11 +0000940}
941
Chris Lattnerd6b1d052009-09-20 20:09:34 +0000942
943/// CoerceAvailableValueToLoadType - If we saw a store of a value to memory, and
944/// then a load from a must-aliased pointer of a different type, try to coerce
945/// the stored value. LoadedTy is the type of the load we want to replace and
946/// InsertPt is the place to insert new instructions.
947///
948/// If we can't do it, return null.
949static Value *CoerceAvailableValueToLoadType(Value *StoredVal,
950 const Type *LoadedTy,
951 Instruction *InsertPt,
952 const TargetData &TD) {
953 const Type *StoredValTy = StoredVal->getType();
954
955 uint64_t StoreSize = TD.getTypeSizeInBits(StoredValTy);
956 uint64_t LoadSize = TD.getTypeSizeInBits(LoadedTy);
957
958 // If the store and reload are the same size, we can always reuse it.
959 if (StoreSize == LoadSize) {
960 if (isa<PointerType>(StoredValTy) && isa<PointerType>(LoadedTy)) {
961 // Pointer to Pointer -> use bitcast.
962 return new BitCastInst(StoredVal, LoadedTy, "", InsertPt);
963 }
964
965 // Convert source pointers to integers, which can be bitcast.
966 if (isa<PointerType>(StoredValTy)) {
967 StoredValTy = TD.getIntPtrType(StoredValTy->getContext());
968 StoredVal = new PtrToIntInst(StoredVal, StoredValTy, "", InsertPt);
969 }
970
971 const Type *TypeToCastTo = LoadedTy;
972 if (isa<PointerType>(TypeToCastTo))
973 TypeToCastTo = TD.getIntPtrType(StoredValTy->getContext());
974
975 if (StoredValTy != TypeToCastTo)
976 StoredVal = new BitCastInst(StoredVal, TypeToCastTo, "", InsertPt);
977
978 // Cast to pointer if the load needs a pointer type.
979 if (isa<PointerType>(LoadedTy))
980 StoredVal = new IntToPtrInst(StoredVal, LoadedTy, "", InsertPt);
981
982 return StoredVal;
983 }
984
985 // If the loaded value is smaller than the available value, then we can
986 // extract out a piece from it. If the available value is too small, then we
987 // can't do anything.
988 if (StoreSize < LoadSize)
989 return 0;
990
991 // Convert source pointers to integers, which can be manipulated.
992 if (isa<PointerType>(StoredValTy)) {
993 StoredValTy = TD.getIntPtrType(StoredValTy->getContext());
994 StoredVal = new PtrToIntInst(StoredVal, StoredValTy, "", InsertPt);
995 }
996
997 // Convert vectors and fp to integer, which can be manipulated.
998 if (!isa<IntegerType>(StoredValTy)) {
999 StoredValTy = IntegerType::get(StoredValTy->getContext(), StoreSize);
1000 StoredVal = new BitCastInst(StoredVal, StoredValTy, "", InsertPt);
1001 }
1002
1003 // If this is a big-endian system, we need to shift the value down to the low
1004 // bits so that a truncate will work.
1005 if (TD.isBigEndian()) {
1006 Constant *Val = ConstantInt::get(StoredVal->getType(), StoreSize-LoadSize);
1007 StoredVal = BinaryOperator::CreateLShr(StoredVal, Val, "tmp", InsertPt);
1008 }
1009
1010 // Truncate the integer to the right size now.
1011 const Type *NewIntTy = IntegerType::get(StoredValTy->getContext(), LoadSize);
1012 StoredVal = new TruncInst(StoredVal, NewIntTy, "trunc", InsertPt);
1013
1014 if (LoadedTy == NewIntTy)
1015 return StoredVal;
1016
1017 // If the result is a pointer, inttoptr.
1018 if (isa<PointerType>(LoadedTy))
1019 return new IntToPtrInst(StoredVal, LoadedTy, "inttoptr", InsertPt);
1020
1021 // Otherwise, bitcast.
1022 return new BitCastInst(StoredVal, LoadedTy, "bitcast", InsertPt);
1023}
1024
1025static void
1026GetAvailableBlockValues(DenseMap<BasicBlock*, Value*> &BlockReplValues,
1027 SmallVector<std::pair<BasicBlock*,
1028 Value*>, 16> &ValuesPerBlock,
1029 const Type *LoadTy,
1030 const TargetData *TD) {
1031
1032 for (unsigned i = 0, e = ValuesPerBlock.size(); i != e; ++i) {
1033 BasicBlock *BB = ValuesPerBlock[i].first;
1034 Value *AvailableVal = ValuesPerBlock[i].second;
1035
1036 Value *&BlockEntry = BlockReplValues[BB];
1037 if (BlockEntry) continue;
1038
1039 if (AvailableVal->getType() != LoadTy) {
1040 assert(TD && "Need target data to handle type mismatch case");
1041 AvailableVal = CoerceAvailableValueToLoadType(AvailableVal, LoadTy,
1042 BB->getTerminator(), *TD);
1043 DEBUG(errs() << "GVN COERCED NONLOCAL VAL:\n"
1044 << *ValuesPerBlock[i].second << '\n'
1045 << *AvailableVal << '\n' << "\n\n\n");
1046 }
1047 BlockEntry = AvailableVal;
1048 }
1049}
1050
Owen Andersone0143452007-08-16 22:02:55 +00001051/// processNonLocalLoad - Attempt to eliminate a load whose dependencies are
1052/// non-local by performing PHI construction.
Chris Lattnerdcded152008-12-02 08:16:11 +00001053bool GVN::processNonLocalLoad(LoadInst *LI,
Chris Lattner7de20452008-03-21 22:01:16 +00001054 SmallVectorImpl<Instruction*> &toErase) {
Chris Lattnerdcded152008-12-02 08:16:11 +00001055 // Find the non-local dependencies of the load.
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001056 SmallVector<MemoryDependenceAnalysis::NonLocalDepEntry, 64> Deps;
Chris Lattneraf713862008-12-09 19:25:07 +00001057 MD->getNonLocalPointerDependency(LI->getOperand(0), true, LI->getParent(),
1058 Deps);
Dan Gohman7e124382009-07-31 20:24:18 +00001059 //DEBUG(errs() << "INVESTIGATING NONLOCAL LOAD: "
1060 // << Deps.size() << *LI << '\n');
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001061
Owen Anderson90e717d2008-08-26 22:07:42 +00001062 // If we had to process more than one hundred blocks to find the
1063 // dependencies, this load isn't worth worrying about. Optimizing
1064 // it will be too expensive.
Chris Lattneraf713862008-12-09 19:25:07 +00001065 if (Deps.size() > 100)
Owen Anderson90e717d2008-08-26 22:07:42 +00001066 return false;
Chris Lattner8d1686f2008-12-18 00:51:32 +00001067
1068 // If we had a phi translation failure, we'll have a single entry which is a
1069 // clobber in the current block. Reject this early.
Edwin Török3ffffac2009-06-17 18:48:18 +00001070 if (Deps.size() == 1 && Deps[0].second.isClobber()) {
1071 DEBUG(
Dan Gohman0be10b02009-07-25 01:43:01 +00001072 errs() << "GVN: non-local load ";
1073 WriteAsOperand(errs(), LI);
Dan Gohman7e124382009-07-31 20:24:18 +00001074 errs() << " is clobbered by " << *Deps[0].second.getInst() << '\n';
Edwin Török3ffffac2009-06-17 18:48:18 +00001075 );
Chris Lattner8d1686f2008-12-18 00:51:32 +00001076 return false;
Edwin Török3ffffac2009-06-17 18:48:18 +00001077 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001078
Chris Lattnerdcded152008-12-02 08:16:11 +00001079 // Filter out useless results (non-locals, etc). Keep track of the blocks
1080 // where we have a value available in repl, also keep track of whether we see
1081 // dependencies that produce an unknown value for the load (such as a call
1082 // that could potentially clobber the load).
1083 SmallVector<std::pair<BasicBlock*, Value*>, 16> ValuesPerBlock;
1084 SmallVector<BasicBlock*, 16> UnavailableBlocks;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001085
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001086 const TargetData *TD = 0;
1087
Chris Lattneraf713862008-12-09 19:25:07 +00001088 for (unsigned i = 0, e = Deps.size(); i != e; ++i) {
1089 BasicBlock *DepBB = Deps[i].first;
1090 MemDepResult DepInfo = Deps[i].second;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001091
Chris Lattner4531da82008-12-05 21:04:20 +00001092 if (DepInfo.isClobber()) {
1093 UnavailableBlocks.push_back(DepBB);
1094 continue;
1095 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001096
Chris Lattner4531da82008-12-05 21:04:20 +00001097 Instruction *DepInst = DepInfo.getInst();
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001098
Chris Lattner4531da82008-12-05 21:04:20 +00001099 // Loading the allocation -> undef.
Victor Hernandez48c3c542009-09-18 22:35:49 +00001100 if (isa<AllocationInst>(DepInst) || isMalloc(DepInst)) {
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001101 ValuesPerBlock.push_back(std::make_pair(DepBB,
Owen Andersonb99ecca2009-07-30 23:03:37 +00001102 UndefValue::get(LI->getType())));
Chris Lattner46876282008-12-01 01:15:42 +00001103 continue;
1104 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001105
Chris Lattneraf713862008-12-09 19:25:07 +00001106 if (StoreInst* S = dyn_cast<StoreInst>(DepInst)) {
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001107 // Reject loads and stores that are to the same address but are of
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001108 // different types if we have to.
Chris Lattnerdcded152008-12-02 08:16:11 +00001109 if (S->getOperand(0)->getType() != LI->getType()) {
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001110 if (TD == 0)
1111 TD = getAnalysisIfAvailable<TargetData>();
1112
1113 // If the stored value is larger or equal to the loaded value, we can
1114 // reuse it.
1115 if (TD == 0 ||
1116 TD->getTypeSizeInBits(S->getOperand(0)->getType()) <
1117 TD->getTypeSizeInBits(LI->getType())) {
1118 UnavailableBlocks.push_back(DepBB);
1119 continue;
1120 }
Chris Lattnerdcded152008-12-02 08:16:11 +00001121 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001122
Chris Lattnerdcded152008-12-02 08:16:11 +00001123 ValuesPerBlock.push_back(std::make_pair(DepBB, S->getOperand(0)));
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001124
Chris Lattneraf713862008-12-09 19:25:07 +00001125 } else if (LoadInst* LD = dyn_cast<LoadInst>(DepInst)) {
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001126 // If the types mismatch and we can't handle it, reject reuse of the load.
Chris Lattnerdcded152008-12-02 08:16:11 +00001127 if (LD->getType() != LI->getType()) {
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001128 if (TD == 0)
1129 TD = getAnalysisIfAvailable<TargetData>();
1130
1131 // If the stored value is larger or equal to the loaded value, we can
1132 // reuse it.
1133 if (TD == 0 ||
1134 TD->getTypeSizeInBits(LD->getType()) <
1135 TD->getTypeSizeInBits(LI->getType())) {
1136 UnavailableBlocks.push_back(DepBB);
1137 continue;
1138 }
Chris Lattnerdcded152008-12-02 08:16:11 +00001139 }
Chris Lattnerdcded152008-12-02 08:16:11 +00001140 ValuesPerBlock.push_back(std::make_pair(DepBB, LD));
Owen Anderson5d72a422007-07-25 19:57:03 +00001141 } else {
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001142 // FIXME: Handle memset/memcpy.
Chris Lattnerdcded152008-12-02 08:16:11 +00001143 UnavailableBlocks.push_back(DepBB);
1144 continue;
Owen Anderson5d72a422007-07-25 19:57:03 +00001145 }
Chris Lattner3d7103e2008-03-21 21:14:38 +00001146 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001147
Chris Lattnerdcded152008-12-02 08:16:11 +00001148 // If we have no predecessors that produce a known value for this load, exit
1149 // early.
1150 if (ValuesPerBlock.empty()) return false;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001151
Chris Lattnerdcded152008-12-02 08:16:11 +00001152 // If all of the instructions we depend on produce a known value for this
1153 // load, then it is fully redundant and we can use PHI insertion to compute
1154 // its value. Insert PHIs and remove the fully redundant value now.
1155 if (UnavailableBlocks.empty()) {
1156 // Use cached PHI construction information from previous runs
1157 SmallPtrSet<Instruction*, 4> &p = phiMap[LI->getPointerOperand()];
Chris Lattneraf713862008-12-09 19:25:07 +00001158 // FIXME: What does phiMap do? Are we positive it isn't getting invalidated?
Chris Lattnerdcded152008-12-02 08:16:11 +00001159 for (SmallPtrSet<Instruction*, 4>::iterator I = p.begin(), E = p.end();
1160 I != E; ++I) {
1161 if ((*I)->getParent() == LI->getParent()) {
Dan Gohman7e124382009-07-31 20:24:18 +00001162 DEBUG(errs() << "GVN REMOVING NONLOCAL LOAD #1: " << *LI << '\n');
Chris Lattnerdcded152008-12-02 08:16:11 +00001163 LI->replaceAllUsesWith(*I);
Chris Lattnerf81b0142008-12-09 22:06:23 +00001164 if (isa<PointerType>((*I)->getType()))
1165 MD->invalidateCachedPointerInfo(*I);
Chris Lattnerdcded152008-12-02 08:16:11 +00001166 toErase.push_back(LI);
1167 NumGVNLoad++;
1168 return true;
1169 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001170
Chris Lattnerdcded152008-12-02 08:16:11 +00001171 ValuesPerBlock.push_back(std::make_pair((*I)->getParent(), *I));
Owen Anderson5b299672007-08-07 23:12:31 +00001172 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001173
Dan Gohman7e124382009-07-31 20:24:18 +00001174 DEBUG(errs() << "GVN REMOVING NONLOCAL LOAD: " << *LI << '\n');
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001175
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001176 // Convert the block information to a map, and insert coersions as needed.
Chris Lattnerdcded152008-12-02 08:16:11 +00001177 DenseMap<BasicBlock*, Value*> BlockReplValues;
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001178 GetAvailableBlockValues(BlockReplValues, ValuesPerBlock, LI->getType(), TD);
1179
Chris Lattnerdcded152008-12-02 08:16:11 +00001180 // Perform PHI construction.
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001181 Value *V = GetValueForBlock(LI->getParent(), LI, BlockReplValues, true);
1182 LI->replaceAllUsesWith(V);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001183
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001184 if (isa<PHINode>(V))
1185 V->takeName(LI);
1186 if (isa<PointerType>(V->getType()))
1187 MD->invalidateCachedPointerInfo(V);
Chris Lattnerdcded152008-12-02 08:16:11 +00001188 toErase.push_back(LI);
1189 NumGVNLoad++;
1190 return true;
1191 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001192
Chris Lattnerdcded152008-12-02 08:16:11 +00001193 if (!EnablePRE || !EnableLoadPRE)
1194 return false;
1195
1196 // Okay, we have *some* definitions of the value. This means that the value
1197 // is available in some of our (transitive) predecessors. Lets think about
1198 // doing PRE of this load. This will involve inserting a new load into the
1199 // predecessor when it's not available. We could do this in general, but
1200 // prefer to not increase code size. As such, we only do this when we know
1201 // that we only have to insert *one* load (which means we're basically moving
1202 // the load, not inserting a new one).
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001203
Owen Andersondd37b182009-05-31 09:03:40 +00001204 SmallPtrSet<BasicBlock *, 4> Blockers;
1205 for (unsigned i = 0, e = UnavailableBlocks.size(); i != e; ++i)
1206 Blockers.insert(UnavailableBlocks[i]);
1207
1208 // Lets find first basic block with more than one predecessor. Walk backwards
1209 // through predecessors if needed.
Chris Lattnerdcded152008-12-02 08:16:11 +00001210 BasicBlock *LoadBB = LI->getParent();
Owen Andersondd37b182009-05-31 09:03:40 +00001211 BasicBlock *TmpBB = LoadBB;
1212
1213 bool isSinglePred = false;
Dale Johannesena19b67f2009-06-17 20:48:23 +00001214 bool allSingleSucc = true;
Owen Andersondd37b182009-05-31 09:03:40 +00001215 while (TmpBB->getSinglePredecessor()) {
1216 isSinglePred = true;
1217 TmpBB = TmpBB->getSinglePredecessor();
1218 if (!TmpBB) // If haven't found any, bail now.
1219 return false;
1220 if (TmpBB == LoadBB) // Infinite (unreachable) loop.
1221 return false;
1222 if (Blockers.count(TmpBB))
1223 return false;
Dale Johannesena19b67f2009-06-17 20:48:23 +00001224 if (TmpBB->getTerminator()->getNumSuccessors() != 1)
1225 allSingleSucc = false;
Owen Andersondd37b182009-05-31 09:03:40 +00001226 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001227
Owen Andersondd37b182009-05-31 09:03:40 +00001228 assert(TmpBB);
1229 LoadBB = TmpBB;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001230
Chris Lattnerdcded152008-12-02 08:16:11 +00001231 // If we have a repl set with LI itself in it, this means we have a loop where
1232 // at least one of the values is LI. Since this means that we won't be able
1233 // to eliminate LI even if we insert uses in the other predecessors, we will
1234 // end up increasing code size. Reject this by scanning for LI.
1235 for (unsigned i = 0, e = ValuesPerBlock.size(); i != e; ++i)
1236 if (ValuesPerBlock[i].second == LI)
1237 return false;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001238
Owen Andersondd37b182009-05-31 09:03:40 +00001239 if (isSinglePred) {
1240 bool isHot = false;
1241 for (unsigned i = 0, e = ValuesPerBlock.size(); i != e; ++i)
1242 if (Instruction *I = dyn_cast<Instruction>(ValuesPerBlock[i].second))
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001243 // "Hot" Instruction is in some loop (because it dominates its dep.
1244 // instruction).
1245 if (DT->dominates(LI, I)) {
1246 isHot = true;
1247 break;
1248 }
Owen Andersondd37b182009-05-31 09:03:40 +00001249
1250 // We are interested only in "hot" instructions. We don't want to do any
1251 // mis-optimizations here.
1252 if (!isHot)
1253 return false;
1254 }
1255
Chris Lattnerdcded152008-12-02 08:16:11 +00001256 // Okay, we have some hope :). Check to see if the loaded value is fully
1257 // available in all but one predecessor.
1258 // FIXME: If we could restructure the CFG, we could make a common pred with
1259 // all the preds that don't have an available LI and insert a new load into
1260 // that one block.
1261 BasicBlock *UnavailablePred = 0;
1262
Chris Lattner159b98f2008-12-05 07:49:08 +00001263 DenseMap<BasicBlock*, char> FullyAvailableBlocks;
Chris Lattnerdcded152008-12-02 08:16:11 +00001264 for (unsigned i = 0, e = ValuesPerBlock.size(); i != e; ++i)
1265 FullyAvailableBlocks[ValuesPerBlock[i].first] = true;
1266 for (unsigned i = 0, e = UnavailableBlocks.size(); i != e; ++i)
1267 FullyAvailableBlocks[UnavailableBlocks[i]] = false;
1268
1269 for (pred_iterator PI = pred_begin(LoadBB), E = pred_end(LoadBB);
1270 PI != E; ++PI) {
1271 if (IsValueFullyAvailableInBlock(*PI, FullyAvailableBlocks))
1272 continue;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001273
Chris Lattnerdcded152008-12-02 08:16:11 +00001274 // If this load is not available in multiple predecessors, reject it.
1275 if (UnavailablePred && UnavailablePred != *PI)
1276 return false;
1277 UnavailablePred = *PI;
1278 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001279
Chris Lattnerdcded152008-12-02 08:16:11 +00001280 assert(UnavailablePred != 0 &&
1281 "Fully available value should be eliminated above!");
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001282
Chris Lattnerdcded152008-12-02 08:16:11 +00001283 // If the loaded pointer is PHI node defined in this block, do PHI translation
1284 // to get its value in the predecessor.
1285 Value *LoadPtr = LI->getOperand(0)->DoPHITranslation(LoadBB, UnavailablePred);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001286
Chris Lattnerdcded152008-12-02 08:16:11 +00001287 // Make sure the value is live in the predecessor. If it was defined by a
1288 // non-PHI instruction in this block, we don't know how to recompute it above.
1289 if (Instruction *LPInst = dyn_cast<Instruction>(LoadPtr))
1290 if (!DT->dominates(LPInst->getParent(), UnavailablePred)) {
Daniel Dunbar005975c2009-07-25 00:23:56 +00001291 DEBUG(errs() << "COULDN'T PRE LOAD BECAUSE PTR IS UNAVAILABLE IN PRED: "
Dan Gohman7e124382009-07-31 20:24:18 +00001292 << *LPInst << '\n' << *LI << "\n");
Chris Lattnerdcded152008-12-02 08:16:11 +00001293 return false;
1294 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001295
Chris Lattnerdcded152008-12-02 08:16:11 +00001296 // We don't currently handle critical edges :(
1297 if (UnavailablePred->getTerminator()->getNumSuccessors() != 1) {
Daniel Dunbar005975c2009-07-25 00:23:56 +00001298 DEBUG(errs() << "COULD NOT PRE LOAD BECAUSE OF CRITICAL EDGE '"
Dan Gohman7e124382009-07-31 20:24:18 +00001299 << UnavailablePred->getName() << "': " << *LI << '\n');
Chris Lattnerdcded152008-12-02 08:16:11 +00001300 return false;
Owen Anderson5b299672007-08-07 23:12:31 +00001301 }
Dale Johannesena19b67f2009-06-17 20:48:23 +00001302
1303 // Make sure it is valid to move this load here. We have to watch out for:
1304 // @1 = getelementptr (i8* p, ...
1305 // test p and branch if == 0
1306 // load @1
1307 // It is valid to have the getelementptr before the test, even if p can be 0,
1308 // as getelementptr only does address arithmetic.
1309 // If we are not pushing the value through any multiple-successor blocks
1310 // we do not have this case. Otherwise, check that the load is safe to
1311 // put anywhere; this can be improved, but should be conservatively safe.
1312 if (!allSingleSucc &&
1313 !isSafeToLoadUnconditionally(LoadPtr, UnavailablePred->getTerminator()))
1314 return false;
1315
Chris Lattnerdcded152008-12-02 08:16:11 +00001316 // Okay, we can eliminate this load by inserting a reload in the predecessor
1317 // and using PHI construction to get the value in the other predecessors, do
1318 // it.
Dan Gohman7e124382009-07-31 20:24:18 +00001319 DEBUG(errs() << "GVN REMOVING PRE LOAD: " << *LI << '\n');
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001320
Chris Lattnerdcded152008-12-02 08:16:11 +00001321 Value *NewLoad = new LoadInst(LoadPtr, LI->getName()+".pre", false,
1322 LI->getAlignment(),
1323 UnavailablePred->getTerminator());
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001324
Owen Anderson1c057ee2009-05-29 05:37:54 +00001325 SmallPtrSet<Instruction*, 4> &p = phiMap[LI->getPointerOperand()];
1326 for (SmallPtrSet<Instruction*, 4>::iterator I = p.begin(), E = p.end();
1327 I != E; ++I)
1328 ValuesPerBlock.push_back(std::make_pair((*I)->getParent(), *I));
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001329
Chris Lattnerdcded152008-12-02 08:16:11 +00001330 DenseMap<BasicBlock*, Value*> BlockReplValues;
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001331 GetAvailableBlockValues(BlockReplValues, ValuesPerBlock, LI->getType(), TD);
Chris Lattnerdcded152008-12-02 08:16:11 +00001332 BlockReplValues[UnavailablePred] = NewLoad;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001333
Chris Lattnerdcded152008-12-02 08:16:11 +00001334 // Perform PHI construction.
Chris Lattnerd6b1d052009-09-20 20:09:34 +00001335 Value *V = GetValueForBlock(LI->getParent(), LI, BlockReplValues, true);
1336 LI->replaceAllUsesWith(V);
1337 if (isa<PHINode>(V))
1338 V->takeName(LI);
1339 if (isa<PointerType>(V->getType()))
1340 MD->invalidateCachedPointerInfo(V);
Chris Lattnerdcded152008-12-02 08:16:11 +00001341 toErase.push_back(LI);
1342 NumPRELoad++;
Owen Anderson5d72a422007-07-25 19:57:03 +00001343 return true;
1344}
1345
Chris Lattner0907b522009-09-21 05:57:11 +00001346/// GetBaseWithConstantOffset - Analyze the specified pointer to see if it can
1347/// be expressed as a base pointer plus a constant offset. Return the base and
1348/// offset to the caller.
1349static Value *GetBaseWithConstantOffset(Value *Ptr, int64_t &Offset,
1350 const TargetData *TD) {
1351 Operator *PtrOp = dyn_cast<Operator>(Ptr);
1352 if (PtrOp == 0) return Ptr;
1353
1354 // Just look through bitcasts.
1355 if (PtrOp->getOpcode() == Instruction::BitCast)
1356 return GetBaseWithConstantOffset(PtrOp->getOperand(0), Offset, TD);
1357
1358 // If this is a GEP with constant indices, we can look through it.
1359 GEPOperator *GEP = dyn_cast<GEPOperator>(PtrOp);
1360 if (GEP == 0 || !GEP->hasAllConstantIndices()) return Ptr;
1361
1362 gep_type_iterator GTI = gep_type_begin(GEP);
1363 for (User::op_iterator I = GEP->idx_begin(), E = GEP->idx_end(); I != E;
1364 ++I, ++GTI) {
1365 ConstantInt *OpC = cast<ConstantInt>(*I);
1366 if (OpC->isZero()) continue;
1367
1368 // Handle a struct and array indices which add their offset to the pointer.
1369 if (const StructType *STy = dyn_cast<StructType>(*GTI)) {
1370 Offset += TD->getStructLayout(STy)->getElementOffset(OpC->getZExtValue());
1371 } else {
1372 uint64_t Size = TD->getTypeAllocSize(GTI.getIndexedType());
1373 Offset += OpC->getSExtValue()*Size;
1374 }
1375 }
1376
1377 // Re-sign extend from the pointer size if needed to get overflow edge cases
1378 // right.
1379 unsigned PtrSize = TD->getPointerSizeInBits();
1380 if (PtrSize < 64)
1381 Offset = (Offset << (64-PtrSize)) >> (64-PtrSize);
1382
1383 return GetBaseWithConstantOffset(GEP->getPointerOperand(), Offset, TD);
1384}
1385
1386
1387/// HandleLoadFromClobberingStore - This function is called when we have a
1388/// memdep query of a load that ends up being a clobbering store. This means
1389/// that the store *may* provide bits used by the load but we can't be sure
1390/// because the pointers don't mustalias. Check this case to see if there is
1391/// anything more we can do before we give up.
1392static Value *HandleLoadFromClobberingStore(LoadInst *L, StoreInst *DepSI,
1393 const TargetData *TD) {
1394 int64_t StoreOffset = 0, LoadOffset = 0;
1395 Value *StoreBase =
1396 GetBaseWithConstantOffset(DepSI->getPointerOperand(), StoreOffset, TD);
1397 Value *LoadBase =
1398 GetBaseWithConstantOffset(L->getPointerOperand(), LoadOffset, TD);
1399 if (StoreBase != LoadBase)
1400 return 0;
1401
1402 // If the load and store are to the exact same address, they should have been
1403 // a must alias. AA must have gotten confused.
1404 // FIXME: Study to see if/when this happens.
1405 if (LoadOffset == StoreOffset) {
1406#if 0
1407 errs() << "STORE/LOAD DEP WITH COMMON POINTER MISSED:\n"
1408 << "Base = " << *StoreBase << "\n"
1409 << "Store Ptr = " << *DepSI->getPointerOperand() << "\n"
1410 << "Store Offs = " << StoreOffset << " - " << *DepSI << "\n"
1411 << "Load Ptr = " << *L->getPointerOperand() << "\n"
1412 << "Load Offs = " << LoadOffset << " - " << *L << "\n\n";
1413 errs() << "'" << L->getParent()->getParent()->getName() << "'"
1414 << *L->getParent();
1415#endif
1416 return 0;
1417 }
1418
1419 // If the load and store don't overlap at all, the store doesn't provide
1420 // anything to the load. In this case, they really don't alias at all, AA
1421 // must have gotten confused.
1422 // FIXME: Investigate cases where this bails out, e.g. rdar://7238614. Then
1423 // remove this check, as it is duplicated with what we have below.
1424 uint64_t StoreSize = TD->getTypeSizeInBits(DepSI->getOperand(0)->getType());
1425 uint64_t LoadSize = TD->getTypeSizeInBits(L->getType());
1426
1427 if ((StoreSize & 7) | (LoadSize & 7))
1428 return 0;
1429 StoreSize >>= 3; // Convert to bytes.
1430 LoadSize >>= 3;
1431
1432
1433 bool isAAFailure = false;
1434 if (StoreOffset < LoadOffset) {
1435 isAAFailure = StoreOffset+int64_t(StoreSize) <= LoadOffset;
1436 } else {
1437 isAAFailure = LoadOffset+int64_t(LoadSize) <= StoreOffset;
1438 }
1439 if (isAAFailure) {
1440#if 0
1441 errs() << "STORE LOAD DEP WITH COMMON BASE:\n"
1442 << "Base = " << *StoreBase << "\n"
1443 << "Store Ptr = " << *DepSI->getPointerOperand() << "\n"
1444 << "Store Offs = " << StoreOffset << " - " << *DepSI << "\n"
1445 << "Load Ptr = " << *L->getPointerOperand() << "\n"
1446 << "Load Offs = " << LoadOffset << " - " << *L << "\n\n";
1447 errs() << "'" << L->getParent()->getParent()->getName() << "'"
1448 << *L->getParent();
1449#endif
1450 return 0;
1451 }
1452
1453 // If the Load isn't completely contained within the stored bits, we don't
1454 // have all the bits to feed it. We could do something crazy in the future
1455 // (issue a smaller load then merge the bits in) but this seems unlikely to be
1456 // valuable.
1457 if (StoreOffset > LoadOffset ||
1458 StoreOffset+StoreSize < LoadOffset+LoadSize)
1459 return 0;
1460
1461 // Adjust LoadOffset to be relative from the start of StoreOffset.
1462 LoadOffset -= StoreOffset;
1463
1464 Value *SrcVal = DepSI->getOperand(0);
1465
1466 LLVMContext &Ctx = SrcVal->getType()->getContext();
1467
1468 // Compute which bits of the stored value are being used by the load. Convert
1469 // to an integer type to start with.
1470 if (isa<PointerType>(SrcVal->getType()))
1471 SrcVal = new PtrToIntInst(SrcVal, TD->getIntPtrType(Ctx), "tmp", L);
1472 if (!isa<IntegerType>(SrcVal->getType()))
1473 SrcVal = new BitCastInst(SrcVal, IntegerType::get(Ctx, StoreSize*8), "", L);
1474
1475 // Shift the bits to the least significant depending on endianness.
1476 unsigned ShiftAmt;
1477 if (TD->isLittleEndian()) {
1478 ShiftAmt = LoadOffset*8;
1479 } else {
1480 ShiftAmt = StoreSize-LoadSize-LoadOffset;
1481 }
1482
1483 SrcVal = BinaryOperator::CreateLShr(SrcVal,
1484 ConstantInt::get(SrcVal->getType(), ShiftAmt), "tmp", L);
1485
1486 SrcVal = new TruncInst(SrcVal, IntegerType::get(Ctx, LoadSize*8), "", L);
1487
1488 return CoerceAvailableValueToLoadType(SrcVal, L->getType(), L, *TD);
1489}
1490
1491
1492
Owen Andersone0143452007-08-16 22:02:55 +00001493/// processLoad - Attempt to eliminate a load, first by eliminating it
1494/// locally, and then attempting non-local elimination if that fails.
Chris Lattner4531da82008-12-05 21:04:20 +00001495bool GVN::processLoad(LoadInst *L, SmallVectorImpl<Instruction*> &toErase) {
1496 if (L->isVolatile())
Owen Anderson85c40642007-07-24 17:55:58 +00001497 return false;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001498
Owen Anderson85c40642007-07-24 17:55:58 +00001499 // ... to a pointer that has been loaded from before...
Chris Lattnerff36c952009-09-21 02:42:51 +00001500 MemDepResult Dep = MD->getDependency(L);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001501
Chris Lattner4531da82008-12-05 21:04:20 +00001502 // If the value isn't available, don't do anything!
Chris Lattnerff36c952009-09-21 02:42:51 +00001503 if (Dep.isClobber()) {
Chris Lattner0907b522009-09-21 05:57:11 +00001504 // FIXME: We should handle memset/memcpy/memmove as dependent instructions
1505 // to forward the value if available.
1506 //if (isa<MemIntrinsic>(Dep.getInst()))
1507 //errs() << "LOAD DEPENDS ON MEM: " << *L << "\n" << *Dep.getInst()<<"\n\n";
1508
1509 // Check to see if we have something like this:
Chris Lattner7741aa52009-09-20 19:03:47 +00001510 // store i32 123, i32* %P
1511 // %A = bitcast i32* %P to i8*
1512 // %B = gep i8* %A, i32 1
1513 // %C = load i8* %B
1514 //
1515 // We could do that by recognizing if the clobber instructions are obviously
1516 // a common base + constant offset, and if the previous store (or memset)
1517 // completely covers this load. This sort of thing can happen in bitfield
1518 // access code.
Chris Lattner0907b522009-09-21 05:57:11 +00001519 if (StoreInst *DepSI = dyn_cast<StoreInst>(Dep.getInst()))
1520 if (const TargetData *TD = getAnalysisIfAvailable<TargetData>())
1521 if (Value *AvailVal = HandleLoadFromClobberingStore(L, DepSI, TD)) {
1522 DEBUG(errs() << "GVN COERCED STORE BITS:\n" << *DepSI << '\n'
1523 << *AvailVal << '\n' << *L << "\n\n\n");
1524
1525 // Replace the load!
1526 L->replaceAllUsesWith(AvailVal);
1527 if (isa<PointerType>(AvailVal->getType()))
1528 MD->invalidateCachedPointerInfo(AvailVal);
1529 toErase.push_back(L);
1530 NumGVNLoad++;
1531 return true;
1532 }
1533
Edwin Török47cf8842009-05-29 09:46:03 +00001534 DEBUG(
1535 // fast print dep, using operator<< on instruction would be too slow
Dan Gohman0be10b02009-07-25 01:43:01 +00001536 errs() << "GVN: load ";
1537 WriteAsOperand(errs(), L);
Chris Lattnerff36c952009-09-21 02:42:51 +00001538 Instruction *I = Dep.getInst();
Dan Gohman7e124382009-07-31 20:24:18 +00001539 errs() << " is clobbered by " << *I << '\n';
Edwin Török47cf8842009-05-29 09:46:03 +00001540 );
Chris Lattner4531da82008-12-05 21:04:20 +00001541 return false;
Edwin Török47cf8842009-05-29 09:46:03 +00001542 }
Chris Lattner4531da82008-12-05 21:04:20 +00001543
1544 // If it is defined in another block, try harder.
Chris Lattnerff36c952009-09-21 02:42:51 +00001545 if (Dep.isNonLocal())
Chris Lattner4531da82008-12-05 21:04:20 +00001546 return processNonLocalLoad(L, toErase);
Eli Friedman350307f2008-02-12 12:08:14 +00001547
Chris Lattnerff36c952009-09-21 02:42:51 +00001548 Instruction *DepInst = Dep.getInst();
Chris Lattner4531da82008-12-05 21:04:20 +00001549 if (StoreInst *DepSI = dyn_cast<StoreInst>(DepInst)) {
Chris Lattner7741aa52009-09-20 19:03:47 +00001550 Value *StoredVal = DepSI->getOperand(0);
1551
1552 // The store and load are to a must-aliased pointer, but they may not
1553 // actually have the same type. See if we know how to reuse the stored
1554 // value (depending on its type).
1555 const TargetData *TD = 0;
1556 if (StoredVal->getType() != L->getType() &&
1557 (TD = getAnalysisIfAvailable<TargetData>())) {
Chris Lattner3de5c8c2009-09-20 19:31:14 +00001558 StoredVal = CoerceAvailableValueToLoadType(StoredVal, L->getType(), L, *TD);
Chris Lattner7741aa52009-09-20 19:03:47 +00001559 if (StoredVal == 0)
1560 return false;
1561
1562 DEBUG(errs() << "GVN COERCED STORE:\n" << *DepSI << '\n' << *StoredVal
1563 << '\n' << *L << "\n\n\n");
1564 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001565
Chris Lattner4531da82008-12-05 21:04:20 +00001566 // Remove it!
Chris Lattner7741aa52009-09-20 19:03:47 +00001567 L->replaceAllUsesWith(StoredVal);
1568 if (isa<PointerType>(StoredVal->getType()))
1569 MD->invalidateCachedPointerInfo(StoredVal);
Chris Lattner4531da82008-12-05 21:04:20 +00001570 toErase.push_back(L);
1571 NumGVNLoad++;
1572 return true;
1573 }
1574
1575 if (LoadInst *DepLI = dyn_cast<LoadInst>(DepInst)) {
Chris Lattner7741aa52009-09-20 19:03:47 +00001576 Value *AvailableVal = DepLI;
1577
1578 // The loads are of a must-aliased pointer, but they may not actually have
1579 // the same type. See if we know how to reuse the previously loaded value
1580 // (depending on its type).
1581 const TargetData *TD = 0;
1582 if (DepLI->getType() != L->getType() &&
1583 (TD = getAnalysisIfAvailable<TargetData>())) {
Chris Lattner3de5c8c2009-09-20 19:31:14 +00001584 AvailableVal = CoerceAvailableValueToLoadType(DepLI, L->getType(), L, *TD);
Chris Lattner7741aa52009-09-20 19:03:47 +00001585 if (AvailableVal == 0)
1586 return false;
1587
1588 DEBUG(errs() << "GVN COERCED LOAD:\n" << *DepLI << "\n" << *AvailableVal
1589 << "\n" << *L << "\n\n\n");
1590 }
1591
Chris Lattner4531da82008-12-05 21:04:20 +00001592 // Remove it!
Chris Lattner7741aa52009-09-20 19:03:47 +00001593 L->replaceAllUsesWith(AvailableVal);
Chris Lattnerf81b0142008-12-09 22:06:23 +00001594 if (isa<PointerType>(DepLI->getType()))
1595 MD->invalidateCachedPointerInfo(DepLI);
Chris Lattner4531da82008-12-05 21:04:20 +00001596 toErase.push_back(L);
1597 NumGVNLoad++;
1598 return true;
1599 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001600
Chris Lattner8ea60462008-11-30 01:39:32 +00001601 // If this load really doesn't depend on anything, then we must be loading an
1602 // undef value. This can happen when loading for a fresh allocation with no
1603 // intervening stores, for example.
Victor Hernandez48c3c542009-09-18 22:35:49 +00001604 if (isa<AllocationInst>(DepInst) || isMalloc(DepInst)) {
Owen Andersonb99ecca2009-07-30 23:03:37 +00001605 L->replaceAllUsesWith(UndefValue::get(L->getType()));
Chris Lattner8ea60462008-11-30 01:39:32 +00001606 toErase.push_back(L);
Chris Lattner8ea60462008-11-30 01:39:32 +00001607 NumGVNLoad++;
Chris Lattner4531da82008-12-05 21:04:20 +00001608 return true;
Eli Friedman350307f2008-02-12 12:08:14 +00001609 }
1610
Chris Lattner4531da82008-12-05 21:04:20 +00001611 return false;
Owen Anderson85c40642007-07-24 17:55:58 +00001612}
1613
Chris Lattnerff36c952009-09-21 02:42:51 +00001614Value *GVN::lookupNumber(BasicBlock *BB, uint32_t num) {
Owen Andersonaef6a922008-06-23 17:49:45 +00001615 DenseMap<BasicBlock*, ValueNumberScope*>::iterator I = localAvail.find(BB);
1616 if (I == localAvail.end())
1617 return 0;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001618
Chris Lattnerff36c952009-09-21 02:42:51 +00001619 ValueNumberScope *Locals = I->second;
1620 while (Locals) {
1621 DenseMap<uint32_t, Value*>::iterator I = Locals->table.find(num);
1622 if (I != Locals->table.end())
Owen Anderson2a412722008-06-20 01:15:47 +00001623 return I->second;
Chris Lattnerff36c952009-09-21 02:42:51 +00001624 Locals = Locals->parent;
Owen Anderson2a412722008-06-20 01:15:47 +00001625 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001626
Owen Anderson2a412722008-06-20 01:15:47 +00001627 return 0;
1628}
1629
Owen Andersona03e7862008-12-15 02:03:00 +00001630/// AttemptRedundancyElimination - If the "fast path" of redundancy elimination
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001631/// by inheritance from the dominator fails, see if we can perform phi
Owen Andersona03e7862008-12-15 02:03:00 +00001632/// construction to eliminate the redundancy.
Chris Lattnerff36c952009-09-21 02:42:51 +00001633Value *GVN::AttemptRedundancyElimination(Instruction *orig, unsigned valno) {
1634 BasicBlock *BaseBlock = orig->getParent();
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001635
Owen Andersona03e7862008-12-15 02:03:00 +00001636 SmallPtrSet<BasicBlock*, 4> Visited;
1637 SmallVector<BasicBlock*, 8> Stack;
1638 Stack.push_back(BaseBlock);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001639
Owen Andersona03e7862008-12-15 02:03:00 +00001640 DenseMap<BasicBlock*, Value*> Results;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001641
Owen Andersona03e7862008-12-15 02:03:00 +00001642 // Walk backwards through our predecessors, looking for instances of the
1643 // value number we're looking for. Instances are recorded in the Results
1644 // map, which is then used to perform phi construction.
1645 while (!Stack.empty()) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001646 BasicBlock *Current = Stack.back();
Owen Andersona03e7862008-12-15 02:03:00 +00001647 Stack.pop_back();
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001648
Owen Andersona03e7862008-12-15 02:03:00 +00001649 // If we've walked all the way to a proper dominator, then give up. Cases
1650 // where the instance is in the dominator will have been caught by the fast
1651 // path, and any cases that require phi construction further than this are
1652 // probably not worth it anyways. Note that this is a SIGNIFICANT compile
1653 // time improvement.
1654 if (DT->properlyDominates(Current, orig->getParent())) return 0;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001655
Owen Andersona03e7862008-12-15 02:03:00 +00001656 DenseMap<BasicBlock*, ValueNumberScope*>::iterator LA =
1657 localAvail.find(Current);
1658 if (LA == localAvail.end()) return 0;
Chris Lattner6f33e552009-01-19 22:00:18 +00001659 DenseMap<uint32_t, Value*>::iterator V = LA->second->table.find(valno);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001660
Owen Andersona03e7862008-12-15 02:03:00 +00001661 if (V != LA->second->table.end()) {
1662 // Found an instance, record it.
1663 Results.insert(std::make_pair(Current, V->second));
1664 continue;
1665 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001666
Owen Andersona03e7862008-12-15 02:03:00 +00001667 // If we reach the beginning of the function, then give up.
1668 if (pred_begin(Current) == pred_end(Current))
1669 return 0;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001670
Owen Andersona03e7862008-12-15 02:03:00 +00001671 for (pred_iterator PI = pred_begin(Current), PE = pred_end(Current);
1672 PI != PE; ++PI)
1673 if (Visited.insert(*PI))
1674 Stack.push_back(*PI);
1675 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001676
Owen Andersona03e7862008-12-15 02:03:00 +00001677 // If we didn't find instances, give up. Otherwise, perform phi construction.
1678 if (Results.size() == 0)
1679 return 0;
1680 else
1681 return GetValueForBlock(BaseBlock, orig, Results, true);
1682}
1683
Owen Andersonf631bb62007-08-14 18:16:29 +00001684/// processInstruction - When calculating availability, handle an instruction
Owen Anderson85c40642007-07-24 17:55:58 +00001685/// by inserting it into the appropriate sets
Owen Anderson9334fc62008-06-12 19:25:32 +00001686bool GVN::processInstruction(Instruction *I,
Chris Lattner7de20452008-03-21 22:01:16 +00001687 SmallVectorImpl<Instruction*> &toErase) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001688 if (LoadInst *LI = dyn_cast<LoadInst>(I)) {
1689 bool Changed = processLoad(LI, toErase);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001690
Chris Lattnerff36c952009-09-21 02:42:51 +00001691 if (!Changed) {
1692 unsigned Num = VN.lookup_or_add(LI);
1693 localAvail[I->getParent()]->table.insert(std::make_pair(Num, LI));
Owen Andersone6b4ff82008-06-18 21:41:49 +00001694 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001695
Chris Lattnerff36c952009-09-21 02:42:51 +00001696 return Changed;
Owen Andersone6b4ff82008-06-18 21:41:49 +00001697 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001698
Chris Lattnerff36c952009-09-21 02:42:51 +00001699 uint32_t NextNum = VN.getNextUnusedValueNumber();
1700 unsigned Num = VN.lookup_or_add(I);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001701
Chris Lattnerff36c952009-09-21 02:42:51 +00001702 if (BranchInst *BI = dyn_cast<BranchInst>(I)) {
1703 localAvail[I->getParent()]->table.insert(std::make_pair(Num, I));
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001704
Owen Andersonef8bf0f2009-04-01 23:53:49 +00001705 if (!BI->isConditional() || isa<Constant>(BI->getCondition()))
1706 return false;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001707
Chris Lattnerff36c952009-09-21 02:42:51 +00001708 Value *BranchCond = BI->getCondition();
1709 uint32_t CondVN = VN.lookup_or_add(BranchCond);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001710
Chris Lattnerff36c952009-09-21 02:42:51 +00001711 BasicBlock *TrueSucc = BI->getSuccessor(0);
1712 BasicBlock *FalseSucc = BI->getSuccessor(1);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001713
Chris Lattnerff36c952009-09-21 02:42:51 +00001714 if (TrueSucc->getSinglePredecessor())
1715 localAvail[TrueSucc]->table[CondVN] =
1716 ConstantInt::getTrue(TrueSucc->getContext());
1717 if (FalseSucc->getSinglePredecessor())
1718 localAvail[FalseSucc]->table[CondVN] =
1719 ConstantInt::getFalse(TrueSucc->getContext());
Owen Andersonef8bf0f2009-04-01 23:53:49 +00001720
1721 return false;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001722
Owen Andersonced50f82008-04-07 09:59:07 +00001723 // Allocations are always uniquely numbered, so we can save time and memory
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001724 // by fast failing them.
Victor Hernandez48c3c542009-09-18 22:35:49 +00001725 } else if (isa<AllocationInst>(I) || isMalloc(I) || isa<TerminatorInst>(I)) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001726 localAvail[I->getParent()]->table.insert(std::make_pair(Num, I));
Owen Andersonced50f82008-04-07 09:59:07 +00001727 return false;
Owen Andersone6b4ff82008-06-18 21:41:49 +00001728 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001729
Owen Andersone0143452007-08-16 22:02:55 +00001730 // Collapse PHI nodes
Owen Anderson98f6a6b2007-08-14 18:33:27 +00001731 if (PHINode* p = dyn_cast<PHINode>(I)) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001732 Value *constVal = CollapsePhi(p);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001733
Owen Anderson98f6a6b2007-08-14 18:33:27 +00001734 if (constVal) {
Owen Andersone02ad522007-08-16 22:51:56 +00001735 for (PhiMapType::iterator PI = phiMap.begin(), PE = phiMap.end();
1736 PI != PE; ++PI)
Chris Lattner4bab29b2008-12-09 19:21:47 +00001737 PI->second.erase(p);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001738
Owen Andersone02ad522007-08-16 22:51:56 +00001739 p->replaceAllUsesWith(constVal);
Chris Lattnerf81b0142008-12-09 22:06:23 +00001740 if (isa<PointerType>(constVal->getType()))
1741 MD->invalidateCachedPointerInfo(constVal);
Owen Anderson575f2812008-12-23 00:49:51 +00001742 VN.erase(p);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001743
Owen Andersone02ad522007-08-16 22:51:56 +00001744 toErase.push_back(p);
Owen Andersone6b4ff82008-06-18 21:41:49 +00001745 } else {
Chris Lattnerff36c952009-09-21 02:42:51 +00001746 localAvail[I->getParent()]->table.insert(std::make_pair(Num, I));
Owen Anderson98f6a6b2007-08-14 18:33:27 +00001747 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001748
Owen Anderson8a8d13c2008-07-03 17:44:33 +00001749 // If the number we were assigned was a brand new VN, then we don't
1750 // need to do a lookup to see if the number already exists
1751 // somewhere in the domtree: it can't!
Chris Lattnerff36c952009-09-21 02:42:51 +00001752 } else if (Num == NextNum) {
1753 localAvail[I->getParent()]->table.insert(std::make_pair(Num, I));
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001754
Owen Andersona03e7862008-12-15 02:03:00 +00001755 // Perform fast-path value-number based elimination of values inherited from
1756 // dominators.
Chris Lattnerff36c952009-09-21 02:42:51 +00001757 } else if (Value *repl = lookupNumber(I->getParent(), Num)) {
Owen Andersonc772be72007-12-08 01:37:09 +00001758 // Remove it!
Owen Anderson5aff8002007-07-31 23:27:13 +00001759 VN.erase(I);
Owen Anderson85c40642007-07-24 17:55:58 +00001760 I->replaceAllUsesWith(repl);
Chris Lattnerf81b0142008-12-09 22:06:23 +00001761 if (isa<PointerType>(repl->getType()))
1762 MD->invalidateCachedPointerInfo(repl);
Owen Anderson85c40642007-07-24 17:55:58 +00001763 toErase.push_back(I);
1764 return true;
Owen Andersona03e7862008-12-15 02:03:00 +00001765
1766#if 0
1767 // Perform slow-pathvalue-number based elimination with phi construction.
Chris Lattnerff36c952009-09-21 02:42:51 +00001768 } else if (Value *repl = AttemptRedundancyElimination(I, Num)) {
Owen Andersona03e7862008-12-15 02:03:00 +00001769 // Remove it!
1770 VN.erase(I);
1771 I->replaceAllUsesWith(repl);
1772 if (isa<PointerType>(repl->getType()))
1773 MD->invalidateCachedPointerInfo(repl);
1774 toErase.push_back(I);
1775 return true;
1776#endif
Owen Anderson8a8d13c2008-07-03 17:44:33 +00001777 } else {
Chris Lattnerff36c952009-09-21 02:42:51 +00001778 localAvail[I->getParent()]->table.insert(std::make_pair(Num, I));
Owen Anderson85c40642007-07-24 17:55:58 +00001779 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001780
Owen Anderson85c40642007-07-24 17:55:58 +00001781 return false;
1782}
1783
Bill Wendling42f17f62008-12-22 22:32:22 +00001784/// runOnFunction - This is the main transformation entry point for a function.
Owen Andersonbe168b32007-08-14 18:04:11 +00001785bool GVN::runOnFunction(Function& F) {
Chris Lattner02ca4422008-12-01 00:40:32 +00001786 MD = &getAnalysis<MemoryDependenceAnalysis>();
1787 DT = &getAnalysis<DominatorTree>();
Owen Andersonbcf2bd52008-05-12 20:15:55 +00001788 VN.setAliasAnalysis(&getAnalysis<AliasAnalysis>());
Chris Lattner02ca4422008-12-01 00:40:32 +00001789 VN.setMemDep(MD);
1790 VN.setDomTree(DT);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001791
Chris Lattnerff36c952009-09-21 02:42:51 +00001792 bool Changed = false;
1793 bool ShouldContinue = true;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001794
Owen Anderson26ed2572008-07-16 17:52:31 +00001795 // Merge unconditional branches, allowing PRE to catch more
1796 // optimization opportunities.
1797 for (Function::iterator FI = F.begin(), FE = F.end(); FI != FE; ) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001798 BasicBlock *BB = FI;
Owen Anderson26ed2572008-07-16 17:52:31 +00001799 ++FI;
Owen Andersonf59eef82008-07-17 00:01:40 +00001800 bool removedBlock = MergeBlockIntoPredecessor(BB, this);
1801 if (removedBlock) NumGVNBlocks++;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001802
Chris Lattnerff36c952009-09-21 02:42:51 +00001803 Changed |= removedBlock;
Owen Anderson26ed2572008-07-16 17:52:31 +00001804 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001805
Chris Lattner4bab29b2008-12-09 19:21:47 +00001806 unsigned Iteration = 0;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001807
Chris Lattnerff36c952009-09-21 02:42:51 +00001808 while (ShouldContinue) {
Dan Gohman0be10b02009-07-25 01:43:01 +00001809 DEBUG(errs() << "GVN iteration: " << Iteration << "\n");
Chris Lattnerff36c952009-09-21 02:42:51 +00001810 ShouldContinue = iterateOnFunction(F);
1811 Changed |= ShouldContinue;
Chris Lattner4bab29b2008-12-09 19:21:47 +00001812 ++Iteration;
Owen Andersonbe168b32007-08-14 18:04:11 +00001813 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001814
Owen Anderson916f4732008-07-18 18:03:38 +00001815 if (EnablePRE) {
Owen Anderson9c935902008-09-03 23:06:07 +00001816 bool PREChanged = true;
1817 while (PREChanged) {
1818 PREChanged = performPRE(F);
Chris Lattnerff36c952009-09-21 02:42:51 +00001819 Changed |= PREChanged;
Owen Anderson9c935902008-09-03 23:06:07 +00001820 }
Owen Anderson916f4732008-07-18 18:03:38 +00001821 }
Chris Lattner4bab29b2008-12-09 19:21:47 +00001822 // FIXME: Should perform GVN again after PRE does something. PRE can move
1823 // computations into blocks where they become fully redundant. Note that
1824 // we can't do this until PRE's critical edge splitting updates memdep.
1825 // Actually, when this happens, we should just fully integrate PRE into GVN.
Nuno Lopes274474b2008-10-10 16:25:50 +00001826
1827 cleanupGlobalSets();
1828
Chris Lattnerff36c952009-09-21 02:42:51 +00001829 return Changed;
Owen Andersonbe168b32007-08-14 18:04:11 +00001830}
1831
1832
Chris Lattnerff36c952009-09-21 02:42:51 +00001833bool GVN::processBlock(BasicBlock *BB) {
Chris Lattner4bab29b2008-12-09 19:21:47 +00001834 // FIXME: Kill off toErase by doing erasing eagerly in a helper function (and
1835 // incrementing BI before processing an instruction).
Owen Anderson9334fc62008-06-12 19:25:32 +00001836 SmallVector<Instruction*, 8> toErase;
Chris Lattnerff36c952009-09-21 02:42:51 +00001837 bool ChangedFunction = false;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001838
Owen Anderson9334fc62008-06-12 19:25:32 +00001839 for (BasicBlock::iterator BI = BB->begin(), BE = BB->end();
1840 BI != BE;) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001841 ChangedFunction |= processInstruction(BI, toErase);
Owen Anderson9334fc62008-06-12 19:25:32 +00001842 if (toErase.empty()) {
1843 ++BI;
1844 continue;
1845 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001846
Owen Anderson9334fc62008-06-12 19:25:32 +00001847 // If we need some instructions deleted, do it now.
1848 NumGVNInstr += toErase.size();
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001849
Owen Anderson9334fc62008-06-12 19:25:32 +00001850 // Avoid iterator invalidation.
1851 bool AtStart = BI == BB->begin();
1852 if (!AtStart)
1853 --BI;
1854
1855 for (SmallVector<Instruction*, 4>::iterator I = toErase.begin(),
Chris Lattner02ca4422008-12-01 00:40:32 +00001856 E = toErase.end(); I != E; ++I) {
Dan Gohman7e124382009-07-31 20:24:18 +00001857 DEBUG(errs() << "GVN removed: " << **I << '\n');
Chris Lattner02ca4422008-12-01 00:40:32 +00001858 MD->removeInstruction(*I);
Owen Anderson9334fc62008-06-12 19:25:32 +00001859 (*I)->eraseFromParent();
Bill Wendling84049422008-12-22 21:57:30 +00001860 DEBUG(verifyRemoved(*I));
Chris Lattner02ca4422008-12-01 00:40:32 +00001861 }
Chris Lattner4bab29b2008-12-09 19:21:47 +00001862 toErase.clear();
Owen Anderson9334fc62008-06-12 19:25:32 +00001863
1864 if (AtStart)
1865 BI = BB->begin();
1866 else
1867 ++BI;
Owen Anderson9334fc62008-06-12 19:25:32 +00001868 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001869
Chris Lattnerff36c952009-09-21 02:42:51 +00001870 return ChangedFunction;
Owen Anderson9334fc62008-06-12 19:25:32 +00001871}
1872
Owen Andersone6b4ff82008-06-18 21:41:49 +00001873/// performPRE - Perform a purely local form of PRE that looks for diamond
1874/// control flow patterns and attempts to perform simple PRE at the join point.
1875bool GVN::performPRE(Function& F) {
Chris Lattner66a3a3e2008-12-01 07:35:54 +00001876 bool Changed = false;
Owen Andersonec747c42008-06-19 19:54:19 +00001877 SmallVector<std::pair<TerminatorInst*, unsigned>, 4> toSplit;
Chris Lattner3304b562008-12-01 07:29:03 +00001878 DenseMap<BasicBlock*, Value*> predMap;
Owen Andersone6b4ff82008-06-18 21:41:49 +00001879 for (df_iterator<BasicBlock*> DI = df_begin(&F.getEntryBlock()),
1880 DE = df_end(&F.getEntryBlock()); DI != DE; ++DI) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001881 BasicBlock *CurrentBlock = *DI;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001882
Owen Andersone6b4ff82008-06-18 21:41:49 +00001883 // Nothing to PRE in the entry block.
1884 if (CurrentBlock == &F.getEntryBlock()) continue;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001885
Owen Andersone6b4ff82008-06-18 21:41:49 +00001886 for (BasicBlock::iterator BI = CurrentBlock->begin(),
1887 BE = CurrentBlock->end(); BI != BE; ) {
Chris Lattner66a3a3e2008-12-01 07:35:54 +00001888 Instruction *CurInst = BI++;
Duncan Sands2f500832009-05-06 06:49:50 +00001889
Victor Hernandez48c3c542009-09-18 22:35:49 +00001890 if (isa<AllocationInst>(CurInst) || isMalloc(CurInst) ||
1891 isa<TerminatorInst>(CurInst) || isa<PHINode>(CurInst) ||
Owen Anderson35b47072009-08-13 21:58:54 +00001892 (CurInst->getType() == Type::getVoidTy(F.getContext())) ||
Duncan Sands2f500832009-05-06 06:49:50 +00001893 CurInst->mayReadFromMemory() || CurInst->mayHaveSideEffects() ||
John Criswell6e0aa282009-03-10 15:04:53 +00001894 isa<DbgInfoIntrinsic>(CurInst))
Chris Lattner66a3a3e2008-12-01 07:35:54 +00001895 continue;
Duncan Sands2f500832009-05-06 06:49:50 +00001896
Chris Lattnerff36c952009-09-21 02:42:51 +00001897 uint32_t ValNo = VN.lookup(CurInst);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001898
Owen Andersone6b4ff82008-06-18 21:41:49 +00001899 // Look for the predecessors for PRE opportunities. We're
1900 // only trying to solve the basic diamond case, where
1901 // a value is computed in the successor and one predecessor,
1902 // but not the other. We also explicitly disallow cases
1903 // where the successor is its own predecessor, because they're
1904 // more complicated to get right.
Chris Lattnerff36c952009-09-21 02:42:51 +00001905 unsigned NumWith = 0;
1906 unsigned NumWithout = 0;
1907 BasicBlock *PREPred = 0;
Chris Lattner3304b562008-12-01 07:29:03 +00001908 predMap.clear();
1909
Owen Andersone6b4ff82008-06-18 21:41:49 +00001910 for (pred_iterator PI = pred_begin(CurrentBlock),
1911 PE = pred_end(CurrentBlock); PI != PE; ++PI) {
1912 // We're not interested in PRE where the block is its
Owen Anderson2a412722008-06-20 01:15:47 +00001913 // own predecessor, on in blocks with predecessors
1914 // that are not reachable.
1915 if (*PI == CurrentBlock) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001916 NumWithout = 2;
Owen Anderson2a412722008-06-20 01:15:47 +00001917 break;
1918 } else if (!localAvail.count(*PI)) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001919 NumWithout = 2;
Owen Anderson2a412722008-06-20 01:15:47 +00001920 break;
1921 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001922
1923 DenseMap<uint32_t, Value*>::iterator predV =
Chris Lattnerff36c952009-09-21 02:42:51 +00001924 localAvail[*PI]->table.find(ValNo);
Owen Anderson2a412722008-06-20 01:15:47 +00001925 if (predV == localAvail[*PI]->table.end()) {
Owen Andersone6b4ff82008-06-18 21:41:49 +00001926 PREPred = *PI;
Chris Lattnerff36c952009-09-21 02:42:51 +00001927 NumWithout++;
Chris Lattner66a3a3e2008-12-01 07:35:54 +00001928 } else if (predV->second == CurInst) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001929 NumWithout = 2;
Owen Andersone6b4ff82008-06-18 21:41:49 +00001930 } else {
Owen Anderson2a412722008-06-20 01:15:47 +00001931 predMap[*PI] = predV->second;
Chris Lattnerff36c952009-09-21 02:42:51 +00001932 NumWith++;
Owen Andersone6b4ff82008-06-18 21:41:49 +00001933 }
1934 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001935
Owen Andersone6b4ff82008-06-18 21:41:49 +00001936 // Don't do PRE when it might increase code size, i.e. when
1937 // we would need to insert instructions in more than one pred.
Chris Lattnerff36c952009-09-21 02:42:51 +00001938 if (NumWithout != 1 || NumWith == 0)
Owen Andersone6b4ff82008-06-18 21:41:49 +00001939 continue;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001940
Owen Andersonec747c42008-06-19 19:54:19 +00001941 // We can't do PRE safely on a critical edge, so instead we schedule
1942 // the edge to be split and perform the PRE the next time we iterate
1943 // on the function.
Chris Lattnerff36c952009-09-21 02:42:51 +00001944 unsigned SuccNum = 0;
Owen Andersonec747c42008-06-19 19:54:19 +00001945 for (unsigned i = 0, e = PREPred->getTerminator()->getNumSuccessors();
1946 i != e; ++i)
Owen Anderson9c935902008-09-03 23:06:07 +00001947 if (PREPred->getTerminator()->getSuccessor(i) == CurrentBlock) {
Chris Lattnerff36c952009-09-21 02:42:51 +00001948 SuccNum = i;
Owen Andersonec747c42008-06-19 19:54:19 +00001949 break;
1950 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001951
Chris Lattnerff36c952009-09-21 02:42:51 +00001952 if (isCriticalEdge(PREPred->getTerminator(), SuccNum)) {
1953 toSplit.push_back(std::make_pair(PREPred->getTerminator(), SuccNum));
Owen Andersonec747c42008-06-19 19:54:19 +00001954 continue;
1955 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001956
Owen Andersone6b4ff82008-06-18 21:41:49 +00001957 // Instantiate the expression the in predecessor that lacked it.
1958 // Because we are going top-down through the block, all value numbers
1959 // will be available in the predecessor by the time we need them. Any
1960 // that weren't original present will have been instantiated earlier
1961 // in this loop.
Chris Lattnerff36c952009-09-21 02:42:51 +00001962 Instruction *PREInstr = CurInst->clone(CurInst->getContext());
Owen Andersone6b4ff82008-06-18 21:41:49 +00001963 bool success = true;
Chris Lattner66a3a3e2008-12-01 07:35:54 +00001964 for (unsigned i = 0, e = CurInst->getNumOperands(); i != e; ++i) {
1965 Value *Op = PREInstr->getOperand(i);
1966 if (isa<Argument>(Op) || isa<Constant>(Op) || isa<GlobalValue>(Op))
1967 continue;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001968
Chris Lattner66a3a3e2008-12-01 07:35:54 +00001969 if (Value *V = lookupNumber(PREPred, VN.lookup(Op))) {
1970 PREInstr->setOperand(i, V);
1971 } else {
1972 success = false;
1973 break;
Owen Anderson14c612f2008-07-11 20:05:13 +00001974 }
Owen Andersone6b4ff82008-06-18 21:41:49 +00001975 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001976
Owen Andersone6b4ff82008-06-18 21:41:49 +00001977 // Fail out if we encounter an operand that is not available in
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001978 // the PRE predecessor. This is typically because of loads which
Owen Andersone6b4ff82008-06-18 21:41:49 +00001979 // are not value numbered precisely.
1980 if (!success) {
1981 delete PREInstr;
Bill Wendling3858cae2008-12-22 22:14:07 +00001982 DEBUG(verifyRemoved(PREInstr));
Owen Andersone6b4ff82008-06-18 21:41:49 +00001983 continue;
1984 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001985
Owen Andersone6b4ff82008-06-18 21:41:49 +00001986 PREInstr->insertBefore(PREPred->getTerminator());
Chris Lattner66a3a3e2008-12-01 07:35:54 +00001987 PREInstr->setName(CurInst->getName() + ".pre");
Owen Anderson2a412722008-06-20 01:15:47 +00001988 predMap[PREPred] = PREInstr;
Chris Lattnerff36c952009-09-21 02:42:51 +00001989 VN.add(PREInstr, ValNo);
Owen Andersone6b4ff82008-06-18 21:41:49 +00001990 NumGVNPRE++;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001991
Owen Andersone6b4ff82008-06-18 21:41:49 +00001992 // Update the availability map to include the new instruction.
Chris Lattnerff36c952009-09-21 02:42:51 +00001993 localAvail[PREPred]->table.insert(std::make_pair(ValNo, PREInstr));
Daniel Dunbar3be44e62009-09-20 02:20:51 +00001994
Owen Andersone6b4ff82008-06-18 21:41:49 +00001995 // Create a PHI to make the value available in this block.
Chris Lattner66a3a3e2008-12-01 07:35:54 +00001996 PHINode* Phi = PHINode::Create(CurInst->getType(),
1997 CurInst->getName() + ".pre-phi",
Owen Andersone6b4ff82008-06-18 21:41:49 +00001998 CurrentBlock->begin());
1999 for (pred_iterator PI = pred_begin(CurrentBlock),
2000 PE = pred_end(CurrentBlock); PI != PE; ++PI)
Owen Anderson2a412722008-06-20 01:15:47 +00002001 Phi->addIncoming(predMap[*PI], *PI);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00002002
Chris Lattnerff36c952009-09-21 02:42:51 +00002003 VN.add(Phi, ValNo);
2004 localAvail[CurrentBlock]->table[ValNo] = Phi;
Daniel Dunbar3be44e62009-09-20 02:20:51 +00002005
Chris Lattner66a3a3e2008-12-01 07:35:54 +00002006 CurInst->replaceAllUsesWith(Phi);
Chris Lattnerf81b0142008-12-09 22:06:23 +00002007 if (isa<PointerType>(Phi->getType()))
2008 MD->invalidateCachedPointerInfo(Phi);
Chris Lattner66a3a3e2008-12-01 07:35:54 +00002009 VN.erase(CurInst);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00002010
Dan Gohman7e124382009-07-31 20:24:18 +00002011 DEBUG(errs() << "GVN PRE removed: " << *CurInst << '\n');
Chris Lattner66a3a3e2008-12-01 07:35:54 +00002012 MD->removeInstruction(CurInst);
2013 CurInst->eraseFromParent();
Bill Wendling84049422008-12-22 21:57:30 +00002014 DEBUG(verifyRemoved(CurInst));
Chris Lattner66a3a3e2008-12-01 07:35:54 +00002015 Changed = true;
Owen Andersone6b4ff82008-06-18 21:41:49 +00002016 }
2017 }
Daniel Dunbar3be44e62009-09-20 02:20:51 +00002018
Owen Andersonec747c42008-06-19 19:54:19 +00002019 for (SmallVector<std::pair<TerminatorInst*, unsigned>, 4>::iterator
Anton Korobeynikov2e8710c2008-12-05 19:38:49 +00002020 I = toSplit.begin(), E = toSplit.end(); I != E; ++I)
Owen Andersonec747c42008-06-19 19:54:19 +00002021 SplitCriticalEdge(I->first, I->second, this);
Daniel Dunbar3be44e62009-09-20 02:20:51 +00002022
Anton Korobeynikov2e8710c2008-12-05 19:38:49 +00002023 return Changed || toSplit.size();
Owen Andersone6b4ff82008-06-18 21:41:49 +00002024}
2025
Bill Wendling42f17f62008-12-22 22:32:22 +00002026/// iterateOnFunction - Executes one iteration of GVN
Owen Andersonbe168b32007-08-14 18:04:11 +00002027bool GVN::iterateOnFunction(Function &F) {
Nuno Lopes274474b2008-10-10 16:25:50 +00002028 cleanupGlobalSets();
Chris Lattner98054902008-03-21 21:33:23 +00002029
Owen Andersonef8bf0f2009-04-01 23:53:49 +00002030 for (df_iterator<DomTreeNode*> DI = df_begin(DT->getRootNode()),
2031 DE = df_end(DT->getRootNode()); DI != DE; ++DI) {
2032 if (DI->getIDom())
2033 localAvail[DI->getBlock()] =
2034 new ValueNumberScope(localAvail[DI->getIDom()->getBlock()]);
2035 else
2036 localAvail[DI->getBlock()] = new ValueNumberScope(0);
2037 }
2038
Owen Anderson85c40642007-07-24 17:55:58 +00002039 // Top-down walk of the dominator tree
Chris Lattnerff36c952009-09-21 02:42:51 +00002040 bool Changed = false;
Owen Andersonef136f52008-12-15 03:52:17 +00002041#if 0
2042 // Needed for value numbering with phi construction to work.
Owen Andersona03e7862008-12-15 02:03:00 +00002043 ReversePostOrderTraversal<Function*> RPOT(&F);
2044 for (ReversePostOrderTraversal<Function*>::rpo_iterator RI = RPOT.begin(),
2045 RE = RPOT.end(); RI != RE; ++RI)
Chris Lattnerff36c952009-09-21 02:42:51 +00002046 Changed |= processBlock(*RI);
Owen Andersonef136f52008-12-15 03:52:17 +00002047#else
2048 for (df_iterator<DomTreeNode*> DI = df_begin(DT->getRootNode()),
2049 DE = df_end(DT->getRootNode()); DI != DE; ++DI)
Chris Lattnerff36c952009-09-21 02:42:51 +00002050 Changed |= processBlock(DI->getBlock());
Owen Andersonef136f52008-12-15 03:52:17 +00002051#endif
2052
Chris Lattnerff36c952009-09-21 02:42:51 +00002053 return Changed;
Owen Anderson85c40642007-07-24 17:55:58 +00002054}
Nuno Lopes274474b2008-10-10 16:25:50 +00002055
2056void GVN::cleanupGlobalSets() {
2057 VN.clear();
2058 phiMap.clear();
2059
2060 for (DenseMap<BasicBlock*, ValueNumberScope*>::iterator
2061 I = localAvail.begin(), E = localAvail.end(); I != E; ++I)
2062 delete I->second;
2063 localAvail.clear();
2064}
Bill Wendling2a023742008-12-22 21:36:08 +00002065
2066/// verifyRemoved - Verify that the specified instruction does not occur in our
2067/// internal data structures.
Bill Wendlingf9c0e9e2008-12-22 22:28:56 +00002068void GVN::verifyRemoved(const Instruction *Inst) const {
2069 VN.verifyRemoved(Inst);
Bill Wendling3858cae2008-12-22 22:14:07 +00002070
2071 // Walk through the PHI map to make sure the instruction isn't hiding in there
2072 // somewhere.
2073 for (PhiMapType::iterator
Bill Wendlingf9c0e9e2008-12-22 22:28:56 +00002074 I = phiMap.begin(), E = phiMap.end(); I != E; ++I) {
2075 assert(I->first != Inst && "Inst is still a key in PHI map!");
Bill Wendling3858cae2008-12-22 22:14:07 +00002076
2077 for (SmallPtrSet<Instruction*, 4>::iterator
Bill Wendlingf9c0e9e2008-12-22 22:28:56 +00002078 II = I->second.begin(), IE = I->second.end(); II != IE; ++II) {
2079 assert(*II != Inst && "Inst is still a value in PHI map!");
2080 }
2081 }
2082
2083 // Walk through the value number scope to make sure the instruction isn't
2084 // ferreted away in it.
2085 for (DenseMap<BasicBlock*, ValueNumberScope*>::iterator
2086 I = localAvail.begin(), E = localAvail.end(); I != E; ++I) {
2087 const ValueNumberScope *VNS = I->second;
2088
2089 while (VNS) {
2090 for (DenseMap<uint32_t, Value*>::iterator
2091 II = VNS->table.begin(), IE = VNS->table.end(); II != IE; ++II) {
2092 assert(II->second != Inst && "Inst still in value numbering scope!");
2093 }
2094
2095 VNS = VNS->parent;
Bill Wendling3858cae2008-12-22 22:14:07 +00002096 }
2097 }
Bill Wendling2a023742008-12-22 21:36:08 +00002098}