Nick Lewycky | 7ed1dbf | 2013-06-10 23:10:59 +0000 | [diff] [blame] | 1 | //===- MemoryDependenceAnalysis.cpp - Mem Deps Implementation -------------===// |
Owen Anderson | c0daf5f | 2007-07-06 23:14:35 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | f3ebc3f | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Owen Anderson | c0daf5f | 2007-07-06 23:14:35 +0000 | [diff] [blame] | 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file implements an analysis that determines, for a given memory |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 11 | // operation, what preceding memory operations it depends on. It builds on |
Owen Anderson | fa78835 | 2007-08-08 22:01:54 +0000 | [diff] [blame] | 12 | // alias analysis information, and tries to provide a lazy, caching interface to |
Owen Anderson | c0daf5f | 2007-07-06 23:14:35 +0000 | [diff] [blame] | 13 | // a common kind of alias information query. |
| 14 | // |
| 15 | //===----------------------------------------------------------------------===// |
| 16 | |
| 17 | #include "llvm/Analysis/MemoryDependenceAnalysis.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 18 | #include "llvm/ADT/STLExtras.h" |
| 19 | #include "llvm/ADT/Statistic.h" |
Owen Anderson | c0daf5f | 2007-07-06 23:14:35 +0000 | [diff] [blame] | 20 | #include "llvm/Analysis/AliasAnalysis.h" |
Chandler Carruth | 66b3130 | 2015-01-04 12:03:27 +0000 | [diff] [blame] | 21 | #include "llvm/Analysis/AssumptionCache.h" |
Chris Lattner | 5030c6a | 2009-11-27 00:34:38 +0000 | [diff] [blame] | 22 | #include "llvm/Analysis/InstructionSimplify.h" |
Victor Hernandez | f390e04 | 2009-10-27 20:05:49 +0000 | [diff] [blame] | 23 | #include "llvm/Analysis/MemoryBuiltins.h" |
Chris Lattner | 972e6d8 | 2009-12-09 01:59:31 +0000 | [diff] [blame] | 24 | #include "llvm/Analysis/PHITransAddr.h" |
Bruno Cardoso Lopes | dfc1d96 | 2015-07-31 14:31:35 +0000 | [diff] [blame] | 25 | #include "llvm/Analysis/OrderedBasicBlock.h" |
Dan Gohman | a4fcd24 | 2010-12-15 20:02:24 +0000 | [diff] [blame] | 26 | #include "llvm/Analysis/ValueTracking.h" |
Chandler Carruth | d06034d | 2015-08-12 17:47:44 +0000 | [diff] [blame] | 27 | #include "llvm/Analysis/TargetLibraryInfo.h" |
Chandler Carruth | 9fb823b | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 28 | #include "llvm/IR/DataLayout.h" |
Chandler Carruth | 5ad5f15 | 2014-01-13 09:26:24 +0000 | [diff] [blame] | 29 | #include "llvm/IR/Dominators.h" |
Chandler Carruth | 9fb823b | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 30 | #include "llvm/IR/Function.h" |
| 31 | #include "llvm/IR/Instructions.h" |
| 32 | #include "llvm/IR/IntrinsicInst.h" |
| 33 | #include "llvm/IR/LLVMContext.h" |
Chandler Carruth | aa0ab63 | 2014-03-04 12:09:19 +0000 | [diff] [blame] | 34 | #include "llvm/IR/PredIteratorCache.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 35 | #include "llvm/Support/Debug.h" |
Owen Anderson | c0daf5f | 2007-07-06 23:14:35 +0000 | [diff] [blame] | 36 | using namespace llvm; |
| 37 | |
Chandler Carruth | f1221bd | 2014-04-22 02:48:03 +0000 | [diff] [blame] | 38 | #define DEBUG_TYPE "memdep" |
| 39 | |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 40 | STATISTIC(NumCacheNonLocal, "Number of fully cached non-local responses"); |
| 41 | STATISTIC(NumCacheDirtyNonLocal, "Number of dirty cached non-local responses"); |
Chris Lattner | e7d7e13 | 2008-11-29 22:02:15 +0000 | [diff] [blame] | 42 | STATISTIC(NumUncacheNonLocal, "Number of uncached non-local responses"); |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 43 | |
| 44 | STATISTIC(NumCacheNonLocalPtr, |
| 45 | "Number of fully cached non-local ptr responses"); |
| 46 | STATISTIC(NumCacheDirtyNonLocalPtr, |
| 47 | "Number of cached, but dirty, non-local ptr responses"); |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 48 | STATISTIC(NumUncacheNonLocalPtr, "Number of uncached non-local ptr responses"); |
Chris Lattner | 5ed409e | 2008-12-08 07:31:50 +0000 | [diff] [blame] | 49 | STATISTIC(NumCacheCompleteNonLocalPtr, |
| 50 | "Number of block queries that were completely cached"); |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 51 | |
Eli Friedman | 8b098b0 | 2011-06-15 23:59:25 +0000 | [diff] [blame] | 52 | // Limit for the number of instructions to scan in a block. |
Jingyue Wu | d058ea9 | 2015-07-21 21:50:39 +0000 | [diff] [blame] | 53 | |
| 54 | static cl::opt<unsigned> BlockScanLimit( |
| 55 | "memdep-block-scan-limit", cl::Hidden, cl::init(100), |
| 56 | cl::desc("The number of instructions to scan in a block in memory " |
| 57 | "dependency analysis (default = 100)")); |
Eli Friedman | 8b098b0 | 2011-06-15 23:59:25 +0000 | [diff] [blame] | 58 | |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 59 | static cl::opt<unsigned> |
| 60 | BlockNumberLimit("memdep-block-number-limit", cl::Hidden, cl::init(1000), |
| 61 | cl::desc("The number of blocks to scan during memory " |
| 62 | "dependency analysis (default = 1000)")); |
Joerg Sonnenberger | 36894dc | 2016-02-20 11:24:44 +0000 | [diff] [blame] | 63 | |
Bruno Cardoso Lopes | e3c513a | 2014-10-01 20:07:13 +0000 | [diff] [blame] | 64 | // Limit on the number of memdep results to process. |
Aaron Ballman | 254dd7e | 2014-10-02 13:17:11 +0000 | [diff] [blame] | 65 | static const unsigned int NumResultsLimit = 100; |
Bruno Cardoso Lopes | e3c513a | 2014-10-01 20:07:13 +0000 | [diff] [blame] | 66 | |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 67 | /// This is a helper function that removes Val from 'Inst's set in ReverseMap. |
| 68 | /// |
| 69 | /// If the set becomes empty, remove Inst's entry. |
Chris Lattner | de4440c | 2008-12-07 18:39:13 +0000 | [diff] [blame] | 70 | template <typename KeyTy> |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 71 | static void |
| 72 | RemoveFromReverseMap(DenseMap<Instruction *, SmallPtrSet<KeyTy, 4>> &ReverseMap, |
| 73 | Instruction *Inst, KeyTy Val) { |
| 74 | typename DenseMap<Instruction *, SmallPtrSet<KeyTy, 4>>::iterator InstIt = |
| 75 | ReverseMap.find(Inst); |
Chris Lattner | de4440c | 2008-12-07 18:39:13 +0000 | [diff] [blame] | 76 | assert(InstIt != ReverseMap.end() && "Reverse map out of sync?"); |
| 77 | bool Found = InstIt->second.erase(Val); |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 78 | assert(Found && "Invalid reverse map!"); |
| 79 | (void)Found; |
Chris Lattner | de4440c | 2008-12-07 18:39:13 +0000 | [diff] [blame] | 80 | if (InstIt->second.empty()) |
| 81 | ReverseMap.erase(InstIt); |
| 82 | } |
| 83 | |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 84 | /// If the given instruction references a specific memory location, fill in Loc |
| 85 | /// with the details, otherwise set Loc.Ptr to null. |
| 86 | /// |
| 87 | /// Returns a ModRefInfo value describing the general behavior of the |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 88 | /// instruction. |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 89 | static ModRefInfo GetLocation(const Instruction *Inst, MemoryLocation &Loc, |
Chandler Carruth | d06034d | 2015-08-12 17:47:44 +0000 | [diff] [blame] | 90 | const TargetLibraryInfo &TLI) { |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 91 | if (const LoadInst *LI = dyn_cast<LoadInst>(Inst)) { |
Eli Friedman | 5494ada | 2011-08-15 20:54:19 +0000 | [diff] [blame] | 92 | if (LI->isUnordered()) { |
Chandler Carruth | 70c61c1 | 2015-06-04 02:03:15 +0000 | [diff] [blame] | 93 | Loc = MemoryLocation::get(LI); |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 94 | return MRI_Ref; |
Jakub Staszak | fa41def | 2013-03-20 23:53:45 +0000 | [diff] [blame] | 95 | } |
| 96 | if (LI->getOrdering() == Monotonic) { |
Chandler Carruth | 70c61c1 | 2015-06-04 02:03:15 +0000 | [diff] [blame] | 97 | Loc = MemoryLocation::get(LI); |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 98 | return MRI_ModRef; |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 99 | } |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 100 | Loc = MemoryLocation(); |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 101 | return MRI_ModRef; |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 102 | } |
| 103 | |
| 104 | if (const StoreInst *SI = dyn_cast<StoreInst>(Inst)) { |
Eli Friedman | 5494ada | 2011-08-15 20:54:19 +0000 | [diff] [blame] | 105 | if (SI->isUnordered()) { |
Chandler Carruth | 70c61c1 | 2015-06-04 02:03:15 +0000 | [diff] [blame] | 106 | Loc = MemoryLocation::get(SI); |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 107 | return MRI_Mod; |
Jakub Staszak | fa41def | 2013-03-20 23:53:45 +0000 | [diff] [blame] | 108 | } |
| 109 | if (SI->getOrdering() == Monotonic) { |
Chandler Carruth | 70c61c1 | 2015-06-04 02:03:15 +0000 | [diff] [blame] | 110 | Loc = MemoryLocation::get(SI); |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 111 | return MRI_ModRef; |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 112 | } |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 113 | Loc = MemoryLocation(); |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 114 | return MRI_ModRef; |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 115 | } |
| 116 | |
| 117 | if (const VAArgInst *V = dyn_cast<VAArgInst>(Inst)) { |
Chandler Carruth | 70c61c1 | 2015-06-04 02:03:15 +0000 | [diff] [blame] | 118 | Loc = MemoryLocation::get(V); |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 119 | return MRI_ModRef; |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 120 | } |
| 121 | |
Chandler Carruth | d06034d | 2015-08-12 17:47:44 +0000 | [diff] [blame] | 122 | if (const CallInst *CI = isFreeCall(Inst, &TLI)) { |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 123 | // calls to free() deallocate the entire structure |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 124 | Loc = MemoryLocation(CI->getArgOperand(0)); |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 125 | return MRI_Mod; |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 126 | } |
| 127 | |
Hal Finkel | cc39b67 | 2014-07-24 12:16:19 +0000 | [diff] [blame] | 128 | if (const IntrinsicInst *II = dyn_cast<IntrinsicInst>(Inst)) { |
| 129 | AAMDNodes AAInfo; |
| 130 | |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 131 | switch (II->getIntrinsicID()) { |
| 132 | case Intrinsic::lifetime_start: |
| 133 | case Intrinsic::lifetime_end: |
| 134 | case Intrinsic::invariant_start: |
Hal Finkel | cc39b67 | 2014-07-24 12:16:19 +0000 | [diff] [blame] | 135 | II->getAAMetadata(AAInfo); |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 136 | Loc = MemoryLocation( |
| 137 | II->getArgOperand(1), |
| 138 | cast<ConstantInt>(II->getArgOperand(0))->getZExtValue(), AAInfo); |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 139 | // These intrinsics don't really modify the memory, but returning Mod |
| 140 | // will allow them to be handled conservatively. |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 141 | return MRI_Mod; |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 142 | case Intrinsic::invariant_end: |
Hal Finkel | cc39b67 | 2014-07-24 12:16:19 +0000 | [diff] [blame] | 143 | II->getAAMetadata(AAInfo); |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 144 | Loc = MemoryLocation( |
| 145 | II->getArgOperand(2), |
| 146 | cast<ConstantInt>(II->getArgOperand(1))->getZExtValue(), AAInfo); |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 147 | // These intrinsics don't really modify the memory, but returning Mod |
| 148 | // will allow them to be handled conservatively. |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 149 | return MRI_Mod; |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 150 | default: |
| 151 | break; |
| 152 | } |
Hal Finkel | cc39b67 | 2014-07-24 12:16:19 +0000 | [diff] [blame] | 153 | } |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 154 | |
| 155 | // Otherwise, just do the coarse-grained thing that always works. |
| 156 | if (Inst->mayWriteToMemory()) |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 157 | return MRI_ModRef; |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 158 | if (Inst->mayReadFromMemory()) |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 159 | return MRI_Ref; |
| 160 | return MRI_NoModRef; |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 161 | } |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 162 | |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 163 | /// Private helper for finding the local dependencies of a call site. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 164 | MemDepResult MemoryDependenceResults::getCallSiteDependencyFrom( |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 165 | CallSite CS, bool isReadOnlyCall, BasicBlock::iterator ScanIt, |
| 166 | BasicBlock *BB) { |
Eli Friedman | 8b098b0 | 2011-06-15 23:59:25 +0000 | [diff] [blame] | 167 | unsigned Limit = BlockScanLimit; |
| 168 | |
Owen Anderson | 2b21c3c | 2007-08-08 22:26:03 +0000 | [diff] [blame] | 169 | // Walk backwards through the block, looking for dependencies |
Chris Lattner | 51ba8d0 | 2008-11-29 03:47:00 +0000 | [diff] [blame] | 170 | while (ScanIt != BB->begin()) { |
Eli Friedman | 8b098b0 | 2011-06-15 23:59:25 +0000 | [diff] [blame] | 171 | // Limit the amount of scanning we do so we don't end up with quadratic |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 172 | // running time on extreme testcases. |
Eli Friedman | 8b098b0 | 2011-06-15 23:59:25 +0000 | [diff] [blame] | 173 | --Limit; |
| 174 | if (!Limit) |
| 175 | return MemDepResult::getUnknown(); |
| 176 | |
Duncan P. N. Exon Smith | 5a82c91 | 2015-10-10 00:53:03 +0000 | [diff] [blame] | 177 | Instruction *Inst = &*--ScanIt; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 178 | |
Owen Anderson | 9c88457 | 2007-07-10 17:59:22 +0000 | [diff] [blame] | 179 | // If this inst is a memory op, get the pointer it accessed |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 180 | MemoryLocation Loc; |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 181 | ModRefInfo MR = GetLocation(Inst, Loc, TLI); |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 182 | if (Loc.Ptr) { |
| 183 | // A simple instruction. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 184 | if (AA.getModRefInfo(CS, Loc) != MRI_NoModRef) |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 185 | return MemDepResult::getClobber(Inst); |
| 186 | continue; |
| 187 | } |
| 188 | |
Benjamin Kramer | 3a09ef6 | 2015-04-10 14:50:08 +0000 | [diff] [blame] | 189 | if (auto InstCS = CallSite(Inst)) { |
Owen Anderson | f9a9cf9 | 2009-03-09 05:12:38 +0000 | [diff] [blame] | 190 | // Debug intrinsics don't cause dependences. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 191 | if (isa<DbgInfoIntrinsic>(Inst)) |
| 192 | continue; |
Chris Lattner | 0e3d633 | 2008-12-05 21:04:20 +0000 | [diff] [blame] | 193 | // If these two calls do not interfere, look past it. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 194 | switch (AA.getModRefInfo(CS, InstCS)) { |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 195 | case MRI_NoModRef: |
Dan Gohman | 26ef7c7 | 2010-08-05 22:09:15 +0000 | [diff] [blame] | 196 | // If the two calls are the same, return InstCS as a Def, so that |
| 197 | // CS can be found redundant and eliminated. |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 198 | if (isReadOnlyCall && !(MR & MRI_Mod) && |
Dan Gohman | 26ef7c7 | 2010-08-05 22:09:15 +0000 | [diff] [blame] | 199 | CS.getInstruction()->isIdenticalToWhenDefined(Inst)) |
| 200 | return MemDepResult::getDef(Inst); |
| 201 | |
| 202 | // Otherwise if the two calls don't interact (e.g. InstCS is readnone) |
| 203 | // keep scanning. |
Nadav Rotem | 5d4e205 | 2012-08-13 23:03:43 +0000 | [diff] [blame] | 204 | continue; |
Chris Lattner | 702e46e | 2008-12-09 21:19:42 +0000 | [diff] [blame] | 205 | default: |
Chris Lattner | 0e3d633 | 2008-12-05 21:04:20 +0000 | [diff] [blame] | 206 | return MemDepResult::getClobber(Inst); |
Chris Lattner | 702e46e | 2008-12-09 21:19:42 +0000 | [diff] [blame] | 207 | } |
Chris Lattner | ff862c4 | 2008-11-30 01:44:00 +0000 | [diff] [blame] | 208 | } |
Nadav Rotem | 5d4e205 | 2012-08-13 23:03:43 +0000 | [diff] [blame] | 209 | |
| 210 | // If we could not obtain a pointer for the instruction and the instruction |
| 211 | // touches memory then assume that this is a dependency. |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 212 | if (MR != MRI_NoModRef) |
Nadav Rotem | 5d4e205 | 2012-08-13 23:03:43 +0000 | [diff] [blame] | 213 | return MemDepResult::getClobber(Inst); |
Owen Anderson | 9c88457 | 2007-07-10 17:59:22 +0000 | [diff] [blame] | 214 | } |
Nadav Rotem | 5d4e205 | 2012-08-13 23:03:43 +0000 | [diff] [blame] | 215 | |
Eli Friedman | 7d58bc7 | 2011-06-15 00:47:34 +0000 | [diff] [blame] | 216 | // No dependence found. If this is the entry block of the function, it is |
| 217 | // unknown, otherwise it is non-local. |
Chris Lattner | 2faa2c7 | 2008-12-07 02:15:47 +0000 | [diff] [blame] | 218 | if (BB != &BB->getParent()->getEntryBlock()) |
| 219 | return MemDepResult::getNonLocal(); |
Eli Friedman | c1702c8 | 2011-10-13 22:14:57 +0000 | [diff] [blame] | 220 | return MemDepResult::getNonFuncLocal(); |
Owen Anderson | 9c88457 | 2007-07-10 17:59:22 +0000 | [diff] [blame] | 221 | } |
| 222 | |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 223 | /// Return true if LI is a load that would fully overlap MemLoc if done as |
| 224 | /// a wider legal integer load. |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 225 | /// |
| 226 | /// MemLocBase, MemLocOffset are lazily computed here the first time the |
| 227 | /// base/offs of memloc is needed. |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 228 | static bool isLoadLoadClobberIfExtendedToFullWidth(const MemoryLocation &MemLoc, |
| 229 | const Value *&MemLocBase, |
| 230 | int64_t &MemLocOffs, |
| 231 | const LoadInst *LI) { |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 232 | const DataLayout &DL = LI->getModule()->getDataLayout(); |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 233 | |
| 234 | // If we haven't already computed the base/offset of MemLoc, do so now. |
Craig Topper | 9f00886 | 2014-04-15 04:59:12 +0000 | [diff] [blame] | 235 | if (!MemLocBase) |
Rafael Espindola | 7c68beb | 2014-02-18 15:33:12 +0000 | [diff] [blame] | 236 | MemLocBase = GetPointerBaseWithConstantOffset(MemLoc.Ptr, MemLocOffs, DL); |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 237 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 238 | unsigned Size = MemoryDependenceResults::getLoadLoadClobberFullWidthSize( |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 239 | MemLocBase, MemLocOffs, MemLoc.Size, LI); |
Chris Lattner | 827a270 | 2011-04-28 07:29:08 +0000 | [diff] [blame] | 240 | return Size != 0; |
| 241 | } |
| 242 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 243 | unsigned MemoryDependenceResults::getLoadLoadClobberFullWidthSize( |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 244 | const Value *MemLocBase, int64_t MemLocOffs, unsigned MemLocSize, |
| 245 | const LoadInst *LI) { |
Eli Friedman | 5494ada | 2011-08-15 20:54:19 +0000 | [diff] [blame] | 246 | // We can only extend simple integer loads. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 247 | if (!isa<IntegerType>(LI->getType()) || !LI->isSimple()) |
| 248 | return 0; |
Kostya Serebryany | 3838f27 | 2013-02-13 05:59:45 +0000 | [diff] [blame] | 249 | |
| 250 | // Load widening is hostile to ThreadSanitizer: it may cause false positives |
| 251 | // or make the reports more cryptic (access sizes are wrong). |
Duncan P. N. Exon Smith | b3fc83c | 2015-02-14 00:12:15 +0000 | [diff] [blame] | 252 | if (LI->getParent()->getParent()->hasFnAttribute(Attribute::SanitizeThread)) |
Kostya Serebryany | 3838f27 | 2013-02-13 05:59:45 +0000 | [diff] [blame] | 253 | return 0; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 254 | |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 255 | const DataLayout &DL = LI->getModule()->getDataLayout(); |
| 256 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 257 | // Get the base of this load. |
| 258 | int64_t LIOffs = 0; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 259 | const Value *LIBase = |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 260 | GetPointerBaseWithConstantOffset(LI->getPointerOperand(), LIOffs, DL); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 261 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 262 | // If the two pointers are not based on the same pointer, we can't tell that |
| 263 | // they are related. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 264 | if (LIBase != MemLocBase) |
| 265 | return 0; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 266 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 267 | // Okay, the two values are based on the same pointer, but returned as |
| 268 | // no-alias. This happens when we have things like two byte loads at "P+1" |
| 269 | // and "P+3". Check to see if increasing the size of the "LI" load up to its |
| 270 | // alignment (or the largest native integer type) will allow us to load all |
| 271 | // the bits required by MemLoc. |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 272 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 273 | // If MemLoc is before LI, then no widening of LI will help us out. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 274 | if (MemLocOffs < LIOffs) |
| 275 | return 0; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 276 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 277 | // Get the alignment of the load in bytes. We assume that it is safe to load |
| 278 | // any legal integer up to this size without a problem. For example, if we're |
| 279 | // looking at an i8 load on x86-32 that is known 1024 byte aligned, we can |
| 280 | // widen it up to an i32 load. If it is known 2-byte aligned, we can widen it |
| 281 | // to i16. |
| 282 | unsigned LoadAlign = LI->getAlignment(); |
| 283 | |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 284 | int64_t MemLocEnd = MemLocOffs + MemLocSize; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 285 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 286 | // If no amount of rounding up will let MemLoc fit into LI, then bail out. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 287 | if (LIOffs + LoadAlign < MemLocEnd) |
| 288 | return 0; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 289 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 290 | // This is the size of the load to try. Start with the next larger power of |
| 291 | // two. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 292 | unsigned NewLoadByteSize = LI->getType()->getPrimitiveSizeInBits() / 8U; |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 293 | NewLoadByteSize = NextPowerOf2(NewLoadByteSize); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 294 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 295 | while (1) { |
| 296 | // If this load size is bigger than our known alignment or would not fit |
| 297 | // into a native integer register, then we fail. |
| 298 | if (NewLoadByteSize > LoadAlign || |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 299 | !DL.fitsInLegalInteger(NewLoadByteSize * 8)) |
Chris Lattner | 827a270 | 2011-04-28 07:29:08 +0000 | [diff] [blame] | 300 | return 0; |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 301 | |
Duncan P. N. Exon Smith | b3fc83c | 2015-02-14 00:12:15 +0000 | [diff] [blame] | 302 | if (LIOffs + NewLoadByteSize > MemLocEnd && |
| 303 | LI->getParent()->getParent()->hasFnAttribute( |
| 304 | Attribute::SanitizeAddress)) |
Kostya Serebryany | 9e0d377 | 2012-02-06 22:48:56 +0000 | [diff] [blame] | 305 | // We will be reading past the location accessed by the original program. |
| 306 | // While this is safe in a regular build, Address Safety analysis tools |
| 307 | // may start reporting false warnings. So, don't do widening. |
| 308 | return 0; |
Kostya Serebryany | 9e0d377 | 2012-02-06 22:48:56 +0000 | [diff] [blame] | 309 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 310 | // If a load of this width would include all of MemLoc, then we succeed. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 311 | if (LIOffs + NewLoadByteSize >= MemLocEnd) |
Chris Lattner | 827a270 | 2011-04-28 07:29:08 +0000 | [diff] [blame] | 312 | return NewLoadByteSize; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 313 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 314 | NewLoadByteSize <<= 1; |
| 315 | } |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 316 | } |
| 317 | |
Philip Reames | a7ad6a5 | 2015-01-26 18:54:27 +0000 | [diff] [blame] | 318 | static bool isVolatile(Instruction *Inst) { |
| 319 | if (LoadInst *LI = dyn_cast<LoadInst>(Inst)) |
| 320 | return LI->isVolatile(); |
| 321 | else if (StoreInst *SI = dyn_cast<StoreInst>(Inst)) |
| 322 | return SI->isVolatile(); |
| 323 | else if (AtomicCmpXchgInst *AI = dyn_cast<AtomicCmpXchgInst>(Inst)) |
| 324 | return AI->isVolatile(); |
| 325 | return false; |
| 326 | } |
| 327 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 328 | MemDepResult MemoryDependenceResults::getPointerDependencyFrom( |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 329 | const MemoryLocation &MemLoc, bool isLoad, BasicBlock::iterator ScanIt, |
| 330 | BasicBlock *BB, Instruction *QueryInst) { |
Chris Lattner | 2faa2c7 | 2008-12-07 02:15:47 +0000 | [diff] [blame] | 331 | |
Piotr Padlewski | dc9b2cf | 2015-10-02 22:12:22 +0000 | [diff] [blame] | 332 | if (QueryInst != nullptr) { |
| 333 | if (auto *LI = dyn_cast<LoadInst>(QueryInst)) { |
| 334 | MemDepResult invariantGroupDependency = |
| 335 | getInvariantGroupPointerDependency(LI, BB); |
| 336 | |
| 337 | if (invariantGroupDependency.isDef()) |
| 338 | return invariantGroupDependency; |
| 339 | } |
| 340 | } |
| 341 | return getSimplePointerDependencyFrom(MemLoc, isLoad, ScanIt, BB, QueryInst); |
| 342 | } |
| 343 | |
| 344 | MemDepResult |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 345 | MemoryDependenceResults::getInvariantGroupPointerDependency(LoadInst *LI, |
Piotr Padlewski | dc9b2cf | 2015-10-02 22:12:22 +0000 | [diff] [blame] | 346 | BasicBlock *BB) { |
| 347 | Value *LoadOperand = LI->getPointerOperand(); |
| 348 | // It's is not safe to walk the use list of global value, because function |
| 349 | // passes aren't allowed to look outside their functions. |
| 350 | if (isa<GlobalValue>(LoadOperand)) |
| 351 | return MemDepResult::getUnknown(); |
| 352 | |
| 353 | auto *InvariantGroupMD = LI->getMetadata(LLVMContext::MD_invariant_group); |
| 354 | if (!InvariantGroupMD) |
| 355 | return MemDepResult::getUnknown(); |
| 356 | |
| 357 | MemDepResult Result = MemDepResult::getUnknown(); |
| 358 | llvm::SmallSet<Value *, 14> Seen; |
| 359 | // Queue to process all pointers that are equivalent to load operand. |
| 360 | llvm::SmallVector<Value *, 8> LoadOperandsQueue; |
| 361 | LoadOperandsQueue.push_back(LoadOperand); |
| 362 | while (!LoadOperandsQueue.empty()) { |
| 363 | Value *Ptr = LoadOperandsQueue.pop_back_val(); |
| 364 | if (isa<GlobalValue>(Ptr)) |
| 365 | continue; |
| 366 | |
| 367 | if (auto *BCI = dyn_cast<BitCastInst>(Ptr)) { |
| 368 | if (!Seen.count(BCI->getOperand(0))) { |
| 369 | LoadOperandsQueue.push_back(BCI->getOperand(0)); |
| 370 | Seen.insert(BCI->getOperand(0)); |
| 371 | } |
| 372 | } |
| 373 | |
| 374 | for (Use &Us : Ptr->uses()) { |
| 375 | auto *U = dyn_cast<Instruction>(Us.getUser()); |
Chandler Carruth | aef32bd | 2016-03-11 13:46:00 +0000 | [diff] [blame] | 376 | if (!U || U == LI || !DT.dominates(U, LI)) |
Piotr Padlewski | dc9b2cf | 2015-10-02 22:12:22 +0000 | [diff] [blame] | 377 | continue; |
| 378 | |
| 379 | if (auto *BCI = dyn_cast<BitCastInst>(U)) { |
| 380 | if (!Seen.count(BCI)) { |
| 381 | LoadOperandsQueue.push_back(BCI); |
| 382 | Seen.insert(BCI); |
| 383 | } |
| 384 | continue; |
| 385 | } |
| 386 | // If we hit load/store with the same invariant.group metadata (and the |
| 387 | // same pointer operand) we can assume that value pointed by pointer |
| 388 | // operand didn't change. |
| 389 | if ((isa<LoadInst>(U) || isa<StoreInst>(U)) && U->getParent() == BB && |
| 390 | U->getMetadata(LLVMContext::MD_invariant_group) == InvariantGroupMD) |
| 391 | return MemDepResult::getDef(U); |
| 392 | } |
| 393 | } |
| 394 | return Result; |
| 395 | } |
| 396 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 397 | MemDepResult MemoryDependenceResults::getSimplePointerDependencyFrom( |
Piotr Padlewski | dc9b2cf | 2015-10-02 22:12:22 +0000 | [diff] [blame] | 398 | const MemoryLocation &MemLoc, bool isLoad, BasicBlock::iterator ScanIt, |
| 399 | BasicBlock *BB, Instruction *QueryInst) { |
| 400 | |
Craig Topper | 9f00886 | 2014-04-15 04:59:12 +0000 | [diff] [blame] | 401 | const Value *MemLocBase = nullptr; |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 402 | int64_t MemLocOffset = 0; |
Eli Friedman | 8b098b0 | 2011-06-15 23:59:25 +0000 | [diff] [blame] | 403 | unsigned Limit = BlockScanLimit; |
Shuxin Yang | 408bdad | 2013-03-06 17:48:48 +0000 | [diff] [blame] | 404 | bool isInvariantLoad = false; |
Robin Morisset | 163ef04 | 2014-08-29 20:32:58 +0000 | [diff] [blame] | 405 | |
| 406 | // We must be careful with atomic accesses, as they may allow another thread |
| 407 | // to touch this location, clobbering it. We are conservative: if the |
| 408 | // QueryInst is not a simple (non-atomic) memory access, we automatically |
| 409 | // return getClobber. |
| 410 | // If it is simple, we know based on the results of |
| 411 | // "Compiler testing via a theory of sound optimisations in the C11/C++11 |
| 412 | // memory model" in PLDI 2013, that a non-atomic location can only be |
| 413 | // clobbered between a pair of a release and an acquire action, with no |
| 414 | // access to the location in between. |
| 415 | // Here is an example for giving the general intuition behind this rule. |
| 416 | // In the following code: |
| 417 | // store x 0; |
| 418 | // release action; [1] |
| 419 | // acquire action; [4] |
| 420 | // %val = load x; |
| 421 | // It is unsafe to replace %val by 0 because another thread may be running: |
| 422 | // acquire action; [2] |
| 423 | // store x 42; |
| 424 | // release action; [3] |
| 425 | // with synchronization from 1 to 2 and from 3 to 4, resulting in %val |
| 426 | // being 42. A key property of this program however is that if either |
| 427 | // 1 or 4 were missing, there would be a race between the store of 42 |
| 428 | // either the store of 0 or the load (making the whole progam racy). |
Nick Lewycky | 947ca8a | 2016-01-04 16:44:44 +0000 | [diff] [blame] | 429 | // The paper mentioned above shows that the same property is respected |
Robin Morisset | 163ef04 | 2014-08-29 20:32:58 +0000 | [diff] [blame] | 430 | // by every program that can detect any optimisation of that kind: either |
| 431 | // it is racy (undefined) or there is a release followed by an acquire |
| 432 | // between the pair of accesses under consideration. |
Robin Morisset | 163ef04 | 2014-08-29 20:32:58 +0000 | [diff] [blame] | 433 | |
Philip Reames | 4dbd88f | 2015-03-24 23:54:54 +0000 | [diff] [blame] | 434 | // If the load is invariant, we "know" that it doesn't alias *any* write. We |
| 435 | // do want to respect mustalias results since defs are useful for value |
| 436 | // forwarding, but any mayalias write can be assumed to be noalias. |
| 437 | // Arguably, this logic should be pushed inside AliasAnalysis itself. |
Shuxin Yang | 408bdad | 2013-03-06 17:48:48 +0000 | [diff] [blame] | 438 | if (isLoad && QueryInst) { |
| 439 | LoadInst *LI = dyn_cast<LoadInst>(QueryInst); |
Craig Topper | 9f00886 | 2014-04-15 04:59:12 +0000 | [diff] [blame] | 440 | if (LI && LI->getMetadata(LLVMContext::MD_invariant_load) != nullptr) |
Shuxin Yang | 408bdad | 2013-03-06 17:48:48 +0000 | [diff] [blame] | 441 | isInvariantLoad = true; |
| 442 | } |
Eli Friedman | 8b098b0 | 2011-06-15 23:59:25 +0000 | [diff] [blame] | 443 | |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 444 | const DataLayout &DL = BB->getModule()->getDataLayout(); |
| 445 | |
Bruno Cardoso Lopes | dfc1d96 | 2015-07-31 14:31:35 +0000 | [diff] [blame] | 446 | // Create a numbered basic block to lazily compute and cache instruction |
| 447 | // positions inside a BB. This is used to provide fast queries for relative |
| 448 | // position between two instructions in a BB and can be used by |
| 449 | // AliasAnalysis::callCapturesBefore. |
| 450 | OrderedBasicBlock OBB(BB); |
| 451 | |
Krzysztof Parzyszek | e261e5a | 2016-02-22 23:07:43 +0000 | [diff] [blame] | 452 | // Return "true" if and only if the instruction I is either a non-simple |
| 453 | // load or a non-simple store. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 454 | auto isNonSimpleLoadOrStore = [](Instruction *I) -> bool { |
Krzysztof Parzyszek | e261e5a | 2016-02-22 23:07:43 +0000 | [diff] [blame] | 455 | if (auto *LI = dyn_cast<LoadInst>(I)) |
| 456 | return !LI->isSimple(); |
| 457 | if (auto *SI = dyn_cast<StoreInst>(I)) |
| 458 | return !SI->isSimple(); |
| 459 | return false; |
| 460 | }; |
| 461 | |
| 462 | // Return "true" if I is not a load and not a store, but it does access |
| 463 | // memory. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 464 | auto isOtherMemAccess = [](Instruction *I) -> bool { |
Krzysztof Parzyszek | e261e5a | 2016-02-22 23:07:43 +0000 | [diff] [blame] | 465 | return !isa<LoadInst>(I) && !isa<StoreInst>(I) && I->mayReadOrWriteMemory(); |
| 466 | }; |
| 467 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 468 | // Walk backwards through the basic block, looking for dependencies. |
Philip Reames | 090a824 | 2015-02-15 19:07:31 +0000 | [diff] [blame] | 469 | while (ScanIt != BB->begin()) { |
Duncan P. N. Exon Smith | 5a82c91 | 2015-10-10 00:53:03 +0000 | [diff] [blame] | 470 | Instruction *Inst = &*--ScanIt; |
Yunzhong Gao | 5cbcf56 | 2013-11-14 01:10:52 +0000 | [diff] [blame] | 471 | |
| 472 | if (IntrinsicInst *II = dyn_cast<IntrinsicInst>(Inst)) |
| 473 | // Debug intrinsics don't (and can't) cause dependencies. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 474 | if (isa<DbgInfoIntrinsic>(II)) |
| 475 | continue; |
Yunzhong Gao | 5cbcf56 | 2013-11-14 01:10:52 +0000 | [diff] [blame] | 476 | |
Eli Friedman | 8b098b0 | 2011-06-15 23:59:25 +0000 | [diff] [blame] | 477 | // Limit the amount of scanning we do so we don't end up with quadratic |
| 478 | // running time on extreme testcases. |
| 479 | --Limit; |
| 480 | if (!Limit) |
| 481 | return MemDepResult::getUnknown(); |
| 482 | |
Chris Lattner | 506b858 | 2009-12-01 21:15:15 +0000 | [diff] [blame] | 483 | if (IntrinsicInst *II = dyn_cast<IntrinsicInst>(Inst)) { |
Owen Anderson | 2b2bd28 | 2009-10-28 07:05:35 +0000 | [diff] [blame] | 484 | // If we reach a lifetime begin or end marker, then the query ends here |
| 485 | // because the value is undefined. |
Chris Lattner | a58edd1 | 2010-09-06 03:58:04 +0000 | [diff] [blame] | 486 | if (II->getIntrinsicID() == Intrinsic::lifetime_start) { |
Owen Anderson | b9878ee | 2009-12-02 07:35:19 +0000 | [diff] [blame] | 487 | // FIXME: This only considers queries directly on the invariant-tagged |
| 488 | // pointer, not on query pointers that are indexed off of them. It'd |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 489 | // be nice to handle that at some point (the right approach is to use |
| 490 | // GetPointerBaseWithConstantOffset). |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 491 | if (AA.isMustAlias(MemoryLocation(II->getArgOperand(1)), MemLoc)) |
Owen Anderson | 2b2bd28 | 2009-10-28 07:05:35 +0000 | [diff] [blame] | 492 | return MemDepResult::getDef(II); |
Chris Lattner | a58edd1 | 2010-09-06 03:58:04 +0000 | [diff] [blame] | 493 | continue; |
Owen Anderson | d0e86d5 | 2009-10-28 06:18:42 +0000 | [diff] [blame] | 494 | } |
| 495 | } |
| 496 | |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 497 | // Values depend on loads if the pointers are must aliased. This means |
| 498 | // that a load depends on another must aliased load from the same value. |
| 499 | // One exception is atomic loads: a value can depend on an atomic load that |
| 500 | // it does not alias with when this atomic load indicates that another |
| 501 | // thread may be accessing the location. |
Chris Lattner | 0e3d633 | 2008-12-05 21:04:20 +0000 | [diff] [blame] | 502 | if (LoadInst *LI = dyn_cast<LoadInst>(Inst)) { |
Philip Reames | a7ad6a5 | 2015-01-26 18:54:27 +0000 | [diff] [blame] | 503 | |
| 504 | // While volatile access cannot be eliminated, they do not have to clobber |
| 505 | // non-aliasing locations, as normal accesses, for example, can be safely |
| 506 | // reordered with volatile accesses. |
| 507 | if (LI->isVolatile()) { |
| 508 | if (!QueryInst) |
| 509 | // Original QueryInst *may* be volatile |
| 510 | return MemDepResult::getClobber(LI); |
| 511 | if (isVolatile(QueryInst)) |
| 512 | // Ordering required if QueryInst is itself volatile |
| 513 | return MemDepResult::getClobber(LI); |
| 514 | // Otherwise, volatile doesn't imply any special ordering |
| 515 | } |
Krzysztof Parzyszek | e261e5a | 2016-02-22 23:07:43 +0000 | [diff] [blame] | 516 | |
Eli Friedman | 5494ada | 2011-08-15 20:54:19 +0000 | [diff] [blame] | 517 | // Atomic loads have complications involved. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 518 | // A Monotonic (or higher) load is OK if the query inst is itself not |
| 519 | // atomic. |
Eli Friedman | 5494ada | 2011-08-15 20:54:19 +0000 | [diff] [blame] | 520 | // FIXME: This is overly conservative. |
Philip Reames | a7ad6a5 | 2015-01-26 18:54:27 +0000 | [diff] [blame] | 521 | if (LI->isAtomic() && LI->getOrdering() > Unordered) { |
Krzysztof Parzyszek | e261e5a | 2016-02-22 23:07:43 +0000 | [diff] [blame] | 522 | if (!QueryInst || isNonSimpleLoadOrStore(QueryInst) || |
| 523 | isOtherMemAccess(QueryInst)) |
Robin Morisset | 9e98e7f | 2014-08-18 22:18:14 +0000 | [diff] [blame] | 524 | return MemDepResult::getClobber(LI); |
David Majnemer | e165502 | 2015-03-21 06:19:17 +0000 | [diff] [blame] | 525 | if (LI->getOrdering() != Monotonic) |
| 526 | return MemDepResult::getClobber(LI); |
Robin Morisset | 4ffe8aa | 2014-08-18 22:18:11 +0000 | [diff] [blame] | 527 | } |
Eli Friedman | 5494ada | 2011-08-15 20:54:19 +0000 | [diff] [blame] | 528 | |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 529 | MemoryLocation LoadLoc = MemoryLocation::get(LI); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 530 | |
Chris Lattner | 0e3d633 | 2008-12-05 21:04:20 +0000 | [diff] [blame] | 531 | // If we found a pointer, check if it could be the same as our pointer. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 532 | AliasResult R = AA.alias(LoadLoc, MemLoc); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 533 | |
Chris Lattner | 6f83d06 | 2011-04-26 01:21:15 +0000 | [diff] [blame] | 534 | if (isLoad) { |
Chandler Carruth | c3f49eb | 2015-06-22 02:16:51 +0000 | [diff] [blame] | 535 | if (R == NoAlias) { |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 536 | // If this is an over-aligned integer load (for example, |
| 537 | // "load i8* %P, align 4") see if it would obviously overlap with the |
| 538 | // queried location if widened to a larger load (e.g. if the queried |
| 539 | // location is 1 byte at P+1). If so, return it as a load/load |
| 540 | // clobber result, allowing the client to decide to widen the load if |
| 541 | // it wants to. |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 542 | if (IntegerType *ITy = dyn_cast<IntegerType>(LI->getType())) { |
| 543 | if (LI->getAlignment() * 8 > ITy->getPrimitiveSizeInBits() && |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 544 | isLoadLoadClobberIfExtendedToFullWidth(MemLoc, MemLocBase, |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 545 | MemLocOffset, LI)) |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 546 | return MemDepResult::getClobber(Inst); |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 547 | } |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 548 | continue; |
| 549 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 550 | |
Chris Lattner | 6f83d06 | 2011-04-26 01:21:15 +0000 | [diff] [blame] | 551 | // Must aliased loads are defs of each other. |
Chandler Carruth | c3f49eb | 2015-06-22 02:16:51 +0000 | [diff] [blame] | 552 | if (R == MustAlias) |
Chris Lattner | 6f83d06 | 2011-04-26 01:21:15 +0000 | [diff] [blame] | 553 | return MemDepResult::getDef(Inst); |
| 554 | |
Dan Gohman | a471751 | 2011-06-04 06:48:50 +0000 | [diff] [blame] | 555 | #if 0 // FIXME: Temporarily disabled. GVN is cleverly rewriting loads |
| 556 | // in terms of clobbering loads, but since it does this by looking |
| 557 | // at the clobbering load directly, it doesn't know about any |
| 558 | // phi translation that may have happened along the way. |
| 559 | |
Chris Lattner | 6f83d06 | 2011-04-26 01:21:15 +0000 | [diff] [blame] | 560 | // If we have a partial alias, then return this as a clobber for the |
| 561 | // client to handle. |
Chandler Carruth | c3f49eb | 2015-06-22 02:16:51 +0000 | [diff] [blame] | 562 | if (R == PartialAlias) |
Chris Lattner | 6f83d06 | 2011-04-26 01:21:15 +0000 | [diff] [blame] | 563 | return MemDepResult::getClobber(Inst); |
Dan Gohman | a471751 | 2011-06-04 06:48:50 +0000 | [diff] [blame] | 564 | #endif |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 565 | |
Chris Lattner | 6f83d06 | 2011-04-26 01:21:15 +0000 | [diff] [blame] | 566 | // Random may-alias loads don't depend on each other without a |
| 567 | // dependence. |
Chris Lattner | 80c0818 | 2008-11-29 09:09:48 +0000 | [diff] [blame] | 568 | continue; |
Chris Lattner | 6f83d06 | 2011-04-26 01:21:15 +0000 | [diff] [blame] | 569 | } |
Dan Gohman | 15a4396 | 2010-10-29 01:14:04 +0000 | [diff] [blame] | 570 | |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 571 | // Stores don't depend on other no-aliased accesses. |
Chandler Carruth | c3f49eb | 2015-06-22 02:16:51 +0000 | [diff] [blame] | 572 | if (R == NoAlias) |
Chris Lattner | 7aab279 | 2011-04-26 22:42:01 +0000 | [diff] [blame] | 573 | continue; |
| 574 | |
Dan Gohman | 15a4396 | 2010-10-29 01:14:04 +0000 | [diff] [blame] | 575 | // Stores don't alias loads from read-only memory. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 576 | if (AA.pointsToConstantMemory(LoadLoc)) |
Dan Gohman | 15a4396 | 2010-10-29 01:14:04 +0000 | [diff] [blame] | 577 | continue; |
| 578 | |
Chris Lattner | 6f83d06 | 2011-04-26 01:21:15 +0000 | [diff] [blame] | 579 | // Stores depend on may/must aliased loads. |
Chris Lattner | 0e3d633 | 2008-12-05 21:04:20 +0000 | [diff] [blame] | 580 | return MemDepResult::getDef(Inst); |
| 581 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 582 | |
Chris Lattner | 0e3d633 | 2008-12-05 21:04:20 +0000 | [diff] [blame] | 583 | if (StoreInst *SI = dyn_cast<StoreInst>(Inst)) { |
Eli Friedman | 5494ada | 2011-08-15 20:54:19 +0000 | [diff] [blame] | 584 | // Atomic stores have complications involved. |
Robin Morisset | 163ef04 | 2014-08-29 20:32:58 +0000 | [diff] [blame] | 585 | // A Monotonic store is OK if the query inst is itself not atomic. |
Eli Friedman | 5494ada | 2011-08-15 20:54:19 +0000 | [diff] [blame] | 586 | // FIXME: This is overly conservative. |
Krzysztof Parzyszek | e261e5a | 2016-02-22 23:07:43 +0000 | [diff] [blame] | 587 | if (!SI->isUnordered() && SI->isAtomic()) { |
| 588 | if (!QueryInst || isNonSimpleLoadOrStore(QueryInst) || |
| 589 | isOtherMemAccess(QueryInst)) |
Robin Morisset | 9e98e7f | 2014-08-18 22:18:14 +0000 | [diff] [blame] | 590 | return MemDepResult::getClobber(SI); |
David Majnemer | e165502 | 2015-03-21 06:19:17 +0000 | [diff] [blame] | 591 | if (SI->getOrdering() != Monotonic) |
| 592 | return MemDepResult::getClobber(SI); |
Robin Morisset | 4ffe8aa | 2014-08-18 22:18:11 +0000 | [diff] [blame] | 593 | } |
Eli Friedman | 5494ada | 2011-08-15 20:54:19 +0000 | [diff] [blame] | 594 | |
Robin Morisset | 9e98e7f | 2014-08-18 22:18:14 +0000 | [diff] [blame] | 595 | // FIXME: this is overly conservative. |
| 596 | // While volatile access cannot be eliminated, they do not have to clobber |
| 597 | // non-aliasing locations, as normal accesses can for example be reordered |
| 598 | // with volatile accesses. |
| 599 | if (SI->isVolatile()) |
Krzysztof Parzyszek | e261e5a | 2016-02-22 23:07:43 +0000 | [diff] [blame] | 600 | if (!QueryInst || isNonSimpleLoadOrStore(QueryInst) || |
| 601 | isOtherMemAccess(QueryInst)) |
| 602 | return MemDepResult::getClobber(SI); |
Robin Morisset | 9e98e7f | 2014-08-18 22:18:14 +0000 | [diff] [blame] | 603 | |
Chris Lattner | 02274a7 | 2009-05-25 21:28:56 +0000 | [diff] [blame] | 604 | // If alias analysis can tell that this store is guaranteed to not modify |
| 605 | // the query pointer, ignore it. Use getModRefInfo to handle cases where |
| 606 | // the query pointer points to constant memory etc. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 607 | if (AA.getModRefInfo(SI, MemLoc) == MRI_NoModRef) |
Chris Lattner | 02274a7 | 2009-05-25 21:28:56 +0000 | [diff] [blame] | 608 | continue; |
| 609 | |
| 610 | // Ok, this store might clobber the query pointer. Check to see if it is |
| 611 | // a must alias: in this case, we want to return this as a def. |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 612 | MemoryLocation StoreLoc = MemoryLocation::get(SI); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 613 | |
Chris Lattner | 0e3d633 | 2008-12-05 21:04:20 +0000 | [diff] [blame] | 614 | // If we found a pointer, check if it could be the same as our pointer. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 615 | AliasResult R = AA.alias(StoreLoc, MemLoc); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 616 | |
Chandler Carruth | c3f49eb | 2015-06-22 02:16:51 +0000 | [diff] [blame] | 617 | if (R == NoAlias) |
Chris Lattner | 0e3d633 | 2008-12-05 21:04:20 +0000 | [diff] [blame] | 618 | continue; |
Chandler Carruth | c3f49eb | 2015-06-22 02:16:51 +0000 | [diff] [blame] | 619 | if (R == MustAlias) |
Dan Gohman | ba5d0ab | 2010-12-13 22:47:57 +0000 | [diff] [blame] | 620 | return MemDepResult::getDef(Inst); |
Shuxin Yang | 408bdad | 2013-03-06 17:48:48 +0000 | [diff] [blame] | 621 | if (isInvariantLoad) |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 622 | continue; |
Dan Gohman | ba5d0ab | 2010-12-13 22:47:57 +0000 | [diff] [blame] | 623 | return MemDepResult::getClobber(Inst); |
Owen Anderson | c0daf5f | 2007-07-06 23:14:35 +0000 | [diff] [blame] | 624 | } |
Chris Lattner | 3ff6d01 | 2008-11-30 01:39:32 +0000 | [diff] [blame] | 625 | |
| 626 | // If this is an allocation, and if we know that the accessed pointer is to |
Chris Lattner | 0e3d633 | 2008-12-05 21:04:20 +0000 | [diff] [blame] | 627 | // the allocation, return Def. This means that there is no dependence and |
Chris Lattner | 3ff6d01 | 2008-11-30 01:39:32 +0000 | [diff] [blame] | 628 | // the access can be optimized based on that. For example, a load could |
Philip Reames | d9f4a3d | 2016-03-09 23:19:56 +0000 | [diff] [blame] | 629 | // turn into undef. Note that we can bypass the allocation itself when |
| 630 | // looking for a clobber in many cases; that's an alias property and is |
| 631 | // handled by BasicAA. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 632 | if (isa<AllocaInst>(Inst) || isNoAliasFn(Inst, &TLI)) { |
Rafael Espindola | 7c68beb | 2014-02-18 15:33:12 +0000 | [diff] [blame] | 633 | const Value *AccessPtr = GetUnderlyingObject(MemLoc.Ptr, DL); |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 634 | if (AccessPtr == Inst || AA.isMustAlias(Inst, AccessPtr)) |
Victor Hernandez | 537d8d9 | 2009-09-18 21:34:51 +0000 | [diff] [blame] | 635 | return MemDepResult::getDef(Inst); |
Victor Hernandez | 537d8d9 | 2009-09-18 21:34:51 +0000 | [diff] [blame] | 636 | } |
| 637 | |
Philip Reames | 4dbd88f | 2015-03-24 23:54:54 +0000 | [diff] [blame] | 638 | if (isInvariantLoad) |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 639 | continue; |
Philip Reames | 4dbd88f | 2015-03-24 23:54:54 +0000 | [diff] [blame] | 640 | |
Philip Reames | b568113 | 2016-03-25 22:40:35 +0000 | [diff] [blame^] | 641 | // A release fence requires that all stores complete before it, but does |
| 642 | // not prevent the reordering of following loads or stores 'before' the |
| 643 | // fence. As a result, we look past it when finding a dependency for |
| 644 | // loads. DSE uses this to find preceeding stores to delete and thus we |
| 645 | // can't bypass the fence if the query instruction is a store. |
| 646 | if (FenceInst *FI = dyn_cast<FenceInst>(Inst)) |
| 647 | if (isLoad && FI->getOrdering() == Release) |
| 648 | continue; |
| 649 | |
Chris Lattner | 0e3d633 | 2008-12-05 21:04:20 +0000 | [diff] [blame] | 650 | // See if this instruction (e.g. a call or vaarg) mod/ref's the pointer. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 651 | ModRefInfo MR = AA.getModRefInfo(Inst, MemLoc); |
Chad Rosier | a968caf | 2012-05-14 20:35:04 +0000 | [diff] [blame] | 652 | // If necessary, perform additional analysis. |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 653 | if (MR == MRI_ModRef) |
Chandler Carruth | aef32bd | 2016-03-11 13:46:00 +0000 | [diff] [blame] | 654 | MR = AA.callCapturesBefore(Inst, MemLoc, &DT, &OBB); |
Chad Rosier | a968caf | 2012-05-14 20:35:04 +0000 | [diff] [blame] | 655 | switch (MR) { |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 656 | case MRI_NoModRef: |
Chris Lattner | 41efb68 | 2008-12-09 19:47:40 +0000 | [diff] [blame] | 657 | // If the call has no effect on the queried pointer, just ignore it. |
Chris Lattner | 81f19e9 | 2008-11-29 08:51:16 +0000 | [diff] [blame] | 658 | continue; |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 659 | case MRI_Mod: |
Owen Anderson | fc16e5a | 2009-10-28 06:30:52 +0000 | [diff] [blame] | 660 | return MemDepResult::getClobber(Inst); |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 661 | case MRI_Ref: |
Chris Lattner | 41efb68 | 2008-12-09 19:47:40 +0000 | [diff] [blame] | 662 | // If the call is known to never store to the pointer, and if this is a |
| 663 | // load query, we can safely ignore it (scan past it). |
| 664 | if (isLoad) |
| 665 | continue; |
Chris Lattner | 41efb68 | 2008-12-09 19:47:40 +0000 | [diff] [blame] | 666 | default: |
| 667 | // Otherwise, there is a potential dependence. Return a clobber. |
| 668 | return MemDepResult::getClobber(Inst); |
| 669 | } |
Owen Anderson | c0daf5f | 2007-07-06 23:14:35 +0000 | [diff] [blame] | 670 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 671 | |
Eli Friedman | 7d58bc7 | 2011-06-15 00:47:34 +0000 | [diff] [blame] | 672 | // No dependence found. If this is the entry block of the function, it is |
| 673 | // unknown, otherwise it is non-local. |
Chris Lattner | 2faa2c7 | 2008-12-07 02:15:47 +0000 | [diff] [blame] | 674 | if (BB != &BB->getParent()->getEntryBlock()) |
| 675 | return MemDepResult::getNonLocal(); |
Eli Friedman | c1702c8 | 2011-10-13 22:14:57 +0000 | [diff] [blame] | 676 | return MemDepResult::getNonFuncLocal(); |
Owen Anderson | c0daf5f | 2007-07-06 23:14:35 +0000 | [diff] [blame] | 677 | } |
| 678 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 679 | MemDepResult MemoryDependenceResults::getDependency(Instruction *QueryInst) { |
Chris Lattner | 51ba8d0 | 2008-11-29 03:47:00 +0000 | [diff] [blame] | 680 | Instruction *ScanPos = QueryInst; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 681 | |
Chris Lattner | 51ba8d0 | 2008-11-29 03:47:00 +0000 | [diff] [blame] | 682 | // Check for a cached result |
Chris Lattner | 47e81d0 | 2008-11-30 23:17:19 +0000 | [diff] [blame] | 683 | MemDepResult &LocalCache = LocalDeps[QueryInst]; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 684 | |
Chris Lattner | e7d7e13 | 2008-11-29 22:02:15 +0000 | [diff] [blame] | 685 | // If the cached entry is non-dirty, just return it. Note that this depends |
Chris Lattner | 47e81d0 | 2008-11-30 23:17:19 +0000 | [diff] [blame] | 686 | // on MemDepResult's default constructing to 'dirty'. |
| 687 | if (!LocalCache.isDirty()) |
| 688 | return LocalCache; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 689 | |
Chris Lattner | 51ba8d0 | 2008-11-29 03:47:00 +0000 | [diff] [blame] | 690 | // Otherwise, if we have a dirty entry, we know we can start the scan at that |
| 691 | // instruction, which may save us some work. |
Chris Lattner | 47e81d0 | 2008-11-30 23:17:19 +0000 | [diff] [blame] | 692 | if (Instruction *Inst = LocalCache.getInst()) { |
Chris Lattner | 51ba8d0 | 2008-11-29 03:47:00 +0000 | [diff] [blame] | 693 | ScanPos = Inst; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 694 | |
Chris Lattner | de4440c | 2008-12-07 18:39:13 +0000 | [diff] [blame] | 695 | RemoveFromReverseMap(ReverseLocalDeps, Inst, QueryInst); |
Chris Lattner | 4410427 | 2008-11-30 02:52:26 +0000 | [diff] [blame] | 696 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 697 | |
Chris Lattner | 5a78604 | 2008-12-07 01:50:16 +0000 | [diff] [blame] | 698 | BasicBlock *QueryParent = QueryInst->getParent(); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 699 | |
Chris Lattner | 51ba8d0 | 2008-11-29 03:47:00 +0000 | [diff] [blame] | 700 | // Do the scan. |
Chris Lattner | 5a78604 | 2008-12-07 01:50:16 +0000 | [diff] [blame] | 701 | if (BasicBlock::iterator(QueryInst) == QueryParent->begin()) { |
Eli Friedman | 7d58bc7 | 2011-06-15 00:47:34 +0000 | [diff] [blame] | 702 | // No dependence found. If this is the entry block of the function, it is |
| 703 | // unknown, otherwise it is non-local. |
Chris Lattner | 2faa2c7 | 2008-12-07 02:15:47 +0000 | [diff] [blame] | 704 | if (QueryParent != &QueryParent->getParent()->getEntryBlock()) |
| 705 | LocalCache = MemDepResult::getNonLocal(); |
| 706 | else |
Eli Friedman | c1702c8 | 2011-10-13 22:14:57 +0000 | [diff] [blame] | 707 | LocalCache = MemDepResult::getNonFuncLocal(); |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 708 | } else { |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 709 | MemoryLocation MemLoc; |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 710 | ModRefInfo MR = GetLocation(QueryInst, MemLoc, TLI); |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 711 | if (MemLoc.Ptr) { |
| 712 | // If we can do a pointer scan, make it happen. |
Chandler Carruth | 194f59c | 2015-07-22 23:15:57 +0000 | [diff] [blame] | 713 | bool isLoad = !(MR & MRI_Mod); |
Chris Lattner | d540a5d | 2010-11-30 01:56:13 +0000 | [diff] [blame] | 714 | if (IntrinsicInst *II = dyn_cast<IntrinsicInst>(QueryInst)) |
Owen Anderson | 97f0cf3 | 2011-05-17 00:05:49 +0000 | [diff] [blame] | 715 | isLoad |= II->getIntrinsicID() == Intrinsic::lifetime_start; |
Chris Lattner | e48c31c | 2010-11-21 07:34:32 +0000 | [diff] [blame] | 716 | |
Duncan P. N. Exon Smith | 5a82c91 | 2015-10-10 00:53:03 +0000 | [diff] [blame] | 717 | LocalCache = getPointerDependencyFrom( |
| 718 | MemLoc, isLoad, ScanPos->getIterator(), QueryParent, QueryInst); |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 719 | } else if (isa<CallInst>(QueryInst) || isa<InvokeInst>(QueryInst)) { |
Gabor Greif | ef1ca24 | 2010-07-27 22:02:00 +0000 | [diff] [blame] | 720 | CallSite QueryCS(QueryInst); |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 721 | bool isReadOnly = AA.onlyReadsMemory(QueryCS); |
Duncan P. N. Exon Smith | 5a82c91 | 2015-10-10 00:53:03 +0000 | [diff] [blame] | 722 | LocalCache = getCallSiteDependencyFrom( |
| 723 | QueryCS, isReadOnly, ScanPos->getIterator(), QueryParent); |
Dan Gohman | 1d760ce | 2010-11-10 21:51:35 +0000 | [diff] [blame] | 724 | } else |
| 725 | // Non-memory instruction. |
Eli Friedman | 7d58bc7 | 2011-06-15 00:47:34 +0000 | [diff] [blame] | 726 | LocalCache = MemDepResult::getUnknown(); |
Nick Lewycky | 218a339 | 2009-11-28 21:27:49 +0000 | [diff] [blame] | 727 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 728 | |
Chris Lattner | 51ba8d0 | 2008-11-29 03:47:00 +0000 | [diff] [blame] | 729 | // Remember the result! |
Chris Lattner | 47e81d0 | 2008-11-30 23:17:19 +0000 | [diff] [blame] | 730 | if (Instruction *I = LocalCache.getInst()) |
Chris Lattner | 9f1988ab | 2008-11-29 09:20:15 +0000 | [diff] [blame] | 731 | ReverseLocalDeps[I].insert(QueryInst); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 732 | |
Chris Lattner | 47e81d0 | 2008-11-30 23:17:19 +0000 | [diff] [blame] | 733 | return LocalCache; |
Chris Lattner | 51ba8d0 | 2008-11-29 03:47:00 +0000 | [diff] [blame] | 734 | } |
| 735 | |
Chris Lattner | f09619d | 2009-01-22 07:04:01 +0000 | [diff] [blame] | 736 | #ifndef NDEBUG |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 737 | /// This method is used when -debug is specified to verify that cache arrays |
| 738 | /// are properly kept sorted. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 739 | static void AssertSorted(MemoryDependenceResults::NonLocalDepInfo &Cache, |
Chris Lattner | f09619d | 2009-01-22 07:04:01 +0000 | [diff] [blame] | 740 | int Count = -1) { |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 741 | if (Count == -1) |
| 742 | Count = Cache.size(); |
Craig Topper | e30b8ca | 2016-01-03 19:43:40 +0000 | [diff] [blame] | 743 | assert(std::is_sorted(Cache.begin(), Cache.begin() + Count) && |
| 744 | "Cache isn't sorted!"); |
Chris Lattner | f09619d | 2009-01-22 07:04:01 +0000 | [diff] [blame] | 745 | } |
| 746 | #endif |
| 747 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 748 | const MemoryDependenceResults::NonLocalDepInfo & |
| 749 | MemoryDependenceResults::getNonLocalCallDependency(CallSite QueryCS) { |
Chris Lattner | 254314e | 2008-12-09 19:38:05 +0000 | [diff] [blame] | 750 | assert(getDependency(QueryCS.getInstruction()).isNonLocal() && |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 751 | "getNonLocalCallDependency should only be used on calls with " |
| 752 | "non-local deps!"); |
Chris Lattner | 254314e | 2008-12-09 19:38:05 +0000 | [diff] [blame] | 753 | PerInstNLInfo &CacheP = NonLocalDeps[QueryCS.getInstruction()]; |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 754 | NonLocalDepInfo &Cache = CacheP.first; |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 755 | |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 756 | // This is the set of blocks that need to be recomputed. In the cached case, |
| 757 | // this can happen due to instructions being deleted etc. In the uncached |
| 758 | // case, this starts out as the set of predecessors we care about. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 759 | SmallVector<BasicBlock *, 32> DirtyBlocks; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 760 | |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 761 | if (!Cache.empty()) { |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 762 | // Okay, we have a cache entry. If we know it is not dirty, just return it |
| 763 | // with no computation. |
| 764 | if (!CacheP.second) { |
Dan Gohman | d2d1ae1 | 2010-06-22 15:08:57 +0000 | [diff] [blame] | 765 | ++NumCacheNonLocal; |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 766 | return Cache; |
| 767 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 768 | |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 769 | // If we already have a partially computed set of results, scan them to |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 770 | // determine what is dirty, seeding our initial DirtyBlocks worklist. |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 771 | for (auto &Entry : Cache) |
| 772 | if (Entry.getResult().isDirty()) |
| 773 | DirtyBlocks.push_back(Entry.getBB()); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 774 | |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 775 | // Sort the cache so that we can do fast binary search lookups below. |
| 776 | std::sort(Cache.begin(), Cache.end()); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 777 | |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 778 | ++NumCacheDirtyNonLocal; |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 779 | // cerr << "CACHED CASE: " << DirtyBlocks.size() << " dirty: " |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 780 | // << Cache.size() << " cached: " << *QueryInst; |
| 781 | } else { |
| 782 | // Seed DirtyBlocks with each of the preds of QueryInst's block. |
Chris Lattner | 254314e | 2008-12-09 19:38:05 +0000 | [diff] [blame] | 783 | BasicBlock *QueryBB = QueryCS.getInstruction()->getParent(); |
Daniel Berlin | b4e7a4a | 2015-04-21 21:11:50 +0000 | [diff] [blame] | 784 | for (BasicBlock *Pred : PredCache.get(QueryBB)) |
| 785 | DirtyBlocks.push_back(Pred); |
Dan Gohman | d2d1ae1 | 2010-06-22 15:08:57 +0000 | [diff] [blame] | 786 | ++NumUncacheNonLocal; |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 787 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 788 | |
Chris Lattner | 702e46e | 2008-12-09 21:19:42 +0000 | [diff] [blame] | 789 | // isReadonlyCall - If this is a read-only call, we can be more aggressive. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 790 | bool isReadonlyCall = AA.onlyReadsMemory(QueryCS); |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 791 | |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 792 | SmallPtrSet<BasicBlock *, 32> Visited; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 793 | |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 794 | unsigned NumSortedEntries = Cache.size(); |
Chris Lattner | f09619d | 2009-01-22 07:04:01 +0000 | [diff] [blame] | 795 | DEBUG(AssertSorted(Cache)); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 796 | |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 797 | // Iterate while we still have blocks to update. |
| 798 | while (!DirtyBlocks.empty()) { |
| 799 | BasicBlock *DirtyBB = DirtyBlocks.back(); |
| 800 | DirtyBlocks.pop_back(); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 801 | |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 802 | // Already processed this block? |
David Blaikie | 70573dc | 2014-11-19 07:49:26 +0000 | [diff] [blame] | 803 | if (!Visited.insert(DirtyBB).second) |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 804 | continue; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 805 | |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 806 | // Do a binary search to see if we already have an entry for this block in |
| 807 | // the cache set. If so, find it. |
Chris Lattner | f09619d | 2009-01-22 07:04:01 +0000 | [diff] [blame] | 808 | DEBUG(AssertSorted(Cache, NumSortedEntries)); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 809 | NonLocalDepInfo::iterator Entry = |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 810 | std::upper_bound(Cache.begin(), Cache.begin() + NumSortedEntries, |
| 811 | NonLocalDepEntry(DirtyBB)); |
Benjamin Kramer | b6d0bd4 | 2014-03-02 12:27:27 +0000 | [diff] [blame] | 812 | if (Entry != Cache.begin() && std::prev(Entry)->getBB() == DirtyBB) |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 813 | --Entry; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 814 | |
Craig Topper | 9f00886 | 2014-04-15 04:59:12 +0000 | [diff] [blame] | 815 | NonLocalDepEntry *ExistingResult = nullptr; |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 816 | if (Entry != Cache.begin() + NumSortedEntries && |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 817 | Entry->getBB() == DirtyBB) { |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 818 | // If we already have an entry, and if it isn't already dirty, the block |
| 819 | // is done. |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 820 | if (!Entry->getResult().isDirty()) |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 821 | continue; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 822 | |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 823 | // Otherwise, remember this slot so we can update the value. |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 824 | ExistingResult = &*Entry; |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 825 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 826 | |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 827 | // If the dirty entry has a pointer, start scanning from it so we don't have |
| 828 | // to rescan the entire block. |
| 829 | BasicBlock::iterator ScanPos = DirtyBB->end(); |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 830 | if (ExistingResult) { |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 831 | if (Instruction *Inst = ExistingResult->getResult().getInst()) { |
Duncan P. N. Exon Smith | 5a82c91 | 2015-10-10 00:53:03 +0000 | [diff] [blame] | 832 | ScanPos = Inst->getIterator(); |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 833 | // We're removing QueryInst's use of Inst. |
Chris Lattner | 254314e | 2008-12-09 19:38:05 +0000 | [diff] [blame] | 834 | RemoveFromReverseMap(ReverseNonLocalDeps, Inst, |
| 835 | QueryCS.getInstruction()); |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 836 | } |
Chris Lattner | 1b810bd | 2008-11-30 02:28:25 +0000 | [diff] [blame] | 837 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 838 | |
Chris Lattner | 60444f8 | 2008-11-30 01:26:32 +0000 | [diff] [blame] | 839 | // Find out if this block has a local dependency for QueryInst. |
Chris Lattner | ed494f7 | 2008-12-07 01:21:14 +0000 | [diff] [blame] | 840 | MemDepResult Dep; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 841 | |
Chris Lattner | 254314e | 2008-12-09 19:38:05 +0000 | [diff] [blame] | 842 | if (ScanPos != DirtyBB->begin()) { |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 843 | Dep = |
| 844 | getCallSiteDependencyFrom(QueryCS, isReadonlyCall, ScanPos, DirtyBB); |
Chris Lattner | 254314e | 2008-12-09 19:38:05 +0000 | [diff] [blame] | 845 | } else if (DirtyBB != &DirtyBB->getParent()->getEntryBlock()) { |
| 846 | // No dependence found. If this is the entry block of the function, it is |
Eli Friedman | 7d58bc7 | 2011-06-15 00:47:34 +0000 | [diff] [blame] | 847 | // a clobber, otherwise it is unknown. |
Chris Lattner | 254314e | 2008-12-09 19:38:05 +0000 | [diff] [blame] | 848 | Dep = MemDepResult::getNonLocal(); |
Chris Lattner | 5a78604 | 2008-12-07 01:50:16 +0000 | [diff] [blame] | 849 | } else { |
Eli Friedman | c1702c8 | 2011-10-13 22:14:57 +0000 | [diff] [blame] | 850 | Dep = MemDepResult::getNonFuncLocal(); |
Chris Lattner | 5a78604 | 2008-12-07 01:50:16 +0000 | [diff] [blame] | 851 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 852 | |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 853 | // If we had a dirty entry for the block, update it. Otherwise, just add |
| 854 | // a new entry. |
| 855 | if (ExistingResult) |
Chris Lattner | 9b7d99e | 2009-12-22 04:25:02 +0000 | [diff] [blame] | 856 | ExistingResult->setResult(Dep); |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 857 | else |
Chris Lattner | 9b7d99e | 2009-12-22 04:25:02 +0000 | [diff] [blame] | 858 | Cache.push_back(NonLocalDepEntry(DirtyBB, Dep)); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 859 | |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 860 | // If the block has a dependency (i.e. it isn't completely transparent to |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 861 | // the value), remember the association! |
| 862 | if (!Dep.isNonLocal()) { |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 863 | // Keep the ReverseNonLocalDeps map up to date so we can efficiently |
| 864 | // update this when we remove instructions. |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 865 | if (Instruction *Inst = Dep.getInst()) |
Chris Lattner | 254314e | 2008-12-09 19:38:05 +0000 | [diff] [blame] | 866 | ReverseNonLocalDeps[Inst].insert(QueryCS.getInstruction()); |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 867 | } else { |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 868 | |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 869 | // If the block *is* completely transparent to the load, we need to check |
| 870 | // the predecessors of this block. Add them to our worklist. |
Daniel Berlin | b4e7a4a | 2015-04-21 21:11:50 +0000 | [diff] [blame] | 871 | for (BasicBlock *Pred : PredCache.get(DirtyBB)) |
| 872 | DirtyBlocks.push_back(Pred); |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 873 | } |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 874 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 875 | |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 876 | return Cache; |
Chris Lattner | 2059753 | 2008-11-30 01:18:27 +0000 | [diff] [blame] | 877 | } |
| 878 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 879 | void MemoryDependenceResults::getNonLocalPointerDependency( |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 880 | Instruction *QueryInst, SmallVectorImpl<NonLocalDepResult> &Result) { |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 881 | const MemoryLocation Loc = MemoryLocation::get(QueryInst); |
Philip Reames | 567feb9 | 2015-01-09 00:04:22 +0000 | [diff] [blame] | 882 | bool isLoad = isa<LoadInst>(QueryInst); |
| 883 | BasicBlock *FromBB = QueryInst->getParent(); |
| 884 | assert(FromBB); |
Philip Reames | 33d7f9d | 2015-01-09 00:26:45 +0000 | [diff] [blame] | 885 | |
| 886 | assert(Loc.Ptr->getType()->isPointerTy() && |
| 887 | "Can't get pointer deps of a non-pointer!"); |
| 888 | Result.clear(); |
Krzysztof Parzyszek | e261e5a | 2016-02-22 23:07:43 +0000 | [diff] [blame] | 889 | |
Philip Reames | 33d7f9d | 2015-01-09 00:26:45 +0000 | [diff] [blame] | 890 | // This routine does not expect to deal with volatile instructions. |
| 891 | // Doing so would require piping through the QueryInst all the way through. |
Philip Reames | 567feb9 | 2015-01-09 00:04:22 +0000 | [diff] [blame] | 892 | // TODO: volatiles can't be elided, but they can be reordered with other |
Philip Reames | 33d7f9d | 2015-01-09 00:26:45 +0000 | [diff] [blame] | 893 | // non-volatile accesses. |
Philip Reames | a7ad6a5 | 2015-01-26 18:54:27 +0000 | [diff] [blame] | 894 | |
Philip Reames | 567feb9 | 2015-01-09 00:04:22 +0000 | [diff] [blame] | 895 | // We currently give up on any instruction which is ordered, but we do handle |
| 896 | // atomic instructions which are unordered. |
| 897 | // TODO: Handle ordered instructions |
| 898 | auto isOrdered = [](Instruction *Inst) { |
| 899 | if (LoadInst *LI = dyn_cast<LoadInst>(Inst)) { |
| 900 | return !LI->isUnordered(); |
| 901 | } else if (StoreInst *SI = dyn_cast<StoreInst>(Inst)) { |
| 902 | return !SI->isUnordered(); |
| 903 | } |
| 904 | return false; |
| 905 | }; |
Philip Reames | 33d7f9d | 2015-01-09 00:26:45 +0000 | [diff] [blame] | 906 | if (isVolatile(QueryInst) || isOrdered(QueryInst)) { |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 907 | Result.push_back(NonLocalDepResult(FromBB, MemDepResult::getUnknown(), |
Philip Reames | 33d7f9d | 2015-01-09 00:26:45 +0000 | [diff] [blame] | 908 | const_cast<Value *>(Loc.Ptr))); |
| 909 | return; |
| 910 | } |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 911 | const DataLayout &DL = FromBB->getModule()->getDataLayout(); |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 912 | PHITransAddr Address(const_cast<Value *>(Loc.Ptr), DL, &AC); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 913 | |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 914 | // This is the set of blocks we've inspected, and the pointer we consider in |
| 915 | // each block. Because of critical edges, we currently bail out if querying |
| 916 | // a block with multiple different pointers. This can happen during PHI |
| 917 | // translation. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 918 | DenseMap<BasicBlock *, Value *> Visited; |
Chandler Carruth | b32febe | 2016-03-07 12:45:07 +0000 | [diff] [blame] | 919 | if (getNonLocalPointerDepFromBB(QueryInst, Address, Loc, isLoad, FromBB, |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 920 | Result, Visited, true)) |
| 921 | return; |
Chris Lattner | 7ed5ccc | 2008-12-15 04:58:29 +0000 | [diff] [blame] | 922 | Result.clear(); |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 923 | Result.push_back(NonLocalDepResult(FromBB, MemDepResult::getUnknown(), |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 924 | const_cast<Value *>(Loc.Ptr))); |
Chris Lattner | 7564a3b | 2008-12-07 02:56:57 +0000 | [diff] [blame] | 925 | } |
| 926 | |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 927 | /// Compute the memdep value for BB with Pointer/PointeeSize using either |
| 928 | /// cached information in Cache or by doing a lookup (which may use dirty cache |
| 929 | /// info if available). |
| 930 | /// |
| 931 | /// If we do a lookup, add the result to the cache. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 932 | MemDepResult MemoryDependenceResults::GetNonLocalInfoForBlock( |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 933 | Instruction *QueryInst, const MemoryLocation &Loc, bool isLoad, |
| 934 | BasicBlock *BB, NonLocalDepInfo *Cache, unsigned NumSortedEntries) { |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 935 | |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 936 | // Do a binary search to see if we already have an entry for this block in |
| 937 | // the cache set. If so, find it. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 938 | NonLocalDepInfo::iterator Entry = std::upper_bound( |
| 939 | Cache->begin(), Cache->begin() + NumSortedEntries, NonLocalDepEntry(BB)); |
| 940 | if (Entry != Cache->begin() && (Entry - 1)->getBB() == BB) |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 941 | --Entry; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 942 | |
Craig Topper | 9f00886 | 2014-04-15 04:59:12 +0000 | [diff] [blame] | 943 | NonLocalDepEntry *ExistingResult = nullptr; |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 944 | if (Entry != Cache->begin() + NumSortedEntries && Entry->getBB() == BB) |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 945 | ExistingResult = &*Entry; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 946 | |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 947 | // If we have a cached entry, and it is non-dirty, use it as the value for |
| 948 | // this dependency. |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 949 | if (ExistingResult && !ExistingResult->getResult().isDirty()) { |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 950 | ++NumCacheNonLocalPtr; |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 951 | return ExistingResult->getResult(); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 952 | } |
| 953 | |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 954 | // Otherwise, we have to scan for the value. If we have a dirty cache |
| 955 | // entry, start scanning from its position, otherwise we scan from the end |
| 956 | // of the block. |
| 957 | BasicBlock::iterator ScanPos = BB->end(); |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 958 | if (ExistingResult && ExistingResult->getResult().getInst()) { |
| 959 | assert(ExistingResult->getResult().getInst()->getParent() == BB && |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 960 | "Instruction invalidated?"); |
| 961 | ++NumCacheDirtyNonLocalPtr; |
Duncan P. N. Exon Smith | 5a82c91 | 2015-10-10 00:53:03 +0000 | [diff] [blame] | 962 | ScanPos = ExistingResult->getResult().getInst()->getIterator(); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 963 | |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 964 | // Eliminating the dirty entry from 'Cache', so update the reverse info. |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 965 | ValueIsLoadPair CacheKey(Loc.Ptr, isLoad); |
Duncan P. N. Exon Smith | 5a82c91 | 2015-10-10 00:53:03 +0000 | [diff] [blame] | 966 | RemoveFromReverseMap(ReverseNonLocalPtrDeps, &*ScanPos, CacheKey); |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 967 | } else { |
| 968 | ++NumUncacheNonLocalPtr; |
| 969 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 970 | |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 971 | // Scan the block for the dependency. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 972 | MemDepResult Dep = |
| 973 | getPointerDependencyFrom(Loc, isLoad, ScanPos, BB, QueryInst); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 974 | |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 975 | // If we had a dirty entry for the block, update it. Otherwise, just add |
| 976 | // a new entry. |
| 977 | if (ExistingResult) |
Chris Lattner | 9b7d99e | 2009-12-22 04:25:02 +0000 | [diff] [blame] | 978 | ExistingResult->setResult(Dep); |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 979 | else |
Chris Lattner | 9b7d99e | 2009-12-22 04:25:02 +0000 | [diff] [blame] | 980 | Cache->push_back(NonLocalDepEntry(BB, Dep)); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 981 | |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 982 | // If the block has a dependency (i.e. it isn't completely transparent to |
| 983 | // the value), remember the reverse association because we just added it |
| 984 | // to Cache! |
Eli Friedman | c1702c8 | 2011-10-13 22:14:57 +0000 | [diff] [blame] | 985 | if (!Dep.isDef() && !Dep.isClobber()) |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 986 | return Dep; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 987 | |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 988 | // Keep the ReverseNonLocalPtrDeps map up to date so we can efficiently |
| 989 | // update MemDep when we remove instructions. |
| 990 | Instruction *Inst = Dep.getInst(); |
| 991 | assert(Inst && "Didn't depend on anything?"); |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 992 | ValueIsLoadPair CacheKey(Loc.Ptr, isLoad); |
Chris Lattner | 8eda11b | 2009-03-29 00:24:04 +0000 | [diff] [blame] | 993 | ReverseNonLocalPtrDeps[Inst].insert(CacheKey); |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 994 | return Dep; |
| 995 | } |
| 996 | |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 997 | /// Sort the NonLocalDepInfo cache, given a certain number of elements in the |
| 998 | /// array that are already properly ordered. |
| 999 | /// |
| 1000 | /// This is optimized for the case when only a few entries are added. |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1001 | static void |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1002 | SortNonLocalDepInfoCache(MemoryDependenceResults::NonLocalDepInfo &Cache, |
Chris Lattner | 370aada | 2009-07-13 17:20:05 +0000 | [diff] [blame] | 1003 | unsigned NumSortedEntries) { |
| 1004 | switch (Cache.size() - NumSortedEntries) { |
| 1005 | case 0: |
| 1006 | // done, no new entries. |
| 1007 | break; |
| 1008 | case 2: { |
| 1009 | // Two new entries, insert the last one into place. |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 1010 | NonLocalDepEntry Val = Cache.back(); |
Chris Lattner | 370aada | 2009-07-13 17:20:05 +0000 | [diff] [blame] | 1011 | Cache.pop_back(); |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1012 | MemoryDependenceResults::NonLocalDepInfo::iterator Entry = |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1013 | std::upper_bound(Cache.begin(), Cache.end() - 1, Val); |
Chris Lattner | 370aada | 2009-07-13 17:20:05 +0000 | [diff] [blame] | 1014 | Cache.insert(Entry, Val); |
| 1015 | // FALL THROUGH. |
| 1016 | } |
| 1017 | case 1: |
| 1018 | // One new entry, Just insert the new value at the appropriate position. |
| 1019 | if (Cache.size() != 1) { |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 1020 | NonLocalDepEntry Val = Cache.back(); |
Chris Lattner | 370aada | 2009-07-13 17:20:05 +0000 | [diff] [blame] | 1021 | Cache.pop_back(); |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1022 | MemoryDependenceResults::NonLocalDepInfo::iterator Entry = |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1023 | std::upper_bound(Cache.begin(), Cache.end(), Val); |
Chris Lattner | 370aada | 2009-07-13 17:20:05 +0000 | [diff] [blame] | 1024 | Cache.insert(Entry, Val); |
| 1025 | } |
| 1026 | break; |
| 1027 | default: |
| 1028 | // Added many values, do a full scale sort. |
| 1029 | std::sort(Cache.begin(), Cache.end()); |
| 1030 | break; |
| 1031 | } |
| 1032 | } |
| 1033 | |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 1034 | /// Perform a dependency query based on pointer/pointeesize starting at the end |
| 1035 | /// of StartBB. |
| 1036 | /// |
| 1037 | /// Add any clobber/def results to the results vector and keep track of which |
| 1038 | /// blocks are visited in 'Visited'. |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1039 | /// |
| 1040 | /// This has special behavior for the first block queries (when SkipFirstBlock |
| 1041 | /// is true). In this special case, it ignores the contents of the specified |
| 1042 | /// block and starts returning dependence info for its predecessors. |
| 1043 | /// |
Chandler Carruth | b32febe | 2016-03-07 12:45:07 +0000 | [diff] [blame] | 1044 | /// This function returns true on success, or false to indicate that it could |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1045 | /// not compute dependence information for some reason. This should be treated |
| 1046 | /// as a clobber dependence on the first instruction in the predecessor block. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1047 | bool MemoryDependenceResults::getNonLocalPointerDepFromBB( |
Chandler Carruth | ac80dc7 | 2015-06-17 07:18:54 +0000 | [diff] [blame] | 1048 | Instruction *QueryInst, const PHITransAddr &Pointer, |
| 1049 | const MemoryLocation &Loc, bool isLoad, BasicBlock *StartBB, |
| 1050 | SmallVectorImpl<NonLocalDepResult> &Result, |
| 1051 | DenseMap<BasicBlock *, Value *> &Visited, bool SkipFirstBlock) { |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1052 | // Look up the cached info for Pointer. |
Chris Lattner | 972e6d8 | 2009-12-09 01:59:31 +0000 | [diff] [blame] | 1053 | ValueIsLoadPair CacheKey(Pointer.getAddr(), isLoad); |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1054 | |
Dan Gohman | 0a6021a | 2010-11-10 20:37:15 +0000 | [diff] [blame] | 1055 | // Set up a temporary NLPI value. If the map doesn't yet have an entry for |
| 1056 | // CacheKey, this value will be inserted as the associated value. Otherwise, |
| 1057 | // it'll be ignored, and we'll have to check to see if the cached size and |
Hal Finkel | cc39b67 | 2014-07-24 12:16:19 +0000 | [diff] [blame] | 1058 | // aa tags are consistent with the current query. |
Dan Gohman | 0a6021a | 2010-11-10 20:37:15 +0000 | [diff] [blame] | 1059 | NonLocalPointerInfo InitialNLPI; |
| 1060 | InitialNLPI.Size = Loc.Size; |
Hal Finkel | cc39b67 | 2014-07-24 12:16:19 +0000 | [diff] [blame] | 1061 | InitialNLPI.AATags = Loc.AATags; |
Dan Gohman | 0a6021a | 2010-11-10 20:37:15 +0000 | [diff] [blame] | 1062 | |
| 1063 | // Get the NLPI for CacheKey, inserting one into the map if it doesn't |
| 1064 | // already have one. |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1065 | std::pair<CachedNonLocalPointerInfo::iterator, bool> Pair = |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1066 | NonLocalPointerDeps.insert(std::make_pair(CacheKey, InitialNLPI)); |
Dan Gohman | 0a6021a | 2010-11-10 20:37:15 +0000 | [diff] [blame] | 1067 | NonLocalPointerInfo *CacheInfo = &Pair.first->second; |
| 1068 | |
Dan Gohman | 2e8ca44 | 2010-11-10 21:45:11 +0000 | [diff] [blame] | 1069 | // If we already have a cache entry for this CacheKey, we may need to do some |
| 1070 | // work to reconcile the cache entry and the current query. |
Dan Gohman | 0a6021a | 2010-11-10 20:37:15 +0000 | [diff] [blame] | 1071 | if (!Pair.second) { |
Dan Gohman | 2e8ca44 | 2010-11-10 21:45:11 +0000 | [diff] [blame] | 1072 | if (CacheInfo->Size < Loc.Size) { |
| 1073 | // The query's Size is greater than the cached one. Throw out the |
Benjamin Kramer | bde9176 | 2012-06-02 10:20:22 +0000 | [diff] [blame] | 1074 | // cached data and proceed with the query at the greater size. |
Dan Gohman | 2e8ca44 | 2010-11-10 21:45:11 +0000 | [diff] [blame] | 1075 | CacheInfo->Pair = BBSkipFirstBlockPair(); |
| 1076 | CacheInfo->Size = Loc.Size; |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1077 | for (auto &Entry : CacheInfo->NonLocalDeps) |
| 1078 | if (Instruction *Inst = Entry.getResult().getInst()) |
Dan Gohman | 6791936 | 2010-11-10 22:35:02 +0000 | [diff] [blame] | 1079 | RemoveFromReverseMap(ReverseNonLocalPtrDeps, Inst, CacheKey); |
Dan Gohman | 2e8ca44 | 2010-11-10 21:45:11 +0000 | [diff] [blame] | 1080 | CacheInfo->NonLocalDeps.clear(); |
| 1081 | } else if (CacheInfo->Size > Loc.Size) { |
| 1082 | // This query's Size is less than the cached one. Conservatively restart |
| 1083 | // the query using the greater size. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1084 | return getNonLocalPointerDepFromBB( |
| 1085 | QueryInst, Pointer, Loc.getWithNewSize(CacheInfo->Size), isLoad, |
| 1086 | StartBB, Result, Visited, SkipFirstBlock); |
Dan Gohman | 0a6021a | 2010-11-10 20:37:15 +0000 | [diff] [blame] | 1087 | } |
| 1088 | |
Hal Finkel | cc39b67 | 2014-07-24 12:16:19 +0000 | [diff] [blame] | 1089 | // If the query's AATags are inconsistent with the cached one, |
Dan Gohman | 2e8ca44 | 2010-11-10 21:45:11 +0000 | [diff] [blame] | 1090 | // conservatively throw out the cached data and restart the query with |
| 1091 | // no tag if needed. |
Hal Finkel | cc39b67 | 2014-07-24 12:16:19 +0000 | [diff] [blame] | 1092 | if (CacheInfo->AATags != Loc.AATags) { |
| 1093 | if (CacheInfo->AATags) { |
Dan Gohman | 2e8ca44 | 2010-11-10 21:45:11 +0000 | [diff] [blame] | 1094 | CacheInfo->Pair = BBSkipFirstBlockPair(); |
Hal Finkel | cc39b67 | 2014-07-24 12:16:19 +0000 | [diff] [blame] | 1095 | CacheInfo->AATags = AAMDNodes(); |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1096 | for (auto &Entry : CacheInfo->NonLocalDeps) |
| 1097 | if (Instruction *Inst = Entry.getResult().getInst()) |
Dan Gohman | 6791936 | 2010-11-10 22:35:02 +0000 | [diff] [blame] | 1098 | RemoveFromReverseMap(ReverseNonLocalPtrDeps, Inst, CacheKey); |
Dan Gohman | 2e8ca44 | 2010-11-10 21:45:11 +0000 | [diff] [blame] | 1099 | CacheInfo->NonLocalDeps.clear(); |
| 1100 | } |
Hal Finkel | cc39b67 | 2014-07-24 12:16:19 +0000 | [diff] [blame] | 1101 | if (Loc.AATags) |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1102 | return getNonLocalPointerDepFromBB( |
| 1103 | QueryInst, Pointer, Loc.getWithoutAATags(), isLoad, StartBB, Result, |
| 1104 | Visited, SkipFirstBlock); |
Dan Gohman | 0a6021a | 2010-11-10 20:37:15 +0000 | [diff] [blame] | 1105 | } |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1106 | } |
| 1107 | |
| 1108 | NonLocalDepInfo *Cache = &CacheInfo->NonLocalDeps; |
Chris Lattner | 5ed409e | 2008-12-08 07:31:50 +0000 | [diff] [blame] | 1109 | |
| 1110 | // If we have valid cached information for exactly the block we are |
| 1111 | // investigating, just return it with no recomputation. |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1112 | if (CacheInfo->Pair == BBSkipFirstBlockPair(StartBB, SkipFirstBlock)) { |
Chris Lattner | 8b4be37 | 2008-12-16 07:10:09 +0000 | [diff] [blame] | 1113 | // We have a fully cached result for this query then we can just return the |
| 1114 | // cached results and populate the visited set. However, we have to verify |
| 1115 | // that we don't already have conflicting results for these blocks. Check |
| 1116 | // to ensure that if a block in the results set is in the visited set that |
| 1117 | // it was for the same pointer query. |
| 1118 | if (!Visited.empty()) { |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1119 | for (auto &Entry : *Cache) { |
| 1120 | DenseMap<BasicBlock *, Value *>::iterator VI = |
| 1121 | Visited.find(Entry.getBB()); |
Chris Lattner | 972e6d8 | 2009-12-09 01:59:31 +0000 | [diff] [blame] | 1122 | if (VI == Visited.end() || VI->second == Pointer.getAddr()) |
| 1123 | continue; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1124 | |
Chandler Carruth | b32febe | 2016-03-07 12:45:07 +0000 | [diff] [blame] | 1125 | // We have a pointer mismatch in a block. Just return false, saying |
Chris Lattner | 8b4be37 | 2008-12-16 07:10:09 +0000 | [diff] [blame] | 1126 | // that something was clobbered in this result. We could also do a |
| 1127 | // non-fully cached query, but there is little point in doing this. |
Chandler Carruth | b32febe | 2016-03-07 12:45:07 +0000 | [diff] [blame] | 1128 | return false; |
Chris Lattner | 8b4be37 | 2008-12-16 07:10:09 +0000 | [diff] [blame] | 1129 | } |
| 1130 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1131 | |
Chris Lattner | 9b7d99e | 2009-12-22 04:25:02 +0000 | [diff] [blame] | 1132 | Value *Addr = Pointer.getAddr(); |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1133 | for (auto &Entry : *Cache) { |
| 1134 | Visited.insert(std::make_pair(Entry.getBB(), Addr)); |
| 1135 | if (Entry.getResult().isNonLocal()) { |
Matt Arsenault | c23753a | 2013-05-06 02:07:24 +0000 | [diff] [blame] | 1136 | continue; |
| 1137 | } |
| 1138 | |
Chandler Carruth | aef32bd | 2016-03-11 13:46:00 +0000 | [diff] [blame] | 1139 | if (DT.isReachableFromEntry(Entry.getBB())) { |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1140 | Result.push_back( |
| 1141 | NonLocalDepResult(Entry.getBB(), Entry.getResult(), Addr)); |
Matt Arsenault | c23753a | 2013-05-06 02:07:24 +0000 | [diff] [blame] | 1142 | } |
Chris Lattner | 8b4be37 | 2008-12-16 07:10:09 +0000 | [diff] [blame] | 1143 | } |
Chris Lattner | 5ed409e | 2008-12-08 07:31:50 +0000 | [diff] [blame] | 1144 | ++NumCacheCompleteNonLocalPtr; |
Chandler Carruth | b32febe | 2016-03-07 12:45:07 +0000 | [diff] [blame] | 1145 | return true; |
Chris Lattner | 5ed409e | 2008-12-08 07:31:50 +0000 | [diff] [blame] | 1146 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1147 | |
Chris Lattner | 5ed409e | 2008-12-08 07:31:50 +0000 | [diff] [blame] | 1148 | // Otherwise, either this is a new block, a block with an invalid cache |
| 1149 | // pointer or one that we're about to invalidate by putting more info into it |
| 1150 | // than its valid cache info. If empty, the result will be valid cache info, |
| 1151 | // otherwise it isn't. |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1152 | if (Cache->empty()) |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1153 | CacheInfo->Pair = BBSkipFirstBlockPair(StartBB, SkipFirstBlock); |
Dan Gohman | c87c843 | 2010-11-11 00:42:22 +0000 | [diff] [blame] | 1154 | else |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1155 | CacheInfo->Pair = BBSkipFirstBlockPair(); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1156 | |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1157 | SmallVector<BasicBlock *, 32> Worklist; |
Chris Lattner | 5ed409e | 2008-12-08 07:31:50 +0000 | [diff] [blame] | 1158 | Worklist.push_back(StartBB); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1159 | |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1160 | // PredList used inside loop. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1161 | SmallVector<std::pair<BasicBlock *, PHITransAddr>, 16> PredList; |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1162 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1163 | // Keep track of the entries that we know are sorted. Previously cached |
| 1164 | // entries will all be sorted. The entries we add we only sort on demand (we |
| 1165 | // don't insert every element into its sorted position). We know that we |
| 1166 | // won't get any reuse from currently inserted values, because we don't |
| 1167 | // revisit blocks after we insert info for them. |
| 1168 | unsigned NumSortedEntries = Cache->size(); |
Joerg Sonnenberger | 36894dc | 2016-02-20 11:24:44 +0000 | [diff] [blame] | 1169 | unsigned WorklistEntries = BlockNumberLimit; |
| 1170 | bool GotWorklistLimit = false; |
Chris Lattner | f09619d | 2009-01-22 07:04:01 +0000 | [diff] [blame] | 1171 | DEBUG(AssertSorted(*Cache)); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1172 | |
Chris Lattner | 2faa2c7 | 2008-12-07 02:15:47 +0000 | [diff] [blame] | 1173 | while (!Worklist.empty()) { |
Chris Lattner | 7564a3b | 2008-12-07 02:56:57 +0000 | [diff] [blame] | 1174 | BasicBlock *BB = Worklist.pop_back_val(); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1175 | |
Bruno Cardoso Lopes | e3c513a | 2014-10-01 20:07:13 +0000 | [diff] [blame] | 1176 | // If we do process a large number of blocks it becomes very expensive and |
| 1177 | // likely it isn't worth worrying about |
| 1178 | if (Result.size() > NumResultsLimit) { |
| 1179 | Worklist.clear(); |
| 1180 | // Sort it now (if needed) so that recursive invocations of |
| 1181 | // getNonLocalPointerDepFromBB and other routines that could reuse the |
| 1182 | // cache value will only see properly sorted cache arrays. |
| 1183 | if (Cache && NumSortedEntries != Cache->size()) { |
| 1184 | SortNonLocalDepInfoCache(*Cache, NumSortedEntries); |
Bruno Cardoso Lopes | e3c513a | 2014-10-01 20:07:13 +0000 | [diff] [blame] | 1185 | } |
| 1186 | // Since we bail out, the "Cache" set won't contain all of the |
| 1187 | // results for the query. This is ok (we can still use it to accelerate |
| 1188 | // specific block queries) but we can't do the fastpath "return all |
| 1189 | // results from the set". Clear out the indicator for this. |
| 1190 | CacheInfo->Pair = BBSkipFirstBlockPair(); |
Chandler Carruth | b32febe | 2016-03-07 12:45:07 +0000 | [diff] [blame] | 1191 | return false; |
Bruno Cardoso Lopes | e3c513a | 2014-10-01 20:07:13 +0000 | [diff] [blame] | 1192 | } |
| 1193 | |
Chris Lattner | 75510d8 | 2008-12-09 07:52:59 +0000 | [diff] [blame] | 1194 | // Skip the first block if we have it. |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1195 | if (!SkipFirstBlock) { |
Chris Lattner | 75510d8 | 2008-12-09 07:52:59 +0000 | [diff] [blame] | 1196 | // Analyze the dependency of *Pointer in FromBB. See if we already have |
| 1197 | // been here. |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1198 | assert(Visited.count(BB) && "Should check 'visited' before adding to WL"); |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1199 | |
Chris Lattner | 75510d8 | 2008-12-09 07:52:59 +0000 | [diff] [blame] | 1200 | // Get the dependency info for Pointer in BB. If we have cached |
| 1201 | // information, we will use it, otherwise we compute it. |
Chris Lattner | f09619d | 2009-01-22 07:04:01 +0000 | [diff] [blame] | 1202 | DEBUG(AssertSorted(*Cache, NumSortedEntries)); |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1203 | MemDepResult Dep = GetNonLocalInfoForBlock(QueryInst, Loc, isLoad, BB, |
| 1204 | Cache, NumSortedEntries); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1205 | |
Chris Lattner | 75510d8 | 2008-12-09 07:52:59 +0000 | [diff] [blame] | 1206 | // If we got a Def or Clobber, add this to the list of results. |
Matt Arsenault | c23753a | 2013-05-06 02:07:24 +0000 | [diff] [blame] | 1207 | if (!Dep.isNonLocal()) { |
Chandler Carruth | aef32bd | 2016-03-11 13:46:00 +0000 | [diff] [blame] | 1208 | if (DT.isReachableFromEntry(BB)) { |
Matt Arsenault | c23753a | 2013-05-06 02:07:24 +0000 | [diff] [blame] | 1209 | Result.push_back(NonLocalDepResult(BB, Dep, Pointer.getAddr())); |
| 1210 | continue; |
| 1211 | } |
Chris Lattner | 75510d8 | 2008-12-09 07:52:59 +0000 | [diff] [blame] | 1212 | } |
Chris Lattner | 2faa2c7 | 2008-12-07 02:15:47 +0000 | [diff] [blame] | 1213 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1214 | |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1215 | // If 'Pointer' is an instruction defined in this block, then we need to do |
| 1216 | // phi translation to change it into a value live in the predecessor block. |
Chris Lattner | 972e6d8 | 2009-12-09 01:59:31 +0000 | [diff] [blame] | 1217 | // If not, we just add the predecessors to the worklist and scan them with |
| 1218 | // the same Pointer. |
| 1219 | if (!Pointer.NeedsPHITranslationFromBlock(BB)) { |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1220 | SkipFirstBlock = false; |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1221 | SmallVector<BasicBlock *, 16> NewBlocks; |
Daniel Berlin | b4e7a4a | 2015-04-21 21:11:50 +0000 | [diff] [blame] | 1222 | for (BasicBlock *Pred : PredCache.get(BB)) { |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1223 | // Verify that we haven't looked at this block yet. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1224 | std::pair<DenseMap<BasicBlock *, Value *>::iterator, bool> InsertRes = |
| 1225 | Visited.insert(std::make_pair(Pred, Pointer.getAddr())); |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1226 | if (InsertRes.second) { |
| 1227 | // First time we've looked at *PI. |
Daniel Berlin | b4e7a4a | 2015-04-21 21:11:50 +0000 | [diff] [blame] | 1228 | NewBlocks.push_back(Pred); |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1229 | continue; |
| 1230 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1231 | |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1232 | // If we have seen this block before, but it was with a different |
| 1233 | // pointer then we have a phi translation failure and we have to treat |
| 1234 | // this as a clobber. |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1235 | if (InsertRes.first->second != Pointer.getAddr()) { |
| 1236 | // Make sure to clean up the Visited map before continuing on to |
| 1237 | // PredTranslationFailure. |
| 1238 | for (unsigned i = 0; i < NewBlocks.size(); i++) |
| 1239 | Visited.erase(NewBlocks[i]); |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1240 | goto PredTranslationFailure; |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1241 | } |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1242 | } |
Joerg Sonnenberger | 36894dc | 2016-02-20 11:24:44 +0000 | [diff] [blame] | 1243 | if (NewBlocks.size() > WorklistEntries) { |
| 1244 | // Make sure to clean up the Visited map before continuing on to |
| 1245 | // PredTranslationFailure. |
| 1246 | for (unsigned i = 0; i < NewBlocks.size(); i++) |
| 1247 | Visited.erase(NewBlocks[i]); |
| 1248 | GotWorklistLimit = true; |
| 1249 | goto PredTranslationFailure; |
| 1250 | } |
| 1251 | WorklistEntries -= NewBlocks.size(); |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1252 | Worklist.append(NewBlocks.begin(), NewBlocks.end()); |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1253 | continue; |
| 1254 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1255 | |
Chris Lattner | 972e6d8 | 2009-12-09 01:59:31 +0000 | [diff] [blame] | 1256 | // We do need to do phi translation, if we know ahead of time we can't phi |
| 1257 | // translate this value, don't even try. |
| 1258 | if (!Pointer.IsPotentiallyPHITranslatable()) |
| 1259 | goto PredTranslationFailure; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1260 | |
Chris Lattner | 2f0c1c4 | 2009-07-13 17:14:23 +0000 | [diff] [blame] | 1261 | // We may have added values to the cache list before this PHI translation. |
| 1262 | // If so, we haven't done anything to ensure that the cache remains sorted. |
| 1263 | // Sort it now (if needed) so that recursive invocations of |
| 1264 | // getNonLocalPointerDepFromBB and other routines that could reuse the cache |
| 1265 | // value will only see properly sorted cache arrays. |
| 1266 | if (Cache && NumSortedEntries != Cache->size()) { |
Chris Lattner | 370aada | 2009-07-13 17:20:05 +0000 | [diff] [blame] | 1267 | SortNonLocalDepInfoCache(*Cache, NumSortedEntries); |
Chris Lattner | 2f0c1c4 | 2009-07-13 17:14:23 +0000 | [diff] [blame] | 1268 | NumSortedEntries = Cache->size(); |
| 1269 | } |
Craig Topper | 9f00886 | 2014-04-15 04:59:12 +0000 | [diff] [blame] | 1270 | Cache = nullptr; |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1271 | |
| 1272 | PredList.clear(); |
Daniel Berlin | b4e7a4a | 2015-04-21 21:11:50 +0000 | [diff] [blame] | 1273 | for (BasicBlock *Pred : PredCache.get(BB)) { |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1274 | PredList.push_back(std::make_pair(Pred, Pointer)); |
| 1275 | |
Chris Lattner | 972e6d8 | 2009-12-09 01:59:31 +0000 | [diff] [blame] | 1276 | // Get the PHI translated pointer in this predecessor. This can fail if |
| 1277 | // not translatable, in which case the getAddr() returns null. |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1278 | PHITransAddr &PredPointer = PredList.back().second; |
Chandler Carruth | aef32bd | 2016-03-11 13:46:00 +0000 | [diff] [blame] | 1279 | PredPointer.PHITranslateValue(BB, Pred, &DT, /*MustDominate=*/false); |
Chris Lattner | 972e6d8 | 2009-12-09 01:59:31 +0000 | [diff] [blame] | 1280 | Value *PredPtrVal = PredPointer.getAddr(); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1281 | |
Chris Lattner | ac32329 | 2009-11-27 08:37:22 +0000 | [diff] [blame] | 1282 | // Check to see if we have already visited this pred block with another |
| 1283 | // pointer. If so, we can't do this lookup. This failure can occur |
| 1284 | // with PHI translation when a critical edge exists and the PHI node in |
| 1285 | // the successor translates to a pointer value different than the |
| 1286 | // pointer the block was first analyzed with. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1287 | std::pair<DenseMap<BasicBlock *, Value *>::iterator, bool> InsertRes = |
| 1288 | Visited.insert(std::make_pair(Pred, PredPtrVal)); |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1289 | |
Chris Lattner | ac32329 | 2009-11-27 08:37:22 +0000 | [diff] [blame] | 1290 | if (!InsertRes.second) { |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1291 | // We found the pred; take it off the list of preds to visit. |
| 1292 | PredList.pop_back(); |
| 1293 | |
Chris Lattner | ac32329 | 2009-11-27 08:37:22 +0000 | [diff] [blame] | 1294 | // If the predecessor was visited with PredPtr, then we already did |
| 1295 | // the analysis and can ignore it. |
Chris Lattner | 972e6d8 | 2009-12-09 01:59:31 +0000 | [diff] [blame] | 1296 | if (InsertRes.first->second == PredPtrVal) |
Chris Lattner | ac32329 | 2009-11-27 08:37:22 +0000 | [diff] [blame] | 1297 | continue; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1298 | |
Chris Lattner | ac32329 | 2009-11-27 08:37:22 +0000 | [diff] [blame] | 1299 | // Otherwise, the block was previously analyzed with a different |
| 1300 | // pointer. We can't represent the result of this case, so we just |
| 1301 | // treat this as a phi translation failure. |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1302 | |
| 1303 | // Make sure to clean up the Visited map before continuing on to |
| 1304 | // PredTranslationFailure. |
Matt Arsenault | 2080ecd | 2013-03-29 18:48:42 +0000 | [diff] [blame] | 1305 | for (unsigned i = 0, n = PredList.size(); i < n; ++i) |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1306 | Visited.erase(PredList[i].first); |
| 1307 | |
Chris Lattner | ac32329 | 2009-11-27 08:37:22 +0000 | [diff] [blame] | 1308 | goto PredTranslationFailure; |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1309 | } |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1310 | } |
| 1311 | |
| 1312 | // Actually process results here; this need to be a separate loop to avoid |
| 1313 | // calling getNonLocalPointerDepFromBB for blocks we don't want to return |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1314 | // any results for. (getNonLocalPointerDepFromBB will modify our |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1315 | // datastructures in ways the code after the PredTranslationFailure label |
| 1316 | // doesn't expect.) |
Matt Arsenault | 2080ecd | 2013-03-29 18:48:42 +0000 | [diff] [blame] | 1317 | for (unsigned i = 0, n = PredList.size(); i < n; ++i) { |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1318 | BasicBlock *Pred = PredList[i].first; |
| 1319 | PHITransAddr &PredPointer = PredList[i].second; |
| 1320 | Value *PredPtrVal = PredPointer.getAddr(); |
| 1321 | |
| 1322 | bool CanTranslate = true; |
Chris Lattner | 2be52e7 | 2009-11-27 22:05:15 +0000 | [diff] [blame] | 1323 | // If PHI translation was unable to find an available pointer in this |
| 1324 | // predecessor, then we have to assume that the pointer is clobbered in |
| 1325 | // that predecessor. We can still do PRE of the load, which would insert |
| 1326 | // a computation of the pointer in this predecessor. |
Craig Topper | 9f00886 | 2014-04-15 04:59:12 +0000 | [diff] [blame] | 1327 | if (!PredPtrVal) |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1328 | CanTranslate = false; |
| 1329 | |
| 1330 | // FIXME: it is entirely possible that PHI translating will end up with |
| 1331 | // the same value. Consider PHI translating something like: |
| 1332 | // X = phi [x, bb1], [y, bb2]. PHI translating for bb1 doesn't *need* |
| 1333 | // to recurse here, pedantically speaking. |
| 1334 | |
| 1335 | // If getNonLocalPointerDepFromBB fails here, that means the cached |
| 1336 | // result conflicted with the Visited list; we have to conservatively |
Eli Friedman | 7d58bc7 | 2011-06-15 00:47:34 +0000 | [diff] [blame] | 1337 | // assume it is unknown, but this also does not block PRE of the load. |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1338 | if (!CanTranslate || |
Chandler Carruth | b32febe | 2016-03-07 12:45:07 +0000 | [diff] [blame] | 1339 | !getNonLocalPointerDepFromBB(QueryInst, PredPointer, |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1340 | Loc.getWithNewPtr(PredPtrVal), isLoad, |
| 1341 | Pred, Result, Visited)) { |
Chris Lattner | 9c2053b | 2009-12-01 07:33:32 +0000 | [diff] [blame] | 1342 | // Add the entry to the Result list. |
Eli Friedman | 7d58bc7 | 2011-06-15 00:47:34 +0000 | [diff] [blame] | 1343 | NonLocalDepResult Entry(Pred, MemDepResult::getUnknown(), PredPtrVal); |
Chris Lattner | 9c2053b | 2009-12-01 07:33:32 +0000 | [diff] [blame] | 1344 | Result.push_back(Entry); |
| 1345 | |
Chris Lattner | 25bf6f8 | 2009-12-19 21:29:22 +0000 | [diff] [blame] | 1346 | // Since we had a phi translation failure, the cache for CacheKey won't |
| 1347 | // include all of the entries that we need to immediately satisfy future |
| 1348 | // queries. Mark this in NonLocalPointerDeps by setting the |
| 1349 | // BBSkipFirstBlockPair pointer to null. This requires reuse of the |
| 1350 | // cached value to do more work but not miss the phi trans failure. |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1351 | NonLocalPointerInfo &NLPI = NonLocalPointerDeps[CacheKey]; |
| 1352 | NLPI.Pair = BBSkipFirstBlockPair(); |
Chris Lattner | 2be52e7 | 2009-11-27 22:05:15 +0000 | [diff] [blame] | 1353 | continue; |
Chris Lattner | 2be52e7 | 2009-11-27 22:05:15 +0000 | [diff] [blame] | 1354 | } |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1355 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1356 | |
Chris Lattner | ac32329 | 2009-11-27 08:37:22 +0000 | [diff] [blame] | 1357 | // Refresh the CacheInfo/Cache pointer so that it isn't invalidated. |
| 1358 | CacheInfo = &NonLocalPointerDeps[CacheKey]; |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1359 | Cache = &CacheInfo->NonLocalDeps; |
Chris Lattner | ac32329 | 2009-11-27 08:37:22 +0000 | [diff] [blame] | 1360 | NumSortedEntries = Cache->size(); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1361 | |
Chris Lattner | ac32329 | 2009-11-27 08:37:22 +0000 | [diff] [blame] | 1362 | // Since we did phi translation, the "Cache" set won't contain all of the |
| 1363 | // results for the query. This is ok (we can still use it to accelerate |
| 1364 | // specific block queries) but we can't do the fastpath "return all |
| 1365 | // results from the set" Clear out the indicator for this. |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1366 | CacheInfo->Pair = BBSkipFirstBlockPair(); |
Chris Lattner | ac32329 | 2009-11-27 08:37:22 +0000 | [diff] [blame] | 1367 | SkipFirstBlock = false; |
| 1368 | continue; |
Chris Lattner | c49f5ac | 2009-11-26 23:18:49 +0000 | [diff] [blame] | 1369 | |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1370 | PredTranslationFailure: |
Eli Friedman | 4b6eeb9 | 2011-06-01 23:16:53 +0000 | [diff] [blame] | 1371 | // The following code is "failure"; we can't produce a sane translation |
| 1372 | // for the given block. It assumes that we haven't modified any of |
| 1373 | // our datastructures while processing the current block. |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1374 | |
Craig Topper | 9f00886 | 2014-04-15 04:59:12 +0000 | [diff] [blame] | 1375 | if (!Cache) { |
Chris Lattner | 3f4591c | 2009-01-23 07:12:16 +0000 | [diff] [blame] | 1376 | // Refresh the CacheInfo/Cache pointer if it got invalidated. |
| 1377 | CacheInfo = &NonLocalPointerDeps[CacheKey]; |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1378 | Cache = &CacheInfo->NonLocalDeps; |
Chris Lattner | 3f4591c | 2009-01-23 07:12:16 +0000 | [diff] [blame] | 1379 | NumSortedEntries = Cache->size(); |
Chris Lattner | 3f4591c | 2009-01-23 07:12:16 +0000 | [diff] [blame] | 1380 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1381 | |
Chris Lattner | 25bf6f8 | 2009-12-19 21:29:22 +0000 | [diff] [blame] | 1382 | // Since we failed phi translation, the "Cache" set won't contain all of the |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1383 | // results for the query. This is ok (we can still use it to accelerate |
| 1384 | // specific block queries) but we can't do the fastpath "return all |
Chris Lattner | 25bf6f8 | 2009-12-19 21:29:22 +0000 | [diff] [blame] | 1385 | // results from the set". Clear out the indicator for this. |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1386 | CacheInfo->Pair = BBSkipFirstBlockPair(); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1387 | |
Eli Friedman | 7d58bc7 | 2011-06-15 00:47:34 +0000 | [diff] [blame] | 1388 | // If *nothing* works, mark the pointer as unknown. |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1389 | // |
| 1390 | // If this is the magic first block, return this as a clobber of the whole |
| 1391 | // incoming value. Since we can't phi translate to one of the predecessors, |
| 1392 | // we have to bail out. |
| 1393 | if (SkipFirstBlock) |
Chandler Carruth | b32febe | 2016-03-07 12:45:07 +0000 | [diff] [blame] | 1394 | return false; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1395 | |
Joerg Sonnenberger | 36894dc | 2016-02-20 11:24:44 +0000 | [diff] [blame] | 1396 | bool foundBlock = false; |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1397 | for (NonLocalDepEntry &I : llvm::reverse(*Cache)) { |
Joerg Sonnenberger | 36894dc | 2016-02-20 11:24:44 +0000 | [diff] [blame] | 1398 | if (I.getBB() != BB) |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1399 | continue; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1400 | |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1401 | assert((GotWorklistLimit || I.getResult().isNonLocal() || |
Chandler Carruth | aef32bd | 2016-03-11 13:46:00 +0000 | [diff] [blame] | 1402 | !DT.isReachableFromEntry(BB)) && |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1403 | "Should only be here with transparent block"); |
Joerg Sonnenberger | 36894dc | 2016-02-20 11:24:44 +0000 | [diff] [blame] | 1404 | foundBlock = true; |
| 1405 | I.setResult(MemDepResult::getUnknown()); |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1406 | Result.push_back( |
| 1407 | NonLocalDepResult(I.getBB(), I.getResult(), Pointer.getAddr())); |
Chris Lattner | ff9f3db | 2008-12-15 03:35:32 +0000 | [diff] [blame] | 1408 | break; |
Chris Lattner | 7564a3b | 2008-12-07 02:56:57 +0000 | [diff] [blame] | 1409 | } |
Joerg Sonnenberger | 36894dc | 2016-02-20 11:24:44 +0000 | [diff] [blame] | 1410 | (void)foundBlock; |
| 1411 | assert((foundBlock || GotWorklistLimit) && "Current block not in cache?"); |
Chris Lattner | 2faa2c7 | 2008-12-07 02:15:47 +0000 | [diff] [blame] | 1412 | } |
Chris Lattner | 3f4591c | 2009-01-23 07:12:16 +0000 | [diff] [blame] | 1413 | |
Chris Lattner | f903fe1 | 2008-12-09 07:47:11 +0000 | [diff] [blame] | 1414 | // Okay, we're done now. If we added new values to the cache, re-sort it. |
Chris Lattner | 370aada | 2009-07-13 17:20:05 +0000 | [diff] [blame] | 1415 | SortNonLocalDepInfoCache(*Cache, NumSortedEntries); |
Chris Lattner | f09619d | 2009-01-22 07:04:01 +0000 | [diff] [blame] | 1416 | DEBUG(AssertSorted(*Cache)); |
Chandler Carruth | b32febe | 2016-03-07 12:45:07 +0000 | [diff] [blame] | 1417 | return true; |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1418 | } |
| 1419 | |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 1420 | /// If P exists in CachedNonLocalPointerInfo, remove it. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1421 | void MemoryDependenceResults::RemoveCachedNonLocalPointerDependencies( |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1422 | ValueIsLoadPair P) { |
| 1423 | CachedNonLocalPointerInfo::iterator It = NonLocalPointerDeps.find(P); |
| 1424 | if (It == NonLocalPointerDeps.end()) |
| 1425 | return; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1426 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1427 | // Remove all of the entries in the BB->val map. This involves removing |
| 1428 | // instructions from the reverse map. |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1429 | NonLocalDepInfo &PInfo = It->second.NonLocalDeps; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1430 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1431 | for (unsigned i = 0, e = PInfo.size(); i != e; ++i) { |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 1432 | Instruction *Target = PInfo[i].getResult().getInst(); |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1433 | if (!Target) |
| 1434 | continue; // Ignore non-local dep results. |
Chris Lattner | 0c31547 | 2009-12-09 07:08:01 +0000 | [diff] [blame] | 1435 | assert(Target->getParent() == PInfo[i].getBB()); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1436 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1437 | // Eliminating the dirty entry from 'Cache', so update the reverse info. |
Chris Lattner | 8eda11b | 2009-03-29 00:24:04 +0000 | [diff] [blame] | 1438 | RemoveFromReverseMap(ReverseNonLocalPtrDeps, Target, P); |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1439 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1440 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1441 | // Remove P from NonLocalPointerDeps (which deletes NonLocalDepInfo). |
| 1442 | NonLocalPointerDeps.erase(It); |
Chris Lattner | 2faa2c7 | 2008-12-07 02:15:47 +0000 | [diff] [blame] | 1443 | } |
| 1444 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1445 | void MemoryDependenceResults::invalidateCachedPointerInfo(Value *Ptr) { |
Chris Lattner | fa9f99a | 2008-12-09 22:06:23 +0000 | [diff] [blame] | 1446 | // If Ptr isn't really a pointer, just ignore it. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1447 | if (!Ptr->getType()->isPointerTy()) |
| 1448 | return; |
Chris Lattner | fa9f99a | 2008-12-09 22:06:23 +0000 | [diff] [blame] | 1449 | // Flush store info for the pointer. |
| 1450 | RemoveCachedNonLocalPointerDependencies(ValueIsLoadPair(Ptr, false)); |
| 1451 | // Flush load info for the pointer. |
| 1452 | RemoveCachedNonLocalPointerDependencies(ValueIsLoadPair(Ptr, true)); |
| 1453 | } |
| 1454 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1455 | void MemoryDependenceResults::invalidateCachedPredecessors() { |
Daniel Berlin | b4e7a4a | 2015-04-21 21:11:50 +0000 | [diff] [blame] | 1456 | PredCache.clear(); |
Bob Wilson | 92cdb6e | 2010-02-16 19:51:59 +0000 | [diff] [blame] | 1457 | } |
| 1458 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1459 | void MemoryDependenceResults::removeInstruction(Instruction *RemInst) { |
Chris Lattner | a25d3952 | 2008-11-28 22:04:47 +0000 | [diff] [blame] | 1460 | // Walk through the Non-local dependencies, removing this one as the value |
| 1461 | // for any cached queries. |
Chris Lattner | 1b810bd | 2008-11-30 02:28:25 +0000 | [diff] [blame] | 1462 | NonLocalDepMapType::iterator NLDI = NonLocalDeps.find(RemInst); |
| 1463 | if (NLDI != NonLocalDeps.end()) { |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 1464 | NonLocalDepInfo &BlockMap = NLDI->second.first; |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1465 | for (auto &Entry : BlockMap) |
| 1466 | if (Instruction *Inst = Entry.getResult().getInst()) |
Chris Lattner | de4440c | 2008-12-07 18:39:13 +0000 | [diff] [blame] | 1467 | RemoveFromReverseMap(ReverseNonLocalDeps, Inst, RemInst); |
Chris Lattner | 1b810bd | 2008-11-30 02:28:25 +0000 | [diff] [blame] | 1468 | NonLocalDeps.erase(NLDI); |
| 1469 | } |
Owen Anderson | 086b2c4 | 2007-12-08 01:37:09 +0000 | [diff] [blame] | 1470 | |
Chris Lattner | a25d3952 | 2008-11-28 22:04:47 +0000 | [diff] [blame] | 1471 | // If we have a cached local dependence query for this instruction, remove it. |
Chris Lattner | 73c2545 | 2008-11-28 22:28:27 +0000 | [diff] [blame] | 1472 | // |
Chris Lattner | de04e11 | 2008-11-29 01:43:36 +0000 | [diff] [blame] | 1473 | LocalDepMapType::iterator LocalDepEntry = LocalDeps.find(RemInst); |
| 1474 | if (LocalDepEntry != LocalDeps.end()) { |
Chris Lattner | ada1f87 | 2008-11-30 01:09:30 +0000 | [diff] [blame] | 1475 | // Remove us from DepInst's reverse set now that the local dep info is gone. |
Chris Lattner | de4440c | 2008-12-07 18:39:13 +0000 | [diff] [blame] | 1476 | if (Instruction *Inst = LocalDepEntry->second.getInst()) |
| 1477 | RemoveFromReverseMap(ReverseLocalDeps, Inst, RemInst); |
Chris Lattner | ada1f87 | 2008-11-30 01:09:30 +0000 | [diff] [blame] | 1478 | |
Chris Lattner | 73c2545 | 2008-11-28 22:28:27 +0000 | [diff] [blame] | 1479 | // Remove this local dependency info. |
Chris Lattner | de04e11 | 2008-11-29 01:43:36 +0000 | [diff] [blame] | 1480 | LocalDeps.erase(LocalDepEntry); |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1481 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1482 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1483 | // If we have any cached pointer dependencies on this instruction, remove |
| 1484 | // them. If the instruction has non-pointer type, then it can't be a pointer |
| 1485 | // base. |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1486 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1487 | // Remove it from both the load info and the store info. The instruction |
| 1488 | // can't be in either of these maps if it is non-pointer. |
Duncan Sands | 19d0b47 | 2010-02-16 11:11:14 +0000 | [diff] [blame] | 1489 | if (RemInst->getType()->isPointerTy()) { |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1490 | RemoveCachedNonLocalPointerDependencies(ValueIsLoadPair(RemInst, false)); |
| 1491 | RemoveCachedNonLocalPointerDependencies(ValueIsLoadPair(RemInst, true)); |
| 1492 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1493 | |
Chris Lattner | d3d9111 | 2008-11-28 22:51:08 +0000 | [diff] [blame] | 1494 | // Loop over all of the things that depend on the instruction we're removing. |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1495 | // |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1496 | SmallVector<std::pair<Instruction *, Instruction *>, 8> ReverseDepsToAdd; |
Chris Lattner | 82b7034 | 2008-12-07 18:42:51 +0000 | [diff] [blame] | 1497 | |
| 1498 | // If we find RemInst as a clobber or Def in any of the maps for other values, |
| 1499 | // we need to replace its entry with a dirty version of the instruction after |
| 1500 | // it. If RemInst is a terminator, we use a null dirty value. |
| 1501 | // |
| 1502 | // Using a dirty version of the instruction after RemInst saves having to scan |
| 1503 | // the entire block to get to this point. |
| 1504 | MemDepResult NewDirtyVal; |
| 1505 | if (!RemInst->isTerminator()) |
Duncan P. N. Exon Smith | 5a82c91 | 2015-10-10 00:53:03 +0000 | [diff] [blame] | 1506 | NewDirtyVal = MemDepResult::getDirty(&*++RemInst->getIterator()); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1507 | |
Chris Lattner | 9f1988ab | 2008-11-29 09:20:15 +0000 | [diff] [blame] | 1508 | ReverseDepMapType::iterator ReverseDepIt = ReverseLocalDeps.find(RemInst); |
| 1509 | if (ReverseDepIt != ReverseLocalDeps.end()) { |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1510 | // RemInst can't be the terminator if it has local stuff depending on it. |
Craig Topper | 4627679 | 2014-08-24 23:23:06 +0000 | [diff] [blame] | 1511 | assert(!ReverseDepIt->second.empty() && !isa<TerminatorInst>(RemInst) && |
Chris Lattner | ada1f87 | 2008-11-30 01:09:30 +0000 | [diff] [blame] | 1512 | "Nothing can locally depend on a terminator"); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1513 | |
Craig Topper | 4627679 | 2014-08-24 23:23:06 +0000 | [diff] [blame] | 1514 | for (Instruction *InstDependingOnRemInst : ReverseDepIt->second) { |
Chris Lattner | 1b810bd | 2008-11-30 02:28:25 +0000 | [diff] [blame] | 1515 | assert(InstDependingOnRemInst != RemInst && |
| 1516 | "Already removed our local dep info"); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1517 | |
Chris Lattner | 82b7034 | 2008-12-07 18:42:51 +0000 | [diff] [blame] | 1518 | LocalDeps[InstDependingOnRemInst] = NewDirtyVal; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1519 | |
Chris Lattner | ada1f87 | 2008-11-30 01:09:30 +0000 | [diff] [blame] | 1520 | // Make sure to remember that new things depend on NewDepInst. |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1521 | assert(NewDirtyVal.getInst() && |
| 1522 | "There is no way something else can have " |
Chris Lattner | 82b7034 | 2008-12-07 18:42:51 +0000 | [diff] [blame] | 1523 | "a local dep on this if it is a terminator!"); |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1524 | ReverseDepsToAdd.push_back( |
| 1525 | std::make_pair(NewDirtyVal.getInst(), InstDependingOnRemInst)); |
Chris Lattner | d3d9111 | 2008-11-28 22:51:08 +0000 | [diff] [blame] | 1526 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1527 | |
Chris Lattner | 63bd586 | 2008-11-29 23:30:39 +0000 | [diff] [blame] | 1528 | ReverseLocalDeps.erase(ReverseDepIt); |
| 1529 | |
| 1530 | // Add new reverse deps after scanning the set, to avoid invalidating the |
| 1531 | // 'ReverseDeps' reference. |
| 1532 | while (!ReverseDepsToAdd.empty()) { |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1533 | ReverseLocalDeps[ReverseDepsToAdd.back().first].insert( |
| 1534 | ReverseDepsToAdd.back().second); |
Chris Lattner | 63bd586 | 2008-11-29 23:30:39 +0000 | [diff] [blame] | 1535 | ReverseDepsToAdd.pop_back(); |
| 1536 | } |
Owen Anderson | c0daf5f | 2007-07-06 23:14:35 +0000 | [diff] [blame] | 1537 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1538 | |
Chris Lattner | 9f1988ab | 2008-11-29 09:20:15 +0000 | [diff] [blame] | 1539 | ReverseDepIt = ReverseNonLocalDeps.find(RemInst); |
| 1540 | if (ReverseDepIt != ReverseNonLocalDeps.end()) { |
Craig Topper | 4627679 | 2014-08-24 23:23:06 +0000 | [diff] [blame] | 1541 | for (Instruction *I : ReverseDepIt->second) { |
| 1542 | assert(I != RemInst && "Already removed NonLocalDep info for RemInst"); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1543 | |
Craig Topper | 4627679 | 2014-08-24 23:23:06 +0000 | [diff] [blame] | 1544 | PerInstNLInfo &INLD = NonLocalDeps[I]; |
Chris Lattner | 4410427 | 2008-11-30 02:52:26 +0000 | [diff] [blame] | 1545 | // The information is now dirty! |
Chris Lattner | 7e61daf | 2008-12-01 01:15:42 +0000 | [diff] [blame] | 1546 | INLD.second = true; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1547 | |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1548 | for (auto &Entry : INLD.first) { |
| 1549 | if (Entry.getResult().getInst() != RemInst) |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1550 | continue; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1551 | |
Chris Lattner | 1b810bd | 2008-11-30 02:28:25 +0000 | [diff] [blame] | 1552 | // Convert to a dirty entry for the subsequent instruction. |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1553 | Entry.setResult(NewDirtyVal); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1554 | |
Chris Lattner | 82b7034 | 2008-12-07 18:42:51 +0000 | [diff] [blame] | 1555 | if (Instruction *NextI = NewDirtyVal.getInst()) |
Craig Topper | 4627679 | 2014-08-24 23:23:06 +0000 | [diff] [blame] | 1556 | ReverseDepsToAdd.push_back(std::make_pair(NextI, I)); |
Chris Lattner | 1b810bd | 2008-11-30 02:28:25 +0000 | [diff] [blame] | 1557 | } |
| 1558 | } |
Chris Lattner | 63bd586 | 2008-11-29 23:30:39 +0000 | [diff] [blame] | 1559 | |
| 1560 | ReverseNonLocalDeps.erase(ReverseDepIt); |
| 1561 | |
Chris Lattner | e7d7e13 | 2008-11-29 22:02:15 +0000 | [diff] [blame] | 1562 | // Add new reverse deps after scanning the set, to avoid invalidating 'Set' |
| 1563 | while (!ReverseDepsToAdd.empty()) { |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1564 | ReverseNonLocalDeps[ReverseDepsToAdd.back().first].insert( |
| 1565 | ReverseDepsToAdd.back().second); |
Chris Lattner | e7d7e13 | 2008-11-29 22:02:15 +0000 | [diff] [blame] | 1566 | ReverseDepsToAdd.pop_back(); |
| 1567 | } |
Owen Anderson | 5f208be | 2007-08-16 21:27:05 +0000 | [diff] [blame] | 1568 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1569 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1570 | // If the instruction is in ReverseNonLocalPtrDeps then it appears as a |
| 1571 | // value in the NonLocalPointerDeps info. |
| 1572 | ReverseNonLocalPtrDepTy::iterator ReversePtrDepIt = |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1573 | ReverseNonLocalPtrDeps.find(RemInst); |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1574 | if (ReversePtrDepIt != ReverseNonLocalPtrDeps.end()) { |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1575 | SmallVector<std::pair<Instruction *, ValueIsLoadPair>, 8> |
| 1576 | ReversePtrDepsToAdd; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1577 | |
Craig Topper | 4627679 | 2014-08-24 23:23:06 +0000 | [diff] [blame] | 1578 | for (ValueIsLoadPair P : ReversePtrDepIt->second) { |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1579 | assert(P.getPointer() != RemInst && |
| 1580 | "Already removed NonLocalPointerDeps info for RemInst"); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1581 | |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1582 | NonLocalDepInfo &NLPDI = NonLocalPointerDeps[P].NonLocalDeps; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1583 | |
Chris Lattner | 5ed409e | 2008-12-08 07:31:50 +0000 | [diff] [blame] | 1584 | // The cache is not valid for any specific block anymore. |
Dan Gohman | 2348393 | 2010-09-22 21:41:02 +0000 | [diff] [blame] | 1585 | NonLocalPointerDeps[P].Pair = BBSkipFirstBlockPair(); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1586 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1587 | // Update any entries for RemInst to use the instruction after it. |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1588 | for (auto &Entry : NLPDI) { |
| 1589 | if (Entry.getResult().getInst() != RemInst) |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1590 | continue; |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1591 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1592 | // Convert to a dirty entry for the subsequent instruction. |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1593 | Entry.setResult(NewDirtyVal); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1594 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1595 | if (Instruction *NewDirtyInst = NewDirtyVal.getInst()) |
| 1596 | ReversePtrDepsToAdd.push_back(std::make_pair(NewDirtyInst, P)); |
| 1597 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1598 | |
Chris Lattner | 3f4591c | 2009-01-23 07:12:16 +0000 | [diff] [blame] | 1599 | // Re-sort the NonLocalDepInfo. Changing the dirty entry to its |
| 1600 | // subsequent value may invalidate the sortedness. |
| 1601 | std::sort(NLPDI.begin(), NLPDI.end()); |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1602 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1603 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1604 | ReverseNonLocalPtrDeps.erase(ReversePtrDepIt); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1605 | |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1606 | while (!ReversePtrDepsToAdd.empty()) { |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1607 | ReverseNonLocalPtrDeps[ReversePtrDepsToAdd.back().first].insert( |
| 1608 | ReversePtrDepsToAdd.back().second); |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1609 | ReversePtrDepsToAdd.pop_back(); |
| 1610 | } |
| 1611 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1612 | |
Chris Lattner | 1b810bd | 2008-11-30 02:28:25 +0000 | [diff] [blame] | 1613 | assert(!NonLocalDeps.count(RemInst) && "RemInst got reinserted?"); |
Jakob Stoklund Olesen | 087f207 | 2011-01-11 04:05:39 +0000 | [diff] [blame] | 1614 | DEBUG(verifyRemoved(RemInst)); |
Owen Anderson | c0daf5f | 2007-07-06 23:14:35 +0000 | [diff] [blame] | 1615 | } |
Chandler Carruth | 40e21f2 | 2016-03-07 12:30:06 +0000 | [diff] [blame] | 1616 | |
| 1617 | /// Verify that the specified instruction does not occur in our internal data |
| 1618 | /// structures. |
| 1619 | /// |
| 1620 | /// This function verifies by asserting in debug builds. |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1621 | void MemoryDependenceResults::verifyRemoved(Instruction *D) const { |
Craig Topper | 4627679 | 2014-08-24 23:23:06 +0000 | [diff] [blame] | 1622 | #ifndef NDEBUG |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1623 | for (const auto &DepKV : LocalDeps) { |
| 1624 | assert(DepKV.first != D && "Inst occurs in data structures"); |
| 1625 | assert(DepKV.second.getInst() != D && "Inst occurs in data structures"); |
Chris Lattner | b8ec75b | 2008-11-29 21:25:10 +0000 | [diff] [blame] | 1626 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1627 | |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1628 | for (const auto &DepKV : NonLocalPointerDeps) { |
| 1629 | assert(DepKV.first.getPointer() != D && "Inst occurs in NLPD map key"); |
| 1630 | for (const auto &Entry : DepKV.second.NonLocalDeps) |
| 1631 | assert(Entry.getResult().getInst() != D && "Inst occurs as NLPD value"); |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1632 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1633 | |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1634 | for (const auto &DepKV : NonLocalDeps) { |
| 1635 | assert(DepKV.first != D && "Inst occurs in data structures"); |
| 1636 | const PerInstNLInfo &INLD = DepKV.second; |
| 1637 | for (const auto &Entry : INLD.first) |
| 1638 | assert(Entry.getResult().getInst() != D && |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1639 | "Inst occurs in data structures"); |
Chris Lattner | b8ec75b | 2008-11-29 21:25:10 +0000 | [diff] [blame] | 1640 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1641 | |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1642 | for (const auto &DepKV : ReverseLocalDeps) { |
| 1643 | assert(DepKV.first != D && "Inst occurs in data structures"); |
| 1644 | for (Instruction *Inst : DepKV.second) |
Craig Topper | 4627679 | 2014-08-24 23:23:06 +0000 | [diff] [blame] | 1645 | assert(Inst != D && "Inst occurs in data structures"); |
Chris Lattner | 1b810bd | 2008-11-30 02:28:25 +0000 | [diff] [blame] | 1646 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1647 | |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1648 | for (const auto &DepKV : ReverseNonLocalDeps) { |
| 1649 | assert(DepKV.first != D && "Inst occurs in data structures"); |
| 1650 | for (Instruction *Inst : DepKV.second) |
Craig Topper | 4627679 | 2014-08-24 23:23:06 +0000 | [diff] [blame] | 1651 | assert(Inst != D && "Inst occurs in data structures"); |
Chris Lattner | 1b810bd | 2008-11-30 02:28:25 +0000 | [diff] [blame] | 1652 | } |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1653 | |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1654 | for (const auto &DepKV : ReverseNonLocalPtrDeps) { |
| 1655 | assert(DepKV.first != D && "Inst occurs in rev NLPD map"); |
Jakub Staszak | b0a7eed | 2013-03-20 21:47:51 +0000 | [diff] [blame] | 1656 | |
Chandler Carruth | af8321e | 2016-03-07 15:12:57 +0000 | [diff] [blame] | 1657 | for (ValueIsLoadPair P : DepKV.second) |
Chandler Carruth | 60fb1b4 | 2016-03-07 10:19:30 +0000 | [diff] [blame] | 1658 | assert(P != ValueIsLoadPair(D, false) && P != ValueIsLoadPair(D, true) && |
Chris Lattner | a28355d | 2008-12-07 08:50:20 +0000 | [diff] [blame] | 1659 | "Inst occurs in ReverseNonLocalPtrDeps map"); |
| 1660 | } |
Craig Topper | 4627679 | 2014-08-24 23:23:06 +0000 | [diff] [blame] | 1661 | #endif |
Chris Lattner | b8ec75b | 2008-11-29 21:25:10 +0000 | [diff] [blame] | 1662 | } |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1663 | |
// Out-of-line definition of the analysis' static PassID member.
// NOTE(review): presumably only its address is used, as a unique key for this
// analysis -- confirm against the class declaration in the header.
char MemoryDependenceAnalysis::PassID;
| 1665 | |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1666 | MemoryDependenceResults |
Chandler Carruth | b47f801 | 2016-03-11 11:05:24 +0000 | [diff] [blame] | 1667 | MemoryDependenceAnalysis::run(Function &F, AnalysisManager<Function> &AM) { |
| 1668 | auto &AA = AM.getResult<AAManager>(F); |
| 1669 | auto &AC = AM.getResult<AssumptionAnalysis>(F); |
| 1670 | auto &TLI = AM.getResult<TargetLibraryAnalysis>(F); |
Chandler Carruth | aef32bd | 2016-03-11 13:46:00 +0000 | [diff] [blame] | 1671 | auto &DT = AM.getResult<DominatorTreeAnalysis>(F); |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1672 | return MemoryDependenceResults(AA, AC, TLI, DT); |
| 1673 | } |
| 1674 | |
// Static ID of the wrapper pass; the constructor below hands it to the
// FunctionPass base class.
char MemoryDependenceWrapperPass::ID = 0;
| 1676 | |
// Pass-initialization boilerplate for MemoryDependenceWrapperPass, using the
// argument name "memdep" and listing the four passes it depends on.
// NOTE(review): the trailing `false, true` arguments are presumably the
// CFG-only and is-analysis flags -- confirm against the INITIALIZE_PASS macro
// definitions.
INITIALIZE_PASS_BEGIN(MemoryDependenceWrapperPass, "memdep",
                      "Memory Dependence Analysis", false, true)
INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)
INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass)
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass)
INITIALIZE_PASS_END(MemoryDependenceWrapperPass, "memdep",
                    "Memory Dependence Analysis", false, true)
| 1685 | |
| 1686 | MemoryDependenceWrapperPass::MemoryDependenceWrapperPass() : FunctionPass(ID) { |
| 1687 | initializeMemoryDependenceWrapperPassPass(*PassRegistry::getPassRegistry()); |
| 1688 | } |
| 1689 | MemoryDependenceWrapperPass::~MemoryDependenceWrapperPass() {} |
| 1690 | |
/// Drop the cached results by resetting MemDep.
void MemoryDependenceWrapperPass::releaseMemory() {
  MemDep.reset();
}
| 1694 | |
/// Declare what this pass requires and preserves.
///
/// The pass preserves all other analyses and requires the assumption cache,
/// dominator tree, alias analysis and target library info passes.
void MemoryDependenceWrapperPass::getAnalysisUsage(AnalysisUsage &AU) const {
  AU.setPreservesAll();
  AU.addRequired<AssumptionCacheTracker>();
  AU.addRequired<DominatorTreeWrapperPass>();
  // NOTE(review): AA and TLI are required transitively, presumably because
  // the results object built in runOnFunction keeps using them after this
  // pass has run -- confirm.
  AU.addRequiredTransitive<AAResultsWrapperPass>();
  AU.addRequiredTransitive<TargetLibraryInfoWrapperPass>();
}
| 1702 | |
| 1703 | bool MemoryDependenceWrapperPass::runOnFunction(Function &F) { |
| 1704 | auto &AA = getAnalysis<AAResultsWrapperPass>().getAAResults(); |
| 1705 | auto &AC = getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F); |
| 1706 | auto &TLI = getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(); |
Chandler Carruth | aef32bd | 2016-03-11 13:46:00 +0000 | [diff] [blame] | 1707 | auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree(); |
| 1708 | MemDep.emplace(AA, AC, TLI, DT); |
Chandler Carruth | 61440d2 | 2016-03-10 00:55:30 +0000 | [diff] [blame] | 1709 | return false; |
| 1710 | } |
| 1711 | |