Chris Lattner | 55c1058 | 2002-10-03 20:38:41 +0000 | [diff] [blame] | 1 | //===- BottomUpClosure.cpp - Compute bottom-up interprocedural closure ----===// |
Chris Lattner | 0d9bab8 | 2002-07-18 00:12:30 +0000 | [diff] [blame] | 2 | // |
| 3 | // This file implements the BUDataStructures class, which represents the |
| 4 | // Bottom-Up Interprocedural closure of the data structure graph over the |
| 5 | // program. This is useful for applications like pool allocation, but **not** |
Chris Lattner | 55c1058 | 2002-10-03 20:38:41 +0000 | [diff] [blame] | 6 | // applications like alias analysis. |
Chris Lattner | 0d9bab8 | 2002-07-18 00:12:30 +0000 | [diff] [blame] | 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | |
Chris Lattner | 2b4c8df | 2003-06-30 05:27:53 +0000 | [diff] [blame^] | 10 | #include "DSCallSiteIterator.h" |
Chris Lattner | 0d9bab8 | 2002-07-18 00:12:30 +0000 | [diff] [blame] | 11 | #include "llvm/Analysis/DataStructure.h" |
| 12 | #include "llvm/Module.h" |
Chris Lattner | fccd06f | 2002-10-01 22:33:50 +0000 | [diff] [blame] | 13 | #include "Support/Statistic.h" |
Chris Lattner | 0d9bab8 | 2002-07-18 00:12:30 +0000 | [diff] [blame] | 14 | |
Chris Lattner | ae5f603 | 2002-11-17 22:16:28 +0000 | [diff] [blame] | 15 | namespace { |
| 16 | Statistic<> MaxSCC("budatastructure", "Maximum SCC Size in Call Graph"); |
| 17 | |
| 18 | RegisterAnalysis<BUDataStructures> |
Chris Lattner | 312edd3 | 2003-06-28 22:14:55 +0000 | [diff] [blame] | 19 | X("budatastructure", "Bottom-up Data Structure Analysis"); |
Chris Lattner | ae5f603 | 2002-11-17 22:16:28 +0000 | [diff] [blame] | 20 | } |
Chris Lattner | 0d9bab8 | 2002-07-18 00:12:30 +0000 | [diff] [blame] | 21 | |
Chris Lattner | b106043 | 2002-11-07 05:20:53 +0000 | [diff] [blame] | 22 | using namespace DS; |
Chris Lattner | 55c1058 | 2002-10-03 20:38:41 +0000 | [diff] [blame] | 23 | |
Chris Lattner | aa0b468 | 2002-11-09 21:12:07 +0000 | [diff] [blame] | 24 | // run - Calculate the bottom up data structure graphs for each function in the |
| 25 | // program. |
| 26 | // |
| 27 | bool BUDataStructures::run(Module &M) { |
Chris Lattner | 312edd3 | 2003-06-28 22:14:55 +0000 | [diff] [blame] | 28 | LocalDataStructures &LocalDSA = getAnalysis<LocalDataStructures>(); |
| 29 | GlobalsGraph = new DSGraph(LocalDSA.getGlobalsGraph()); |
Chris Lattner | 20167e3 | 2003-02-03 19:11:38 +0000 | [diff] [blame] | 30 | GlobalsGraph->setPrintAuxCalls(); |
Chris Lattner | aa0b468 | 2002-11-09 21:12:07 +0000 | [diff] [blame] | 31 | |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 32 | Function *MainFunc = M.getMainFunction(); |
| 33 | if (MainFunc) |
| 34 | calculateReachableGraphs(MainFunc); |
| 35 | |
| 36 | // Calculate the graphs for any functions that are unreachable from main... |
Chris Lattner | aa0b468 | 2002-11-09 21:12:07 +0000 | [diff] [blame] | 37 | for (Module::iterator I = M.begin(), E = M.end(); I != E; ++I) |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 38 | if (!I->isExternal() && DSInfo.find(I) == DSInfo.end()) { |
Chris Lattner | ae5f603 | 2002-11-17 22:16:28 +0000 | [diff] [blame] | 39 | #ifndef NDEBUG |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 40 | if (MainFunc) |
| 41 | std::cerr << "*** Function unreachable from main: " |
| 42 | << I->getName() << "\n"; |
Chris Lattner | ae5f603 | 2002-11-17 22:16:28 +0000 | [diff] [blame] | 43 | #endif |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 44 | calculateReachableGraphs(I); // Calculate all graphs... |
| 45 | } |
Chris Lattner | aa0b468 | 2002-11-09 21:12:07 +0000 | [diff] [blame] | 46 | return false; |
| 47 | } |
Chris Lattner | 55c1058 | 2002-10-03 20:38:41 +0000 | [diff] [blame] | 48 | |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 49 | void BUDataStructures::calculateReachableGraphs(Function *F) { |
| 50 | std::vector<Function*> Stack; |
Chris Lattner | 41c04f7 | 2003-02-01 04:52:08 +0000 | [diff] [blame] | 51 | hash_map<Function*, unsigned> ValMap; |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 52 | unsigned NextID = 1; |
| 53 | calculateGraphs(F, Stack, NextID, ValMap); |
| 54 | } |
| 55 | |
| 56 | DSGraph &BUDataStructures::getOrCreateGraph(Function *F) { |
| 57 | // Has the graph already been created? |
| 58 | DSGraph *&Graph = DSInfo[F]; |
| 59 | if (Graph) return *Graph; |
| 60 | |
| 61 | // Copy the local version into DSInfo... |
| 62 | Graph = new DSGraph(getAnalysis<LocalDataStructures>().getDSGraph(*F)); |
| 63 | |
| 64 | Graph->setGlobalsGraph(GlobalsGraph); |
| 65 | Graph->setPrintAuxCalls(); |
| 66 | |
| 67 | // Start with a copy of the original call sites... |
| 68 | Graph->getAuxFunctionCalls() = Graph->getFunctionCalls(); |
| 69 | return *Graph; |
| 70 | } |
| 71 | |
| 72 | unsigned BUDataStructures::calculateGraphs(Function *F, |
| 73 | std::vector<Function*> &Stack, |
| 74 | unsigned &NextID, |
Chris Lattner | 41c04f7 | 2003-02-01 04:52:08 +0000 | [diff] [blame] | 75 | hash_map<Function*, unsigned> &ValMap) { |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 76 | assert(ValMap.find(F) == ValMap.end() && "Shouldn't revisit functions!"); |
| 77 | unsigned Min = NextID++, MyID = Min; |
| 78 | ValMap[F] = Min; |
| 79 | Stack.push_back(F); |
| 80 | |
| 81 | if (F->isExternal()) { // sprintf, fprintf, sscanf, etc... |
| 82 | // No callees! |
| 83 | Stack.pop_back(); |
| 84 | ValMap[F] = ~0; |
| 85 | return Min; |
| 86 | } |
| 87 | |
| 88 | DSGraph &Graph = getOrCreateGraph(F); |
| 89 | |
| 90 | // The edges out of the current node are the call site targets... |
Chris Lattner | 2b4c8df | 2003-06-30 05:27:53 +0000 | [diff] [blame^] | 91 | for (DSCallSiteIterator I = DSCallSiteIterator::begin_aux(Graph), |
| 92 | E = DSCallSiteIterator::end_aux(Graph); I != E; ++I) { |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 93 | Function *Callee = *I; |
| 94 | unsigned M; |
| 95 | // Have we visited the destination function yet? |
Chris Lattner | 41c04f7 | 2003-02-01 04:52:08 +0000 | [diff] [blame] | 96 | hash_map<Function*, unsigned>::iterator It = ValMap.find(Callee); |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 97 | if (It == ValMap.end()) // No, visit it now. |
| 98 | M = calculateGraphs(Callee, Stack, NextID, ValMap); |
| 99 | else // Yes, get it's number. |
| 100 | M = It->second; |
| 101 | if (M < Min) Min = M; |
| 102 | } |
| 103 | |
| 104 | assert(ValMap[F] == MyID && "SCC construction assumption wrong!"); |
| 105 | if (Min != MyID) |
| 106 | return Min; // This is part of a larger SCC! |
| 107 | |
| 108 | // If this is a new SCC, process it now. |
| 109 | if (Stack.back() == F) { // Special case the single "SCC" case here. |
| 110 | DEBUG(std::cerr << "Visiting single node SCC #: " << MyID << " fn: " |
| 111 | << F->getName() << "\n"); |
| 112 | Stack.pop_back(); |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 113 | DSGraph &G = getDSGraph(*F); |
| 114 | DEBUG(std::cerr << " [BU] Calculating graph for: " << F->getName()<< "\n"); |
| 115 | calculateGraph(G); |
| 116 | DEBUG(std::cerr << " [BU] Done inlining: " << F->getName() << " [" |
| 117 | << G.getGraphSize() << "+" << G.getAuxFunctionCalls().size() |
| 118 | << "]\n"); |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 119 | |
Chris Lattner | ae5f603 | 2002-11-17 22:16:28 +0000 | [diff] [blame] | 120 | if (MaxSCC < 1) MaxSCC = 1; |
| 121 | |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 122 | // Should we revisit the graph? |
Chris Lattner | 2b4c8df | 2003-06-30 05:27:53 +0000 | [diff] [blame^] | 123 | if (DSCallSiteIterator::begin_aux(G) != DSCallSiteIterator::end_aux(G)) { |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 124 | ValMap.erase(F); |
| 125 | return calculateGraphs(F, Stack, NextID, ValMap); |
| 126 | } else { |
| 127 | ValMap[F] = ~0U; |
| 128 | } |
| 129 | return MyID; |
| 130 | |
| 131 | } else { |
| 132 | // SCCFunctions - Keep track of the functions in the current SCC |
| 133 | // |
Chris Lattner | 41c04f7 | 2003-02-01 04:52:08 +0000 | [diff] [blame] | 134 | hash_set<Function*> SCCFunctions; |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 135 | |
| 136 | Function *NF; |
| 137 | std::vector<Function*>::iterator FirstInSCC = Stack.end(); |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 138 | DSGraph *SCCGraph = 0; |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 139 | do { |
| 140 | NF = *--FirstInSCC; |
| 141 | ValMap[NF] = ~0U; |
| 142 | SCCFunctions.insert(NF); |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 143 | |
| 144 | // Figure out which graph is the largest one, in order to speed things up |
| 145 | // a bit in situations where functions in the SCC have widely different |
| 146 | // graph sizes. |
| 147 | DSGraph &NFGraph = getDSGraph(*NF); |
| 148 | if (!SCCGraph || SCCGraph->getGraphSize() < NFGraph.getGraphSize()) |
| 149 | SCCGraph = &NFGraph; |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 150 | } while (NF != F); |
| 151 | |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 152 | std::cerr << "Calculating graph for SCC #: " << MyID << " of size: " |
| 153 | << SCCFunctions.size() << "\n"; |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 154 | |
Chris Lattner | ae5f603 | 2002-11-17 22:16:28 +0000 | [diff] [blame] | 155 | // Compute the Max SCC Size... |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 156 | if (MaxSCC < SCCFunctions.size()) |
| 157 | MaxSCC = SCCFunctions.size(); |
Chris Lattner | ae5f603 | 2002-11-17 22:16:28 +0000 | [diff] [blame] | 158 | |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 159 | // First thing first, collapse all of the DSGraphs into a single graph for |
| 160 | // the entire SCC. We computed the largest graph, so clone all of the other |
| 161 | // (smaller) graphs into it. Discard all of the old graphs. |
| 162 | // |
| 163 | for (hash_set<Function*>::iterator I = SCCFunctions.begin(), |
| 164 | E = SCCFunctions.end(); I != E; ++I) { |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 165 | DSGraph &G = getDSGraph(**I); |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 166 | if (&G != SCCGraph) { |
| 167 | DSGraph::NodeMapTy NodeMap; |
| 168 | SCCGraph->cloneInto(G, SCCGraph->getScalarMap(), |
| 169 | SCCGraph->getReturnNodes(), NodeMap, 0); |
| 170 | // Update the DSInfo map and delete the old graph... |
| 171 | DSInfo[*I] = SCCGraph; |
| 172 | delete &G; |
| 173 | } |
| 174 | } |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 175 | |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 176 | // Now that we have one big happy family, resolve all of the call sites in |
| 177 | // the graph... |
| 178 | calculateGraph(*SCCGraph); |
| 179 | DEBUG(std::cerr << " [BU] Done inlining SCC [" << SCCGraph->getGraphSize() |
| 180 | << "+" << SCCGraph->getAuxFunctionCalls().size() << "]\n"); |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 181 | |
| 182 | std::cerr << "DONE with SCC #: " << MyID << "\n"; |
| 183 | |
| 184 | // We never have to revisit "SCC" processed functions... |
| 185 | |
| 186 | // Drop the stuff we don't need from the end of the stack |
| 187 | Stack.erase(FirstInSCC, Stack.end()); |
| 188 | return MyID; |
| 189 | } |
| 190 | |
| 191 | return MyID; // == Min |
| 192 | } |
| 193 | |
| 194 | |
Chris Lattner | 0d9bab8 | 2002-07-18 00:12:30 +0000 | [diff] [blame] | 195 | // releaseMemory - If the pass pipeline is done with this pass, we can release |
| 196 | // our memory... here... |
| 197 | // |
| 198 | void BUDataStructures::releaseMemory() { |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 199 | for (hash_map<Function*, DSGraph*>::iterator I = DSInfo.begin(), |
| 200 | E = DSInfo.end(); I != E; ++I) { |
| 201 | I->second->getReturnNodes().erase(I->first); |
| 202 | if (I->second->getReturnNodes().empty()) |
| 203 | delete I->second; |
| 204 | } |
Chris Lattner | 0d9bab8 | 2002-07-18 00:12:30 +0000 | [diff] [blame] | 205 | |
| 206 | // Empty map so next time memory is released, data structures are not |
| 207 | // re-deleted. |
| 208 | DSInfo.clear(); |
Chris Lattner | aa0b468 | 2002-11-09 21:12:07 +0000 | [diff] [blame] | 209 | delete GlobalsGraph; |
| 210 | GlobalsGraph = 0; |
Chris Lattner | 0d9bab8 | 2002-07-18 00:12:30 +0000 | [diff] [blame] | 211 | } |
| 212 | |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 213 | void BUDataStructures::calculateGraph(DSGraph &Graph) { |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 214 | // Move our call site list into TempFCs so that inline call sites go into the |
| 215 | // new call site list and doesn't invalidate our iterators! |
| 216 | std::vector<DSCallSite> TempFCs; |
| 217 | std::vector<DSCallSite> &AuxCallsList = Graph.getAuxFunctionCalls(); |
| 218 | TempFCs.swap(AuxCallsList); |
Chris Lattner | 8a5db46 | 2002-11-11 00:01:34 +0000 | [diff] [blame] | 219 | |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 220 | DSGraph::ReturnNodesTy &ReturnNodes = Graph.getReturnNodes(); |
| 221 | |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 222 | // Loop over all of the resolvable call sites |
| 223 | unsigned LastCallSiteIdx = ~0U; |
Chris Lattner | 2b4c8df | 2003-06-30 05:27:53 +0000 | [diff] [blame^] | 224 | for (DSCallSiteIterator I = DSCallSiteIterator::begin(TempFCs), |
| 225 | E = DSCallSiteIterator::end(TempFCs); I != E; ++I) { |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 226 | // If we skipped over any call sites, they must be unresolvable, copy them |
| 227 | // to the real call site list. |
| 228 | LastCallSiteIdx++; |
| 229 | for (; LastCallSiteIdx < I.getCallSiteIdx(); ++LastCallSiteIdx) |
| 230 | AuxCallsList.push_back(TempFCs[LastCallSiteIdx]); |
| 231 | LastCallSiteIdx = I.getCallSiteIdx(); |
Chris Lattner | a107905 | 2002-11-10 06:52:47 +0000 | [diff] [blame] | 232 | |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 233 | // Resolve the current call... |
| 234 | Function *Callee = *I; |
Chris Lattner | 2b4c8df | 2003-06-30 05:27:53 +0000 | [diff] [blame^] | 235 | const DSCallSite &CS = I.getCallSite(); |
Chris Lattner | 0d9bab8 | 2002-07-18 00:12:30 +0000 | [diff] [blame] | 236 | |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 237 | if (Callee->isExternal()) { |
| 238 | // Ignore this case, simple varargs functions we cannot stub out! |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 239 | } else if (ReturnNodes.find(Callee) != ReturnNodes.end()) { |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 240 | // Self recursion... simply link up the formal arguments with the |
| 241 | // actual arguments... |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 242 | DEBUG(std::cerr << " Self Inlining: " << Callee->getName() << "\n"); |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 243 | |
| 244 | // Handle self recursion by resolving the arguments and return value |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 245 | Graph.mergeInGraph(CS, *Callee, Graph, 0); |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 246 | |
| 247 | } else { |
| 248 | // Get the data structure graph for the called function. |
| 249 | // |
| 250 | DSGraph &GI = getDSGraph(*Callee); // Graph to inline |
| 251 | |
| 252 | DEBUG(std::cerr << " Inlining graph for " << Callee->getName() |
Chris Lattner | 20167e3 | 2003-02-03 19:11:38 +0000 | [diff] [blame] | 253 | << "[" << GI.getGraphSize() << "+" |
Chris Lattner | 0eea618 | 2003-06-30 05:09:58 +0000 | [diff] [blame] | 254 | << GI.getAuxFunctionCalls().size() << "] into [" |
| 255 | << Graph.getGraphSize() << "+" |
Chris Lattner | 20167e3 | 2003-02-03 19:11:38 +0000 | [diff] [blame] | 256 | << Graph.getAuxFunctionCalls().size() << "]\n"); |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 257 | |
| 258 | // Handle self recursion by resolving the arguments and return value |
Chris Lattner | 5a54063 | 2003-06-30 03:15:25 +0000 | [diff] [blame] | 259 | Graph.mergeInGraph(CS, *Callee, GI, |
Vikram S. Adve | 61ff029 | 2002-11-27 17:41:13 +0000 | [diff] [blame] | 260 | DSGraph::KeepModRefBits | |
| 261 | DSGraph::StripAllocaBit | DSGraph::DontCloneCallNodes); |
Chris Lattner | ae5f603 | 2002-11-17 22:16:28 +0000 | [diff] [blame] | 262 | |
| 263 | #if 0 |
| 264 | Graph.writeGraphToFile(std::cerr, "bu_" + F.getName() + "_after_" + |
| 265 | Callee->getName()); |
| 266 | #endif |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 267 | } |
| 268 | } |
| 269 | |
| 270 | // Make sure to catch any leftover unresolvable calls... |
| 271 | for (++LastCallSiteIdx; LastCallSiteIdx < TempFCs.size(); ++LastCallSiteIdx) |
| 272 | AuxCallsList.push_back(TempFCs[LastCallSiteIdx]); |
| 273 | |
| 274 | TempFCs.clear(); |
| 275 | |
| 276 | // Recompute the Incomplete markers. If there are any function calls left |
| 277 | // now that are complete, we must loop! |
| 278 | Graph.maskIncompleteMarkers(); |
Chris Lattner | 394471f | 2003-01-23 22:05:33 +0000 | [diff] [blame] | 279 | Graph.markIncompleteNodes(DSGraph::MarkFormalArgs); |
Chris Lattner | 20167e3 | 2003-02-03 19:11:38 +0000 | [diff] [blame] | 280 | // FIXME: materialize nodes from the globals graph as neccesary... |
Chris Lattner | 394471f | 2003-01-23 22:05:33 +0000 | [diff] [blame] | 281 | Graph.removeDeadNodes(DSGraph::KeepUnreachableGlobals); |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 282 | |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 283 | //Graph.writeGraphToFile(std::cerr, "bu_" + F.getName()); |
Chris Lattner | a9c9c02 | 2002-11-11 21:35:13 +0000 | [diff] [blame] | 284 | } |
| 285 | |