Chris Lattner | 44d2c35 | 2003-10-13 03:32:08 +0000 | [diff] [blame] | 1 | //===-- ProfilePaths.cpp - interface to insert instrumentation --*- C++ -*-===// |
John Criswell | 482202a | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file was developed by the LLVM research group and is distributed under |
| 6 | // the University of Illinois Open Source License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 9 | // |
// This inserts instrumentation for counting execution of paths through a given
// function. It's implemented as a "Function" Pass, and called using opt
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 12 | // |
| 13 | // This pass is implemented by using algorithms similar to |
| 14 | // 1."Efficient Path Profiling": Ball, T. and Larus, J. R., |
Chris Lattner | 44d2c35 | 2003-10-13 03:32:08 +0000 | [diff] [blame] | 15 | // Proceedings of Micro-29, Dec 1996, Paris, France. |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 16 | // 2."Efficiently Counting Program events with support for on-line |
| 17 | // "queries": Ball T., ACM Transactions on Programming Languages |
Chris Lattner | 44d2c35 | 2003-10-13 03:32:08 +0000 | [diff] [blame] | 18 | // and systems, Sep 1994. |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 19 | // |
Chris Lattner | 44d2c35 | 2003-10-13 03:32:08 +0000 | [diff] [blame] | 20 | // The algorithms work on a Graph constructed over the nodes made from Basic |
| 21 | // Blocks: The transformations then take place on the constructed graph |
| 22 | // (implementation in Graph.cpp and GraphAuxiliary.cpp) and finally, appropriate |
| 23 | // instrumentation is placed over suitable edges. (code inserted through |
| 24 | // EdgeCode.cpp). |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 25 | // |
// The algorithm inserts code such that every acyclic path in the CFG of a
// function is identified through a unique number. The code insertion is optimal
// in the sense that it's inserted over a minimal set of edges. Also, the
// algorithm makes sure that initialization, path increment and counter update
// can be collapsed into minimum number of edges.
| 31 | // |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 32 | //===----------------------------------------------------------------------===// |
| 33 | |
Chris Lattner | 15435fd | 2002-05-07 19:18:48 +0000 | [diff] [blame] | 34 | #include "llvm/Transforms/Utils/UnifyFunctionExitNodes.h" |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 35 | #include "llvm/Support/CFG.h" |
Chris Lattner | ca14237 | 2002-04-28 19:55:58 +0000 | [diff] [blame] | 36 | #include "llvm/Constants.h" |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 37 | #include "llvm/DerivedTypes.h" |
| 38 | #include "llvm/iMemory.h" |
Anand Shukla | 2fd8edd | 2003-06-05 06:02:46 +0000 | [diff] [blame] | 39 | #include "llvm/iOperators.h" |
| 40 | #include "llvm/iOther.h" |
Anand Shukla | 77dca14 | 2002-09-20 16:44:35 +0000 | [diff] [blame] | 41 | #include "llvm/Module.h" |
Chris Lattner | 2f04a0d | 2003-01-14 22:33:56 +0000 | [diff] [blame] | 42 | #include "Graph.h" |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 43 | #include <fstream> |
Brian Gaeke | b8a4ed6 | 2003-10-10 18:46:52 +0000 | [diff] [blame] | 44 | #include <cstdio> |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 45 | |
Chris Lattner | 37104aa | 2002-04-29 14:57:45 +0000 | [diff] [blame] | 46 | struct ProfilePaths : public FunctionPass { |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 47 | bool runOnFunction(Function &F); |
Chris Lattner | d209550 | 2002-02-26 20:04:59 +0000 | [diff] [blame] | 48 | |
| 49 | // Before this pass, make sure that there is only one |
Chris Lattner | 62b7fd1 | 2002-04-07 20:49:59 +0000 | [diff] [blame] | 50 | // entry and only one exit node for the function in the CFG of the function |
Chris Lattner | d209550 | 2002-02-26 20:04:59 +0000 | [diff] [blame] | 51 | // |
Chris Lattner | c8e6654 | 2002-04-27 06:56:12 +0000 | [diff] [blame] | 52 | void ProfilePaths::getAnalysisUsage(AnalysisUsage &AU) const { |
Chris Lattner | 40eb9da | 2002-08-08 19:01:28 +0000 | [diff] [blame] | 53 | AU.addRequired<UnifyFunctionExitNodes>(); |
Chris Lattner | d209550 | 2002-02-26 20:04:59 +0000 | [diff] [blame] | 54 | } |
| 55 | }; |
| 56 | |
// Register ProfilePaths through RegisterOpt under the name "paths" with the
// description "Profile Paths".
static RegisterOpt<ProfilePaths> X("paths", "Profile Paths");
Chris Lattner | b28b680 | 2002-07-23 18:06:35 +0000 | [diff] [blame] | 58 | |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 59 | static Node *findBB(std::vector<Node *> &st, BasicBlock *BB){ |
| 60 | for(std::vector<Node *>::iterator si=st.begin(); si!=st.end(); ++si){ |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 61 | if(((*si)->getElement())==BB){ |
| 62 | return *si; |
| 63 | } |
| 64 | } |
| 65 | return NULL; |
| 66 | } |
| 67 | |
Chris Lattner | 62b7fd1 | 2002-04-07 20:49:59 +0000 | [diff] [blame] | 68 | //Per function pass for inserting counters and trigger code |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 69 | bool ProfilePaths::runOnFunction(Function &F){ |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 70 | |
| 71 | static int mn = -1; |
Anand Shukla | 2fd8edd | 2003-06-05 06:02:46 +0000 | [diff] [blame] | 72 | static int CountCounter = 1; |
Anand Shukla | fd61c60 | 2002-07-18 20:56:47 +0000 | [diff] [blame] | 73 | if(F.isExternal()) { |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 74 | return false; |
| 75 | } |
| 76 | |
| 77 | //increment counter for instrumented functions. mn is now function# |
| 78 | mn++; |
| 79 | |
Chris Lattner | f998685 | 2002-04-27 07:27:19 +0000 | [diff] [blame] | 80 | // Transform the cfg s.t. we have just one exit node |
Chris Lattner | 10a032a | 2003-09-10 20:35:33 +0000 | [diff] [blame] | 81 | BasicBlock *ExitNode = |
| 82 | getAnalysis<UnifyFunctionExitNodes>().getReturnBlock(); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 83 | |
| 84 | //iterating over BBs and making graph |
| 85 | std::vector<Node *> nodes; |
| 86 | std::vector<Edge> edges; |
| 87 | |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 88 | Node *tmp; |
Chris Lattner | a2620ac | 2002-11-09 00:49:43 +0000 | [diff] [blame] | 89 | Node *exitNode = 0, *startNode = 0; |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 90 | |
Misha Brukman | 8b2bd4e | 2003-10-10 17:57:28 +0000 | [diff] [blame] | 91 | // The nodes must be uniquely identified: |
Chris Lattner | f998685 | 2002-04-27 07:27:19 +0000 | [diff] [blame] | 92 | // That is, no two nodes must hav same BB* |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 93 | |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 94 | for (Function::iterator BB = F.begin(), BE = F.end(); BB != BE; ++BB) { |
| 95 | Node *nd=new Node(BB); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 96 | nodes.push_back(nd); |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 97 | if(&*BB == ExitNode) |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 98 | exitNode=nd; |
Chris Lattner | 889f620 | 2003-04-23 16:37:45 +0000 | [diff] [blame] | 99 | if(BB==F.begin()) |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 100 | startNode=nd; |
| 101 | } |
| 102 | |
Misha Brukman | 8b2bd4e | 2003-10-10 17:57:28 +0000 | [diff] [blame] | 103 | // now do it again to insert edges |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 104 | for (Function::iterator BB = F.begin(), BE = F.end(); BB != BE; ++BB){ |
| 105 | Node *nd=findBB(nodes, BB); |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 106 | assert(nd && "No node for this edge!"); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 107 | |
Chris Lattner | a940095 | 2003-09-24 22:06:25 +0000 | [diff] [blame] | 108 | for(succ_iterator s=succ_begin(BB), se=succ_end(BB); s!=se; ++s){ |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 109 | Node *nd2=findBB(nodes,*s); |
| 110 | assert(nd2 && "No node for this edge!"); |
| 111 | Edge ed(nd,nd2,0); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 112 | edges.push_back(ed); |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 113 | } |
| 114 | } |
| 115 | |
| 116 | Graph g(nodes,edges, startNode, exitNode); |
| 117 | |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 118 | #ifdef DEBUG_PATH_PROFILES |
| 119 | std::cerr<<"Original graph\n"; |
| 120 | printGraph(g); |
| 121 | #endif |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 122 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 123 | BasicBlock *fr = &F.front(); |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 124 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 125 | // The graph is made acyclic: this is done |
| 126 | // by removing back edges for now, and adding them later on |
Chris Lattner | 10a032a | 2003-09-10 20:35:33 +0000 | [diff] [blame] | 127 | std::vector<Edge> be; |
Anand Shukla | fd61c60 | 2002-07-18 20:56:47 +0000 | [diff] [blame] | 128 | std::map<Node *, int> nodePriority; //it ranks nodes in depth first order traversal |
| 129 | g.getBackEdges(be, nodePriority); |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 130 | |
| 131 | #ifdef DEBUG_PATH_PROFILES |
| 132 | std::cerr<<"BackEdges-------------\n"; |
Chris Lattner | 10a032a | 2003-09-10 20:35:33 +0000 | [diff] [blame] | 133 | for (std::vector<Edge>::iterator VI=be.begin(); VI!=be.end(); ++VI){ |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 134 | printEdge(*VI); |
| 135 | cerr<<"\n"; |
| 136 | } |
| 137 | std::cerr<<"------\n"; |
| 138 | #endif |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 139 | |
| 140 | #ifdef DEBUG_PATH_PROFILES |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 141 | cerr<<"Backedges:"<<be.size()<<endl; |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 142 | #endif |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 143 | //Now we need to reflect the effect of back edges |
| 144 | //This is done by adding dummy edges |
| 145 | //If a->b is a back edge |
| 146 | //Then we add 2 back edges for it: |
| 147 | //1. from root->b (in vector stDummy) |
| 148 | //and 2. from a->exit (in vector exDummy) |
Chris Lattner | 10a032a | 2003-09-10 20:35:33 +0000 | [diff] [blame] | 149 | std::vector<Edge> stDummy; |
| 150 | std::vector<Edge> exDummy; |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 151 | addDummyEdges(stDummy, exDummy, g, be); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 152 | |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 153 | #ifdef DEBUG_PATH_PROFILES |
| 154 | std::cerr<<"After adding dummy edges\n"; |
| 155 | printGraph(g); |
| 156 | #endif |
| 157 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 158 | // Now, every edge in the graph is assigned a weight |
| 159 | // This weight later adds on to assign path |
| 160 | // numbers to different paths in the graph |
| 161 | // All paths for now are acyclic, |
| 162 | // since no back edges in the graph now |
| 163 | // numPaths is the number of acyclic paths in the graph |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 164 | int numPaths=valueAssignmentToEdges(g, nodePriority, be); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 165 | |
Anand Shukla | f8c09ee | 2003-02-14 20:41:53 +0000 | [diff] [blame] | 166 | //if(numPaths<=1) return false; |
| 167 | |
Anand Shukla | 2fd8edd | 2003-06-05 06:02:46 +0000 | [diff] [blame] | 168 | static GlobalVariable *threshold = NULL; |
| 169 | static bool insertedThreshold = false; |
| 170 | |
| 171 | if(!insertedThreshold){ |
| 172 | threshold = new GlobalVariable(Type::IntTy, false, |
| 173 | GlobalValue::ExternalLinkage, 0, |
| 174 | "reopt_threshold"); |
| 175 | |
| 176 | F.getParent()->getGlobalList().push_back(threshold); |
| 177 | insertedThreshold = true; |
| 178 | } |
| 179 | |
| 180 | assert(threshold && "GlobalVariable threshold not defined!"); |
| 181 | |
| 182 | |
| 183 | if(fr->getParent()->getName() == "main"){ |
Misha Brukman | 8b2bd4e | 2003-10-10 17:57:28 +0000 | [diff] [blame] | 184 | //initialize threshold |
Chris Lattner | 25bc3f8 | 2003-08-31 00:21:59 +0000 | [diff] [blame] | 185 | |
| 186 | // FIXME: THIS IS HORRIBLY BROKEN. FUNCTION PASSES CANNOT DO THIS, EXCEPT |
| 187 | // IN THEIR INITIALIZE METHOD!! |
| 188 | Function *initialize = |
| 189 | F.getParent()->getOrInsertFunction("reoptimizerInitialize", Type::VoidTy, |
| 190 | PointerType::get(Type::IntTy), 0); |
Anand Shukla | 2fd8edd | 2003-06-05 06:02:46 +0000 | [diff] [blame] | 191 | |
Chris Lattner | 10a032a | 2003-09-10 20:35:33 +0000 | [diff] [blame] | 192 | std::vector<Value *> trargs; |
Anand Shukla | 2fd8edd | 2003-06-05 06:02:46 +0000 | [diff] [blame] | 193 | trargs.push_back(threshold); |
Chris Lattner | 25bc3f8 | 2003-08-31 00:21:59 +0000 | [diff] [blame] | 194 | new CallInst(initialize, trargs, "", fr->begin()); |
Anand Shukla | 2fd8edd | 2003-06-05 06:02:46 +0000 | [diff] [blame] | 195 | } |
| 196 | |
| 197 | |
Anand Shukla | fd61c60 | 2002-07-18 20:56:47 +0000 | [diff] [blame] | 198 | if(numPaths<=1 || numPaths >5000) return false; |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 199 | |
| 200 | #ifdef DEBUG_PATH_PROFILES |
| 201 | printGraph(g); |
| 202 | #endif |
| 203 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 204 | //create instruction allocation r and count |
| 205 | //r is the variable that'll act like an accumulator |
| 206 | //all along the path, we just add edge values to r |
| 207 | //and at the end, r reflects the path number |
| 208 | //count is an array: count[x] would store |
| 209 | //the number of executions of path numbered x |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 210 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 211 | Instruction *rVar=new |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 212 | AllocaInst(Type::IntTy, |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 213 | ConstantUInt::get(Type::UIntTy,1),"R"); |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 214 | |
Anand Shukla | f8c09ee | 2003-02-14 20:41:53 +0000 | [diff] [blame] | 215 | //Instruction *countVar=new |
| 216 | //AllocaInst(Type::IntTy, |
| 217 | // ConstantUInt::get(Type::UIntTy, numPaths), "Count"); |
| 218 | |
| 219 | //initialize counter array! |
| 220 | std::vector<Constant*> arrayInitialize; |
| 221 | for(int xi=0; xi<numPaths; xi++) |
| 222 | arrayInitialize.push_back(ConstantSInt::get(Type::IntTy, 0)); |
| 223 | |
Chris Lattner | 379a8d2 | 2003-04-16 20:28:45 +0000 | [diff] [blame] | 224 | const ArrayType *ATy = ArrayType::get(Type::IntTy, numPaths); |
| 225 | Constant *initializer = ConstantArray::get(ATy, arrayInitialize); |
Anand Shukla | 2fd8edd | 2003-06-05 06:02:46 +0000 | [diff] [blame] | 226 | char tempChar[20]; |
| 227 | sprintf(tempChar, "Count%d", CountCounter); |
| 228 | CountCounter++; |
| 229 | std::string countStr = tempChar; |
Chris Lattner | 379a8d2 | 2003-04-16 20:28:45 +0000 | [diff] [blame] | 230 | GlobalVariable *countVar = new GlobalVariable(ATy, false, |
| 231 | GlobalValue::InternalLinkage, |
Anand Shukla | 2fd8edd | 2003-06-05 06:02:46 +0000 | [diff] [blame] | 232 | initializer, countStr, |
Chris Lattner | 379a8d2 | 2003-04-16 20:28:45 +0000 | [diff] [blame] | 233 | F.getParent()); |
Anand Shukla | 2fd8edd | 2003-06-05 06:02:46 +0000 | [diff] [blame] | 234 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 235 | // insert initialization code in first (entry) BB |
| 236 | // this includes initializing r and count |
Chris Lattner | 5dac64f | 2003-09-20 14:39:18 +0000 | [diff] [blame] | 237 | insertInTopBB(&F.getEntryBlock(), numPaths, rVar, threshold); |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 238 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 239 | //now process the graph: get path numbers, |
| 240 | //get increments along different paths, |
| 241 | //and assign "increments" and "updates" (to r and count) |
| 242 | //"optimally". Finally, insert llvm code along various edges |
Anand Shukla | 77dca14 | 2002-09-20 16:44:35 +0000 | [diff] [blame] | 243 | processGraph(g, rVar, countVar, be, stDummy, exDummy, numPaths, mn, |
| 244 | threshold); |
Anand Shukla | fd61c60 | 2002-07-18 20:56:47 +0000 | [diff] [blame] | 245 | |
Chris Lattner | 62b7fd1 | 2002-04-07 20:49:59 +0000 | [diff] [blame] | 246 | return true; // Always modifies function |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 247 | } |