Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 1 | //===-- ProfilePaths.cpp - interface to insert instrumentation ---*- C++ -*--=// |
| 2 | // |
| 3 | // This inserts instrumentation for counting |
Chris Lattner | 62b7fd1 | 2002-04-07 20:49:59 +0000 | [diff] [blame] | 4 | // execution of paths through a given function. |
| 5 | // It's implemented as a "Function" Pass, and called using opt |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 6 | // |
| 7 | // This pass is implemented by using algorithms similar to |
| 8 | // 1."Efficient Path Profiling": Ball, T. and Larus, J. R., |
| 9 | // Proceedings of Micro-29, Dec 1996, Paris, France. |
| 10 | // 2."Efficiently Counting Program events with support for on-line |
| 11 | // queries": Ball T., ACM Transactions on Programming Languages |
| 12 | // and systems, Sep 1994. |
| 13 | // |
| 14 | // The algorithms work on a Graph constructed over the nodes |
| 15 | // made from Basic Blocks: The transformations then take place on |
| 16 | // the constructed graph (implementation in Graph.cpp and GraphAuxillary.cpp) |
| 17 | // and finally, appropriate instrumentation is placed over suitable edges. |
| 18 | // (code inserted through EdgeCode.cpp). |
| 19 | // |
| 20 | // The algorithm inserts code such that every acyclic path in the CFG |
Chris Lattner | 62b7fd1 | 2002-04-07 20:49:59 +0000 | [diff] [blame] | 21 | // of a function is identified through a unique number. The code insertion |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 22 | // is optimal in the sense that it's inserted over a minimal set of edges. Also, |
| 23 | // the algorithm makes sure that initialization, path increment and counter |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 24 | // update can be collapsed into a minimum number of edges. |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 25 | //===----------------------------------------------------------------------===// |
| 26 | |
| 27 | #include "llvm/Transforms/Instrumentation/ProfilePaths.h" |
Chris Lattner | 15435fd | 2002-05-07 19:18:48 +0000 | [diff] [blame] | 28 | #include "llvm/Transforms/Utils/UnifyFunctionExitNodes.h" |
Anand Shukla | 77dca14 | 2002-09-20 16:44:35 +0000 | [diff] [blame] | 29 | #include "llvm/Transforms/Instrumentation/Graph.h" |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 30 | #include "llvm/Support/CFG.h" |
Chris Lattner | ca14237 | 2002-04-28 19:55:58 +0000 | [diff] [blame] | 31 | #include "llvm/Constants.h" |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 32 | #include "llvm/DerivedTypes.h" |
| 33 | #include "llvm/iMemory.h" |
Anand Shukla | 77dca14 | 2002-09-20 16:44:35 +0000 | [diff] [blame] | 34 | #include "llvm/GlobalVariable.h" |
| 35 | #include "llvm/Module.h" |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 36 | #include <iostream> |
| 37 | #include <fstream> |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 38 | |
| 39 | using std::vector; |
| 40 | |
Chris Lattner | 37104aa | 2002-04-29 14:57:45 +0000 | [diff] [blame] | 41 | struct ProfilePaths : public FunctionPass { |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 42 | bool runOnFunction(Function &F); |
Chris Lattner | d209550 | 2002-02-26 20:04:59 +0000 | [diff] [blame] | 43 | |
| 44 | // Before this pass, make sure that there is only one |
Chris Lattner | 62b7fd1 | 2002-04-07 20:49:59 +0000 | [diff] [blame] | 45 | // entry and only one exit node for the function in the CFG of the function |
Chris Lattner | d209550 | 2002-02-26 20:04:59 +0000 | [diff] [blame] | 46 | // |
Chris Lattner | c8e6654 | 2002-04-27 06:56:12 +0000 | [diff] [blame] | 47 | void ProfilePaths::getAnalysisUsage(AnalysisUsage &AU) const { |
Chris Lattner | 40eb9da | 2002-08-08 19:01:28 +0000 | [diff] [blame] | 48 | AU.addRequired<UnifyFunctionExitNodes>(); |
Chris Lattner | d209550 | 2002-02-26 20:04:59 +0000 | [diff] [blame] | 49 | } |
| 50 | }; |
| 51 | |
Chris Lattner | a2c0985 | 2002-07-26 21:12:44 +0000 | [diff] [blame] | 52 | static RegisterOpt<ProfilePaths> X("paths", "Profile Paths"); |
Chris Lattner | b28b680 | 2002-07-23 18:06:35 +0000 | [diff] [blame] | 53 | |
Chris Lattner | d209550 | 2002-02-26 20:04:59 +0000 | [diff] [blame] | 54 | // createProfilePathsPass - Create a new pass to add path profiling |
| 55 | // |
| 56 | Pass *createProfilePathsPass() { |
| 57 | return new ProfilePaths(); |
| 58 | } |
| 59 | |
| 60 | |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 61 | static Node *findBB(std::vector<Node *> &st, BasicBlock *BB){ |
| 62 | for(std::vector<Node *>::iterator si=st.begin(); si!=st.end(); ++si){ |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 63 | if(((*si)->getElement())==BB){ |
| 64 | return *si; |
| 65 | } |
| 66 | } |
| 67 | return NULL; |
| 68 | } |
| 69 | |
Chris Lattner | 62b7fd1 | 2002-04-07 20:49:59 +0000 | [diff] [blame] | 70 | //Per function pass for inserting counters and trigger code |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 71 | bool ProfilePaths::runOnFunction(Function &F){ |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 72 | |
| 73 | static int mn = -1; |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 74 | |
Anand Shukla | fd61c60 | 2002-07-18 20:56:47 +0000 | [diff] [blame] | 75 | if(F.isExternal()) { |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 76 | return false; |
| 77 | } |
| 78 | |
| 79 | //increment counter for instrumented functions. mn is now function# |
| 80 | mn++; |
| 81 | |
Chris Lattner | f998685 | 2002-04-27 07:27:19 +0000 | [diff] [blame] | 82 | // Transform the cfg s.t. we have just one exit node |
| 83 | BasicBlock *ExitNode = getAnalysis<UnifyFunctionExitNodes>().getExitNode(); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 84 | |
| 85 | //iterating over BBs and making graph |
| 86 | std::vector<Node *> nodes; |
| 87 | std::vector<Edge> edges; |
| 88 | |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 89 | Node *tmp; |
| 90 | Node *exitNode, *startNode; |
| 91 | |
Chris Lattner | f998685 | 2002-04-27 07:27:19 +0000 | [diff] [blame] | 92 | // The nodes must be uniquesly identified: |
| 93 | // That is, no two nodes must hav same BB* |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 94 | |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 95 | for (Function::iterator BB = F.begin(), BE = F.end(); BB != BE; ++BB) { |
| 96 | Node *nd=new Node(BB); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 97 | nodes.push_back(nd); |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 98 | if(&*BB == ExitNode) |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 99 | exitNode=nd; |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 100 | if(&*BB==F.begin()) |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 101 | startNode=nd; |
| 102 | } |
| 103 | |
Chris Lattner | f998685 | 2002-04-27 07:27:19 +0000 | [diff] [blame] | 104 | // now do it againto insert edges |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 105 | for (Function::iterator BB = F.begin(), BE = F.end(); BB != BE; ++BB){ |
| 106 | Node *nd=findBB(nodes, BB); |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 107 | assert(nd && "No node for this edge!"); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 108 | |
Chris Lattner | 7076ff2 | 2002-06-25 16:13:21 +0000 | [diff] [blame] | 109 | for(BasicBlock::succ_iterator s=succ_begin(BB), se=succ_end(BB); |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 110 | s!=se; ++s){ |
| 111 | Node *nd2=findBB(nodes,*s); |
| 112 | assert(nd2 && "No node for this edge!"); |
| 113 | Edge ed(nd,nd2,0); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 114 | edges.push_back(ed); |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 115 | } |
| 116 | } |
| 117 | |
| 118 | Graph g(nodes,edges, startNode, exitNode); |
| 119 | |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 120 | #ifdef DEBUG_PATH_PROFILES |
| 121 | std::cerr<<"Original graph\n"; |
| 122 | printGraph(g); |
| 123 | #endif |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 124 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 125 | BasicBlock *fr = &F.front(); |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 126 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 127 | // The graph is made acyclic: this is done |
| 128 | // by removing back edges for now, and adding them later on |
| 129 | vector<Edge> be; |
Anand Shukla | fd61c60 | 2002-07-18 20:56:47 +0000 | [diff] [blame] | 130 | std::map<Node *, int> nodePriority; //it ranks nodes in depth first order traversal |
| 131 | g.getBackEdges(be, nodePriority); |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 132 | |
| 133 | #ifdef DEBUG_PATH_PROFILES |
| 134 | std::cerr<<"BackEdges-------------\n"; |
| 135 | for(vector<Edge>::iterator VI=be.begin(); VI!=be.end(); ++VI){ |
| 136 | printEdge(*VI); |
| 137 | cerr<<"\n"; |
| 138 | } |
| 139 | std::cerr<<"------\n"; |
| 140 | #endif |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 141 | |
| 142 | #ifdef DEBUG_PATH_PROFILES |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 143 | cerr<<"Backedges:"<<be.size()<<endl; |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 144 | #endif |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 145 | //Now we need to reflect the effect of back edges |
| 146 | //This is done by adding dummy edges |
| 147 | //If a->b is a back edge |
| 148 | //Then we add 2 back edges for it: |
| 149 | //1. from root->b (in vector stDummy) |
| 150 | //and 2. from a->exit (in vector exDummy) |
| 151 | vector<Edge> stDummy; |
| 152 | vector<Edge> exDummy; |
| 153 | addDummyEdges(stDummy, exDummy, g, be); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 154 | |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 155 | #ifdef DEBUG_PATH_PROFILES |
| 156 | std::cerr<<"After adding dummy edges\n"; |
| 157 | printGraph(g); |
| 158 | #endif |
| 159 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 160 | // Now, every edge in the graph is assigned a weight |
| 161 | // This weight later adds on to assign path |
| 162 | // numbers to different paths in the graph |
| 163 | // All paths for now are acyclic, |
| 164 | // since no back edges in the graph now |
| 165 | // numPaths is the number of acyclic paths in the graph |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 166 | int numPaths=valueAssignmentToEdges(g, nodePriority, be); |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 167 | |
Anand Shukla | fd61c60 | 2002-07-18 20:56:47 +0000 | [diff] [blame] | 168 | if(numPaths<=1 || numPaths >5000) return false; |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 169 | |
| 170 | #ifdef DEBUG_PATH_PROFILES |
| 171 | printGraph(g); |
| 172 | #endif |
| 173 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 174 | //create instruction allocation r and count |
| 175 | //r is the variable that'll act like an accumulator |
| 176 | //all along the path, we just add edge values to r |
| 177 | //and at the end, r reflects the path number |
| 178 | //count is an array: count[x] would store |
| 179 | //the number of executions of path numbered x |
Anand Shukla | 2190689 | 2002-06-25 21:14:58 +0000 | [diff] [blame] | 180 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 181 | Instruction *rVar=new |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 182 | AllocaInst(Type::IntTy, |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 183 | ConstantUInt::get(Type::UIntTy,1),"R"); |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 184 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 185 | Instruction *countVar=new |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 186 | AllocaInst(Type::IntTy, |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 187 | ConstantUInt::get(Type::UIntTy, numPaths), "Count"); |
Anand Shukla | d9a6af0 | 2002-09-16 05:24:49 +0000 | [diff] [blame] | 188 | |
Anand Shukla | 77dca14 | 2002-09-20 16:44:35 +0000 | [diff] [blame] | 189 | static GlobalVariable *threshold = NULL; |
| 190 | static bool insertedThreshold = false; |
| 191 | |
| 192 | if(!insertedThreshold){ |
| 193 | threshold = new GlobalVariable(Type::IntTy, false, true, 0, |
| 194 | "reopt_threshold"); |
| 195 | |
| 196 | F.getParent()->getGlobalList().push_back(threshold); |
| 197 | insertedThreshold = true; |
| 198 | } |
| 199 | |
| 200 | assert(threshold && "GlobalVariable threshold not defined!"); |
| 201 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 202 | // insert initialization code in first (entry) BB |
| 203 | // this includes initializing r and count |
Anand Shukla | 77dca14 | 2002-09-20 16:44:35 +0000 | [diff] [blame] | 204 | insertInTopBB(&F.getEntryNode(),numPaths, rVar, countVar, threshold); |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 205 | |
Anand Shukla | 11f4262 | 2002-07-08 19:36:01 +0000 | [diff] [blame] | 206 | //now process the graph: get path numbers, |
| 207 | //get increments along different paths, |
| 208 | //and assign "increments" and "updates" (to r and count) |
| 209 | //"optimally". Finally, insert llvm code along various edges |
Anand Shukla | 77dca14 | 2002-09-20 16:44:35 +0000 | [diff] [blame] | 210 | processGraph(g, rVar, countVar, be, stDummy, exDummy, numPaths, mn, |
| 211 | threshold); |
Anand Shukla | fd61c60 | 2002-07-18 20:56:47 +0000 | [diff] [blame] | 212 | |
Chris Lattner | 62b7fd1 | 2002-04-07 20:49:59 +0000 | [diff] [blame] | 213 | return true; // Always modifies function |
Anand Shukla | 70a6138 | 2002-02-26 19:00:48 +0000 | [diff] [blame] | 214 | } |