blob: 95cd5bea9a90a182454b87b7205930ee8bd80148 [file] [log] [blame]
//===-- ProfilePaths.cpp - interface to insert instrumentation ---*- C++ -*--=//
//
// This inserts instrumentation for counting
// execution of paths through a given function.
// It is implemented as a "Function" Pass, and called using opt.
//
// This pass is implemented by using algorithms similar to
// 1. "Efficient Path Profiling": Ball, T. and Larus, J. R.,
//    Proceedings of Micro-29, Dec 1996, Paris, France.
// 2. "Efficiently Counting Program Events with Support for On-line
//    Queries": Ball, T., ACM Transactions on Programming Languages
//    and Systems, Sep 1994.
//
// The algorithms work on a Graph constructed over the nodes
// made from Basic Blocks: The transformations then take place on
// the constructed graph (implementation in Graph.cpp and GraphAuxillary.cpp)
// and finally, appropriate instrumentation is placed over suitable edges
// (code inserted through EdgeCode.cpp).
//
// The algorithm inserts code such that every acyclic path in the CFG
// of a function is identified through a unique number. The code insertion
// is optimal in the sense that it is inserted over a minimal set of edges. Also,
// the algorithm makes sure that initialization, path increment and counter
// update can be collapsed into a minimum number of edges.
//===----------------------------------------------------------------------===//
26
27#include "llvm/Transforms/Instrumentation/ProfilePaths.h"
Chris Lattner15435fd2002-05-07 19:18:48 +000028#include "llvm/Transforms/Utils/UnifyFunctionExitNodes.h"
Anand Shukla70a61382002-02-26 19:00:48 +000029#include "llvm/Support/CFG.h"
Chris Lattnerca142372002-04-28 19:55:58 +000030#include "llvm/Constants.h"
Anand Shukla70a61382002-02-26 19:00:48 +000031#include "llvm/DerivedTypes.h"
32#include "llvm/iMemory.h"
Anand Shukla21906892002-06-25 21:14:58 +000033#include "llvm/Transforms/Instrumentation/Graph.h"
34#include <iostream>
35#include <fstream>
Anand Shukla70a61382002-02-26 19:00:48 +000036
37using std::vector;
38
Chris Lattner37104aa2002-04-29 14:57:45 +000039struct ProfilePaths : public FunctionPass {
Chris Lattner7076ff22002-06-25 16:13:21 +000040 bool runOnFunction(Function &F);
Chris Lattnerd2095502002-02-26 20:04:59 +000041
42 // Before this pass, make sure that there is only one
Chris Lattner62b7fd12002-04-07 20:49:59 +000043 // entry and only one exit node for the function in the CFG of the function
Chris Lattnerd2095502002-02-26 20:04:59 +000044 //
Chris Lattnerc8e66542002-04-27 06:56:12 +000045 void ProfilePaths::getAnalysisUsage(AnalysisUsage &AU) const {
Chris Lattnerf9986852002-04-27 07:27:19 +000046 AU.addRequired(UnifyFunctionExitNodes::ID);
Chris Lattnerd2095502002-02-26 20:04:59 +000047 }
48};
49
Chris Lattnerb28b6802002-07-23 18:06:35 +000050static RegisterPass<ProfilePaths> X("paths", "Profile Paths");
51
Chris Lattnerd2095502002-02-26 20:04:59 +000052// createProfilePathsPass - Create a new pass to add path profiling
53//
54Pass *createProfilePathsPass() {
55 return new ProfilePaths();
56}
57
58
Anand Shukla21906892002-06-25 21:14:58 +000059static Node *findBB(std::vector<Node *> &st, BasicBlock *BB){
60 for(std::vector<Node *>::iterator si=st.begin(); si!=st.end(); ++si){
Anand Shukla70a61382002-02-26 19:00:48 +000061 if(((*si)->getElement())==BB){
62 return *si;
63 }
64 }
65 return NULL;
66}
67
Chris Lattner62b7fd12002-04-07 20:49:59 +000068//Per function pass for inserting counters and trigger code
Chris Lattner7076ff22002-06-25 16:13:21 +000069bool ProfilePaths::runOnFunction(Function &F){
Anand Shukla21906892002-06-25 21:14:58 +000070
71 static int mn = -1;
Anand Shukla11f42622002-07-08 19:36:01 +000072
Anand Shuklafd61c602002-07-18 20:56:47 +000073 if(F.isExternal()) {
Anand Shukla11f42622002-07-08 19:36:01 +000074 return false;
75 }
76
Anand Shuklafd61c602002-07-18 20:56:47 +000077 //std::cerr<<"Instrumenting\n-----------------\n";
78 //std::cerr<<F;
Anand Shukla11f42622002-07-08 19:36:01 +000079 //increment counter for instrumented functions. mn is now function#
80 mn++;
81
82 //std::cerr<<"MN = "<<mn<<"\n";;
83 //std::cerr<<F;
84
Chris Lattnerf9986852002-04-27 07:27:19 +000085 // Transform the cfg s.t. we have just one exit node
86 BasicBlock *ExitNode = getAnalysis<UnifyFunctionExitNodes>().getExitNode();
Anand Shukla21906892002-06-25 21:14:58 +000087
88 //iterating over BBs and making graph
89 std::vector<Node *> nodes;
90 std::vector<Edge> edges;
91
Anand Shukla70a61382002-02-26 19:00:48 +000092 Node *tmp;
93 Node *exitNode, *startNode;
94
Chris Lattnerf9986852002-04-27 07:27:19 +000095 // The nodes must be uniquesly identified:
96 // That is, no two nodes must hav same BB*
Anand Shukla70a61382002-02-26 19:00:48 +000097
Chris Lattner7076ff22002-06-25 16:13:21 +000098 for (Function::iterator BB = F.begin(), BE = F.end(); BB != BE; ++BB) {
99 Node *nd=new Node(BB);
Anand Shukla21906892002-06-25 21:14:58 +0000100 nodes.push_back(nd);
Chris Lattner7076ff22002-06-25 16:13:21 +0000101 if(&*BB == ExitNode)
Anand Shukla70a61382002-02-26 19:00:48 +0000102 exitNode=nd;
Chris Lattner7076ff22002-06-25 16:13:21 +0000103 if(&*BB==F.begin())
Anand Shukla70a61382002-02-26 19:00:48 +0000104 startNode=nd;
105 }
106
Chris Lattnerf9986852002-04-27 07:27:19 +0000107 // now do it againto insert edges
Chris Lattner7076ff22002-06-25 16:13:21 +0000108 for (Function::iterator BB = F.begin(), BE = F.end(); BB != BE; ++BB){
109 Node *nd=findBB(nodes, BB);
Anand Shukla70a61382002-02-26 19:00:48 +0000110 assert(nd && "No node for this edge!");
Anand Shukla21906892002-06-25 21:14:58 +0000111
Chris Lattner7076ff22002-06-25 16:13:21 +0000112 for(BasicBlock::succ_iterator s=succ_begin(BB), se=succ_end(BB);
Anand Shukla70a61382002-02-26 19:00:48 +0000113 s!=se; ++s){
114 Node *nd2=findBB(nodes,*s);
115 assert(nd2 && "No node for this edge!");
116 Edge ed(nd,nd2,0);
Anand Shukla21906892002-06-25 21:14:58 +0000117 edges.push_back(ed);
Anand Shukla70a61382002-02-26 19:00:48 +0000118 }
119 }
120
121 Graph g(nodes,edges, startNode, exitNode);
122
Anand Shuklafd61c602002-07-18 20:56:47 +0000123 //#ifdef DEBUG_PATH_PROFILES
124 //std::cerr<<"Original graph\n";
125 //printGraph(g);
126 //#endif
Anand Shukla70a61382002-02-26 19:00:48 +0000127
Anand Shukla11f42622002-07-08 19:36:01 +0000128 BasicBlock *fr = &F.front();
Anand Shukla70a61382002-02-26 19:00:48 +0000129
Anand Shukla11f42622002-07-08 19:36:01 +0000130 // The graph is made acyclic: this is done
131 // by removing back edges for now, and adding them later on
132 vector<Edge> be;
Anand Shuklafd61c602002-07-18 20:56:47 +0000133 std::map<Node *, int> nodePriority; //it ranks nodes in depth first order traversal
134 g.getBackEdges(be, nodePriority);
135 /*
136 std::cerr<<"Node priority--------------\n";
137 for(std::map<Node *, int>::iterator MI = nodePriority.begin(),
138 ME = nodePriority.end(); MI!=ME; ++MI)
139 std::cerr<<MI->first->getElement()->getName()<<"->"<<MI->second<<"\n";
140 std::cerr<<"End Node priority--------------\n";
141 */
Anand Shukla11f42622002-07-08 19:36:01 +0000142 //std::cerr<<"BackEdges-------------\n";
143 // for(vector<Edge>::iterator VI=be.begin(); VI!=be.end(); ++VI){
144 //printEdge(*VI);
145 //cerr<<"\n";
146 //}
147 //std::cerr<<"------\n";
Anand Shukla21906892002-06-25 21:14:58 +0000148
149#ifdef DEBUG_PATH_PROFILES
Anand Shukla11f42622002-07-08 19:36:01 +0000150 cerr<<"Backedges:"<<be.size()<<endl;
Anand Shukla21906892002-06-25 21:14:58 +0000151#endif
Anand Shukla11f42622002-07-08 19:36:01 +0000152 //Now we need to reflect the effect of back edges
153 //This is done by adding dummy edges
154 //If a->b is a back edge
155 //Then we add 2 back edges for it:
156 //1. from root->b (in vector stDummy)
157 //and 2. from a->exit (in vector exDummy)
158 vector<Edge> stDummy;
159 vector<Edge> exDummy;
160 addDummyEdges(stDummy, exDummy, g, be);
Anand Shukla21906892002-06-25 21:14:58 +0000161
Anand Shukla11f42622002-07-08 19:36:01 +0000162 //std::cerr<<"After adding dummy edges\n";
163 //printGraph(g);
Anand Shukla70a61382002-02-26 19:00:48 +0000164
Anand Shukla11f42622002-07-08 19:36:01 +0000165 // Now, every edge in the graph is assigned a weight
166 // This weight later adds on to assign path
167 // numbers to different paths in the graph
168 // All paths for now are acyclic,
169 // since no back edges in the graph now
170 // numPaths is the number of acyclic paths in the graph
Anand Shuklafd61c602002-07-18 20:56:47 +0000171 int numPaths=valueAssignmentToEdges(g, nodePriority);
Anand Shukla21906892002-06-25 21:14:58 +0000172
Anand Shuklafd61c602002-07-18 20:56:47 +0000173 if(numPaths<=1 || numPaths >5000) return false;
Anand Shukla11f42622002-07-08 19:36:01 +0000174 //std::cerr<<"Numpaths="<<numPaths<<std::endl;
175 //printGraph(g);
176 //create instruction allocation r and count
177 //r is the variable that'll act like an accumulator
178 //all along the path, we just add edge values to r
179 //and at the end, r reflects the path number
180 //count is an array: count[x] would store
181 //the number of executions of path numbered x
Anand Shukla21906892002-06-25 21:14:58 +0000182
Anand Shukla11f42622002-07-08 19:36:01 +0000183 Instruction *rVar=new
184 AllocaInst(PointerType::get(Type::IntTy),
185 ConstantUInt::get(Type::UIntTy,1),"R");
Anand Shukla70a61382002-02-26 19:00:48 +0000186
Anand Shukla11f42622002-07-08 19:36:01 +0000187 Instruction *countVar=new
188 AllocaInst(PointerType::get(Type::IntTy),
189 ConstantUInt::get(Type::UIntTy, numPaths), "Count");
Anand Shukla70a61382002-02-26 19:00:48 +0000190
Anand Shukla11f42622002-07-08 19:36:01 +0000191 // insert initialization code in first (entry) BB
192 // this includes initializing r and count
193 insertInTopBB(&F.getEntryNode(),numPaths, rVar, countVar);
Anand Shukla70a61382002-02-26 19:00:48 +0000194
Anand Shukla11f42622002-07-08 19:36:01 +0000195 //now process the graph: get path numbers,
196 //get increments along different paths,
197 //and assign "increments" and "updates" (to r and count)
198 //"optimally". Finally, insert llvm code along various edges
Anand Shuklafd61c602002-07-18 20:56:47 +0000199 processGraph(g, rVar, countVar, be, stDummy, exDummy, numPaths, mn);
200
Chris Lattner62b7fd12002-04-07 20:49:59 +0000201 return true; // Always modifies function
Anand Shukla70a61382002-02-26 19:00:48 +0000202}