blob: ebd290cd9157f841ff9822ac3ae1b931410ec28c [file] [log] [blame]
//===-- ProfilePaths.cpp - interface to insert instrumentation ---*- C++ -*--=//
//
// This inserts instrumentation for counting
// execution of paths through a given function.
// It's implemented as a "Function" Pass, and called using opt.
//
// This pass is implemented by using algorithms similar to
// 1."Efficient Path Profiling": Ball, T. and Larus, J. R.,
// Proceedings of Micro-29, Dec 1996, Paris, France.
// 2."Efficiently Counting Program events with support for on-line
// queries": Ball T., ACM Transactions on Programming Languages
// and Systems, Sep 1994.
//
// The algorithms work on a Graph constructed over the nodes
// made from Basic Blocks: The transformations then take place on
// the constructed graph (implementation in Graph.cpp and GraphAuxillary.cpp)
// and finally, appropriate instrumentation is placed over suitable edges.
// (code inserted through EdgeCode.cpp).
//
// The algorithm inserts code such that every acyclic path in the CFG
// of a function is identified through a unique number. The code insertion
// is optimal in the sense that it's inserted over a minimal set of edges. Also,
// the algorithm makes sure that initialization, path increment and counter
// update can be collapsed into a minimum number of edges.
//===----------------------------------------------------------------------===//
26
27#include "llvm/Transforms/Instrumentation/ProfilePaths.h"
Chris Lattnerf9986852002-04-27 07:27:19 +000028#include "llvm/Transforms/UnifyFunctionExitNodes.h"
Anand Shukla70a61382002-02-26 19:00:48 +000029#include "llvm/Support/CFG.h"
Chris Lattnerca142372002-04-28 19:55:58 +000030#include "llvm/Constants.h"
Anand Shukla70a61382002-02-26 19:00:48 +000031#include "llvm/DerivedTypes.h"
32#include "llvm/iMemory.h"
33#include "Graph.h"
34
35using std::vector;
36
Chris Lattner37104aa2002-04-29 14:57:45 +000037struct ProfilePaths : public FunctionPass {
38 const char *getPassName() const { return "ProfilePaths"; }
39
Chris Lattnerc8e66542002-04-27 06:56:12 +000040 bool runOnFunction(Function *F);
Chris Lattnerd2095502002-02-26 20:04:59 +000041
42 // Before this pass, make sure that there is only one
Chris Lattner62b7fd12002-04-07 20:49:59 +000043 // entry and only one exit node for the function in the CFG of the function
Chris Lattnerd2095502002-02-26 20:04:59 +000044 //
Chris Lattnerc8e66542002-04-27 06:56:12 +000045 void ProfilePaths::getAnalysisUsage(AnalysisUsage &AU) const {
Chris Lattnerf9986852002-04-27 07:27:19 +000046 AU.addRequired(UnifyFunctionExitNodes::ID);
Chris Lattnerd2095502002-02-26 20:04:59 +000047 }
48};
49
50// createProfilePathsPass - Create a new pass to add path profiling
51//
52Pass *createProfilePathsPass() {
53 return new ProfilePaths();
54}
55
56
Chris Lattner5328c6f2002-02-26 19:40:28 +000057static Node *findBB(std::set<Node *> &st, BasicBlock *BB){
58 for(std::set<Node *>::iterator si=st.begin(); si!=st.end(); ++si){
Anand Shukla70a61382002-02-26 19:00:48 +000059 if(((*si)->getElement())==BB){
60 return *si;
61 }
62 }
63 return NULL;
64}
65
Chris Lattner62b7fd12002-04-07 20:49:59 +000066//Per function pass for inserting counters and trigger code
Chris Lattnerc8e66542002-04-27 06:56:12 +000067bool ProfilePaths::runOnFunction(Function *M){
Chris Lattnerf9986852002-04-27 07:27:19 +000068 // Transform the cfg s.t. we have just one exit node
69 BasicBlock *ExitNode = getAnalysis<UnifyFunctionExitNodes>().getExitNode();
Anand Shukla70a61382002-02-26 19:00:48 +000070
Chris Lattnerf9986852002-04-27 07:27:19 +000071 // iterating over BBs and making graph
Anand Shukla70a61382002-02-26 19:00:48 +000072 std::set<Node *> nodes;
73 std::set<Edge> edges;
74 Node *tmp;
75 Node *exitNode, *startNode;
76
Chris Lattnerf9986852002-04-27 07:27:19 +000077 // The nodes must be uniquesly identified:
78 // That is, no two nodes must hav same BB*
Anand Shukla70a61382002-02-26 19:00:48 +000079
Chris Lattnerf9986852002-04-27 07:27:19 +000080 // First enter just nodes: later enter edges
Chris Lattner62b7fd12002-04-07 20:49:59 +000081 for (Function::iterator BB = M->begin(), BE=M->end(); BB != BE; ++BB){
Anand Shukla70a61382002-02-26 19:00:48 +000082 Node *nd=new Node(*BB);
83 nodes.insert(nd);
84 if(*BB==ExitNode)
85 exitNode=nd;
86 if(*BB==M->front())
87 startNode=nd;
88 }
89
Chris Lattnerf9986852002-04-27 07:27:19 +000090 // now do it againto insert edges
Chris Lattner62b7fd12002-04-07 20:49:59 +000091 for (Function::iterator BB = M->begin(), BE=M->end(); BB != BE; ++BB){
Anand Shukla70a61382002-02-26 19:00:48 +000092 Node *nd=findBB(nodes, *BB);
93 assert(nd && "No node for this edge!");
94 for(BasicBlock::succ_iterator s=succ_begin(*BB), se=succ_end(*BB);
95 s!=se; ++s){
96 Node *nd2=findBB(nodes,*s);
97 assert(nd2 && "No node for this edge!");
98 Edge ed(nd,nd2,0);
99 edges.insert(ed);
100 }
101 }
102
103 Graph g(nodes,edges, startNode, exitNode);
104
105#ifdef DEBUG_PATH_PROFILES
106 printGraph(g);
107#endif
108
109 BasicBlock *fr=M->front();
110
Chris Lattnerf9986852002-04-27 07:27:19 +0000111 // If only one BB, don't instrument
Anand Shukla70a61382002-02-26 19:00:48 +0000112 if (M->getBasicBlocks().size() == 1) {
Chris Lattnerf9986852002-04-27 07:27:19 +0000113 // The graph is made acyclic: this is done
114 // by removing back edges for now, and adding them later on
Chris Lattner5328c6f2002-02-26 19:40:28 +0000115 vector<Edge> be;
Anand Shukla70a61382002-02-26 19:00:48 +0000116 g.getBackEdges(be);
117#ifdef DEBUG_PATH_PROFILES
118 cerr<<"Backedges:"<<be.size()<<endl;
119#endif
Chris Lattnerf9986852002-04-27 07:27:19 +0000120 // Now we need to reflect the effect of back edges
121 // This is done by adding dummy edges
122 // If a->b is a back edge
123 // Then we add 2 back edges for it:
124 // 1. from root->b (in vector stDummy)
125 // and 2. from a->exit (in vector exDummy)
Chris Lattner5328c6f2002-02-26 19:40:28 +0000126 vector<Edge> stDummy;
127 vector<Edge> exDummy;
Anand Shukla70a61382002-02-26 19:00:48 +0000128 addDummyEdges(stDummy, exDummy, g, be);
129
Chris Lattnerf9986852002-04-27 07:27:19 +0000130 // Now, every edge in the graph is assigned a weight
131 // This weight later adds on to assign path
132 // numbers to different paths in the graph
133 // All paths for now are acyclic,
134 // since no back edges in the graph now
135 // numPaths is the number of acyclic paths in the graph
Anand Shukla70a61382002-02-26 19:00:48 +0000136 int numPaths=valueAssignmentToEdges(g);
137
Chris Lattnerf9986852002-04-27 07:27:19 +0000138 // create instruction allocation r and count
139 // r is the variable that'll act like an accumulator
140 // all along the path, we just add edge values to r
141 // and at the end, r reflects the path number
142 // count is an array: count[x] would store
143 // the number of executions of path numbered x
Anand Shukla70a61382002-02-26 19:00:48 +0000144 Instruction *rVar=new
145 AllocaInst(PointerType::get(Type::IntTy),
146 ConstantUInt::get(Type::UIntTy,1),"R");
147
148 Instruction *countVar=new
149 AllocaInst(PointerType::get(Type::IntTy),
150 ConstantUInt::get(Type::UIntTy, numPaths), "Count");
151
Chris Lattnerf9986852002-04-27 07:27:19 +0000152 // insert initialization code in first (entry) BB
153 // this includes initializing r and count
Anand Shukla70a61382002-02-26 19:00:48 +0000154 insertInTopBB(M->getEntryNode(),numPaths, rVar, countVar);
155
Chris Lattnerf9986852002-04-27 07:27:19 +0000156 // now process the graph: get path numbers,
157 // get increments along different paths,
158 // and assign "increments" and "updates" (to r and count)
159 // "optimally". Finally, insert llvm code along various edges
Anand Shukla70a61382002-02-26 19:00:48 +0000160 processGraph(g, rVar, countVar, be, stDummy, exDummy);
161 }
162
Chris Lattner62b7fd12002-04-07 20:49:59 +0000163 return true; // Always modifies function
Anand Shukla70a61382002-02-26 19:00:48 +0000164}