blob: 42ef33cb0d5852f80a9a3f583169623a711e685b [file] [log] [blame]
//===-- ProfilePaths.cpp - interface to insert instrumentation ---*- C++ -*--=//
//
// This inserts instrumentation for counting
// execution of paths through a given function.
// It's implemented as a "Function" Pass, and called using opt.
//
// This pass is implemented by using algorithms similar to
// 1."Efficient Path Profiling": Ball, T. and Larus, J. R.,
//   Proceedings of Micro-29, Dec 1996, Paris, France.
// 2."Efficiently Counting Program events with support for on-line
//   queries": Ball T., ACM Transactions on Programming Languages
//   and systems, Sep 1994.
//
// The algorithms work on a Graph constructed over the nodes
// made from Basic Blocks: The transformations then take place on
// the constructed graph (implementation in Graph.cpp and GraphAuxillary.cpp)
// and finally, appropriate instrumentation is placed over suitable edges.
// (code inserted through EdgeCode.cpp).
//
// The algorithm inserts code such that every acyclic path in the CFG
// of a function is identified through a unique number. The code insertion
// is optimal in the sense that it's inserted over a minimal set of edges.
// Also, the algorithm makes sure that initialization, path increment and
// counter update can be collapsed into a minimum number of edges.
//===----------------------------------------------------------------------===//
26
27#include "llvm/Transforms/Instrumentation/ProfilePaths.h"
Chris Lattner15435fd2002-05-07 19:18:48 +000028#include "llvm/Transforms/Utils/UnifyFunctionExitNodes.h"
Anand Shukla70a61382002-02-26 19:00:48 +000029#include "llvm/Support/CFG.h"
Chris Lattnerca142372002-04-28 19:55:58 +000030#include "llvm/Constants.h"
Anand Shukla70a61382002-02-26 19:00:48 +000031#include "llvm/DerivedTypes.h"
32#include "llvm/iMemory.h"
33#include "Graph.h"
34
35using std::vector;
36
Chris Lattner37104aa2002-04-29 14:57:45 +000037struct ProfilePaths : public FunctionPass {
38 const char *getPassName() const { return "ProfilePaths"; }
39
Chris Lattner7076ff22002-06-25 16:13:21 +000040 bool runOnFunction(Function &F);
Chris Lattnerd2095502002-02-26 20:04:59 +000041
42 // Before this pass, make sure that there is only one
Chris Lattner62b7fd12002-04-07 20:49:59 +000043 // entry and only one exit node for the function in the CFG of the function
Chris Lattnerd2095502002-02-26 20:04:59 +000044 //
Chris Lattnerc8e66542002-04-27 06:56:12 +000045 void ProfilePaths::getAnalysisUsage(AnalysisUsage &AU) const {
Chris Lattnerf9986852002-04-27 07:27:19 +000046 AU.addRequired(UnifyFunctionExitNodes::ID);
Chris Lattnerd2095502002-02-26 20:04:59 +000047 }
48};
49
50// createProfilePathsPass - Create a new pass to add path profiling
51//
52Pass *createProfilePathsPass() {
53 return new ProfilePaths();
54}
55
56
Chris Lattner5328c6f2002-02-26 19:40:28 +000057static Node *findBB(std::set<Node *> &st, BasicBlock *BB){
58 for(std::set<Node *>::iterator si=st.begin(); si!=st.end(); ++si){
Anand Shukla70a61382002-02-26 19:00:48 +000059 if(((*si)->getElement())==BB){
60 return *si;
61 }
62 }
63 return NULL;
64}
65
Chris Lattner62b7fd12002-04-07 20:49:59 +000066//Per function pass for inserting counters and trigger code
Chris Lattner7076ff22002-06-25 16:13:21 +000067bool ProfilePaths::runOnFunction(Function &F){
Chris Lattnerf9986852002-04-27 07:27:19 +000068 // Transform the cfg s.t. we have just one exit node
69 BasicBlock *ExitNode = getAnalysis<UnifyFunctionExitNodes>().getExitNode();
Anand Shukla70a61382002-02-26 19:00:48 +000070
Chris Lattnerf9986852002-04-27 07:27:19 +000071 // iterating over BBs and making graph
Anand Shukla70a61382002-02-26 19:00:48 +000072 std::set<Node *> nodes;
73 std::set<Edge> edges;
74 Node *tmp;
75 Node *exitNode, *startNode;
76
Chris Lattnerf9986852002-04-27 07:27:19 +000077 // The nodes must be uniquesly identified:
78 // That is, no two nodes must hav same BB*
Anand Shukla70a61382002-02-26 19:00:48 +000079
Chris Lattnerf9986852002-04-27 07:27:19 +000080 // First enter just nodes: later enter edges
Chris Lattner7076ff22002-06-25 16:13:21 +000081 for (Function::iterator BB = F.begin(), BE = F.end(); BB != BE; ++BB) {
82 Node *nd=new Node(BB);
Anand Shukla70a61382002-02-26 19:00:48 +000083 nodes.insert(nd);
Chris Lattner7076ff22002-06-25 16:13:21 +000084 if(&*BB == ExitNode)
Anand Shukla70a61382002-02-26 19:00:48 +000085 exitNode=nd;
Chris Lattner7076ff22002-06-25 16:13:21 +000086 if(&*BB==F.begin())
Anand Shukla70a61382002-02-26 19:00:48 +000087 startNode=nd;
88 }
89
Chris Lattnerf9986852002-04-27 07:27:19 +000090 // now do it againto insert edges
Chris Lattner7076ff22002-06-25 16:13:21 +000091 for (Function::iterator BB = F.begin(), BE = F.end(); BB != BE; ++BB){
92 Node *nd=findBB(nodes, BB);
Anand Shukla70a61382002-02-26 19:00:48 +000093 assert(nd && "No node for this edge!");
Chris Lattner7076ff22002-06-25 16:13:21 +000094 for(BasicBlock::succ_iterator s=succ_begin(BB), se=succ_end(BB);
Anand Shukla70a61382002-02-26 19:00:48 +000095 s!=se; ++s){
96 Node *nd2=findBB(nodes,*s);
97 assert(nd2 && "No node for this edge!");
98 Edge ed(nd,nd2,0);
99 edges.insert(ed);
100 }
101 }
102
103 Graph g(nodes,edges, startNode, exitNode);
104
Chris Lattnere1fc2d92002-05-22 21:56:32 +0000105 DEBUG(printGraph(g));
Anand Shukla70a61382002-02-26 19:00:48 +0000106
Chris Lattner7076ff22002-06-25 16:13:21 +0000107 BasicBlock *fr=&F.front();
Anand Shukla70a61382002-02-26 19:00:48 +0000108
Chris Lattnerf9986852002-04-27 07:27:19 +0000109 // If only one BB, don't instrument
Chris Lattner7076ff22002-06-25 16:13:21 +0000110 if (++F.begin() == F.end()) {
Chris Lattnerf9986852002-04-27 07:27:19 +0000111 // The graph is made acyclic: this is done
112 // by removing back edges for now, and adding them later on
Chris Lattner5328c6f2002-02-26 19:40:28 +0000113 vector<Edge> be;
Anand Shukla70a61382002-02-26 19:00:48 +0000114 g.getBackEdges(be);
Chris Lattnere1fc2d92002-05-22 21:56:32 +0000115 DEBUG(cerr << "Backedges:" << be.size() << "\n");
116
Chris Lattnerf9986852002-04-27 07:27:19 +0000117 // Now we need to reflect the effect of back edges
118 // This is done by adding dummy edges
119 // If a->b is a back edge
120 // Then we add 2 back edges for it:
121 // 1. from root->b (in vector stDummy)
122 // and 2. from a->exit (in vector exDummy)
Chris Lattner5328c6f2002-02-26 19:40:28 +0000123 vector<Edge> stDummy;
124 vector<Edge> exDummy;
Anand Shukla70a61382002-02-26 19:00:48 +0000125 addDummyEdges(stDummy, exDummy, g, be);
126
Chris Lattnerf9986852002-04-27 07:27:19 +0000127 // Now, every edge in the graph is assigned a weight
128 // This weight later adds on to assign path
129 // numbers to different paths in the graph
130 // All paths for now are acyclic,
131 // since no back edges in the graph now
132 // numPaths is the number of acyclic paths in the graph
Anand Shukla70a61382002-02-26 19:00:48 +0000133 int numPaths=valueAssignmentToEdges(g);
134
Chris Lattnerf9986852002-04-27 07:27:19 +0000135 // create instruction allocation r and count
136 // r is the variable that'll act like an accumulator
137 // all along the path, we just add edge values to r
138 // and at the end, r reflects the path number
139 // count is an array: count[x] would store
140 // the number of executions of path numbered x
Anand Shukla70a61382002-02-26 19:00:48 +0000141 Instruction *rVar=new
142 AllocaInst(PointerType::get(Type::IntTy),
143 ConstantUInt::get(Type::UIntTy,1),"R");
144
145 Instruction *countVar=new
146 AllocaInst(PointerType::get(Type::IntTy),
147 ConstantUInt::get(Type::UIntTy, numPaths), "Count");
148
Chris Lattnerf9986852002-04-27 07:27:19 +0000149 // insert initialization code in first (entry) BB
150 // this includes initializing r and count
Chris Lattner7076ff22002-06-25 16:13:21 +0000151 insertInTopBB(&F.getEntryNode(),numPaths, rVar, countVar);
Anand Shukla70a61382002-02-26 19:00:48 +0000152
Chris Lattnerf9986852002-04-27 07:27:19 +0000153 // now process the graph: get path numbers,
154 // get increments along different paths,
155 // and assign "increments" and "updates" (to r and count)
156 // "optimally". Finally, insert llvm code along various edges
Anand Shukla70a61382002-02-26 19:00:48 +0000157 processGraph(g, rVar, countVar, be, stDummy, exDummy);
158 }
159
Chris Lattner62b7fd12002-04-07 20:49:59 +0000160 return true; // Always modifies function
Anand Shukla70a61382002-02-26 19:00:48 +0000161}