blob: d0d0f550fef788230d94cc9bb03e955b2893a1e0 [file] [log] [blame]
//===-- ProfilePaths.cpp - interface to insert instrumentation --*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file was developed by the LLVM research group and is distributed under
// the University of Illinois Open Source License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This inserts instrumentation for counting execution of paths through a
// given function. It is implemented as a "Function" Pass, and called using
// opt.
//
// This pass is implemented by using algorithms similar to
// 1. "Efficient Path Profiling": Ball, T. and Larus, J. R.,
//    Proceedings of Micro-29, Dec 1996, Paris, France.
// 2. "Efficiently Counting Program Events with Support for On-line
//    Queries": Ball, T., ACM Transactions on Programming Languages
//    and Systems, Sep 1994.
//
// The algorithms work on a Graph constructed over the nodes made from Basic
// Blocks. The transformations then take place on the constructed graph
// (implementation in Graph.cpp and GraphAuxiliary.cpp) and finally, appropriate
// instrumentation is placed over suitable edges (code inserted through
// EdgeCode.cpp).
//
// The algorithm inserts code such that every acyclic path in the CFG of a
// function is identified through a unique number. The code insertion is
// optimal in the sense that it is inserted over a minimal set of edges. Also,
// the algorithm makes sure that initialization, path increment and counter
// update can be collapsed into a minimum number of edges.
//
//===----------------------------------------------------------------------===//
33
Jeff Cohen9a7ac162005-01-07 06:57:28 +000034#include "llvm/Transforms/Instrumentation.h"
Chris Lattner15435fd2002-05-07 19:18:48 +000035#include "llvm/Transforms/Utils/UnifyFunctionExitNodes.h"
Anand Shukla70a61382002-02-26 19:00:48 +000036#include "llvm/Support/CFG.h"
Chris Lattnerca142372002-04-28 19:55:58 +000037#include "llvm/Constants.h"
Anand Shukla70a61382002-02-26 19:00:48 +000038#include "llvm/DerivedTypes.h"
Misha Brukman63b38bd2004-07-29 17:30:56 +000039#include "llvm/Instructions.h"
Anand Shukla77dca142002-09-20 16:44:35 +000040#include "llvm/Module.h"
Chris Lattner2f04a0d2003-01-14 22:33:56 +000041#include "Graph.h"
Anand Shukla21906892002-06-25 21:14:58 +000042#include <fstream>
Brian Gaekeb8a4ed62003-10-10 18:46:52 +000043#include <cstdio>
Anand Shukla70a61382002-02-26 19:00:48 +000044
Brian Gaeke960707c2003-11-11 22:41:34 +000045namespace llvm {
46
Chris Lattner37104aa2002-04-29 14:57:45 +000047struct ProfilePaths : public FunctionPass {
Chris Lattner7076ff22002-06-25 16:13:21 +000048 bool runOnFunction(Function &F);
Chris Lattnerd2095502002-02-26 20:04:59 +000049
Misha Brukmanb1c93172005-04-21 23:48:37 +000050 // Before this pass, make sure that there is only one
Chris Lattner62b7fd12002-04-07 20:49:59 +000051 // entry and only one exit node for the function in the CFG of the function
Chris Lattnerd2095502002-02-26 20:04:59 +000052 //
Chris Lattner407000c2004-12-08 16:05:02 +000053 void getAnalysisUsage(AnalysisUsage &AU) const {
Chris Lattner40eb9da2002-08-08 19:01:28 +000054 AU.addRequired<UnifyFunctionExitNodes>();
Chris Lattnerd2095502002-02-26 20:04:59 +000055 }
56};
57
Chris Lattnera2c09852002-07-26 21:12:44 +000058static RegisterOpt<ProfilePaths> X("paths", "Profile Paths");
Chris Lattnerb28b6802002-07-23 18:06:35 +000059
Jeff Cohen9a7ac162005-01-07 06:57:28 +000060FunctionPass *createProfilePathsPass() { return new ProfilePaths(); }
61
Anand Shukla21906892002-06-25 21:14:58 +000062static Node *findBB(std::vector<Node *> &st, BasicBlock *BB){
63 for(std::vector<Node *>::iterator si=st.begin(); si!=st.end(); ++si){
Anand Shukla70a61382002-02-26 19:00:48 +000064 if(((*si)->getElement())==BB){
65 return *si;
66 }
67 }
68 return NULL;
69}
70
Chris Lattner62b7fd12002-04-07 20:49:59 +000071//Per function pass for inserting counters and trigger code
Chris Lattner7076ff22002-06-25 16:13:21 +000072bool ProfilePaths::runOnFunction(Function &F){
Anand Shukla21906892002-06-25 21:14:58 +000073
74 static int mn = -1;
Anand Shukla2fd8edd2003-06-05 06:02:46 +000075 static int CountCounter = 1;
Anand Shuklafd61c602002-07-18 20:56:47 +000076 if(F.isExternal()) {
Anand Shukla11f42622002-07-08 19:36:01 +000077 return false;
78 }
Misha Brukmanb1c93172005-04-21 23:48:37 +000079
Anand Shukla11f42622002-07-08 19:36:01 +000080 //increment counter for instrumented functions. mn is now function#
81 mn++;
Misha Brukmanb1c93172005-04-21 23:48:37 +000082
Chris Lattnerf9986852002-04-27 07:27:19 +000083 // Transform the cfg s.t. we have just one exit node
Misha Brukmanb1c93172005-04-21 23:48:37 +000084 BasicBlock *ExitNode =
85 getAnalysis<UnifyFunctionExitNodes>().getReturnBlock();
Anand Shukla21906892002-06-25 21:14:58 +000086
87 //iterating over BBs and making graph
88 std::vector<Node *> nodes;
89 std::vector<Edge> edges;
90
Chris Lattnera2620ac2002-11-09 00:49:43 +000091 Node *exitNode = 0, *startNode = 0;
Anand Shukla70a61382002-02-26 19:00:48 +000092
Misha Brukman8b2bd4e2003-10-10 17:57:28 +000093 // The nodes must be uniquely identified:
Chris Lattnerf9986852002-04-27 07:27:19 +000094 // That is, no two nodes must hav same BB*
Misha Brukmanb1c93172005-04-21 23:48:37 +000095
Chris Lattner7076ff22002-06-25 16:13:21 +000096 for (Function::iterator BB = F.begin(), BE = F.end(); BB != BE; ++BB) {
97 Node *nd=new Node(BB);
Misha Brukmanb1c93172005-04-21 23:48:37 +000098 nodes.push_back(nd);
Chris Lattner7076ff22002-06-25 16:13:21 +000099 if(&*BB == ExitNode)
Anand Shukla70a61382002-02-26 19:00:48 +0000100 exitNode=nd;
Chris Lattner889f6202003-04-23 16:37:45 +0000101 if(BB==F.begin())
Anand Shukla70a61382002-02-26 19:00:48 +0000102 startNode=nd;
103 }
104
Misha Brukman8b2bd4e2003-10-10 17:57:28 +0000105 // now do it again to insert edges
Chris Lattner7076ff22002-06-25 16:13:21 +0000106 for (Function::iterator BB = F.begin(), BE = F.end(); BB != BE; ++BB){
107 Node *nd=findBB(nodes, BB);
Anand Shukla70a61382002-02-26 19:00:48 +0000108 assert(nd && "No node for this edge!");
Anand Shukla21906892002-06-25 21:14:58 +0000109
Chris Lattnera9400952003-09-24 22:06:25 +0000110 for(succ_iterator s=succ_begin(BB), se=succ_end(BB); s!=se; ++s){
Anand Shukla70a61382002-02-26 19:00:48 +0000111 Node *nd2=findBB(nodes,*s);
112 assert(nd2 && "No node for this edge!");
113 Edge ed(nd,nd2,0);
Anand Shukla21906892002-06-25 21:14:58 +0000114 edges.push_back(ed);
Anand Shukla70a61382002-02-26 19:00:48 +0000115 }
116 }
Misha Brukmanb1c93172005-04-21 23:48:37 +0000117
Anand Shukla70a61382002-02-26 19:00:48 +0000118 Graph g(nodes,edges, startNode, exitNode);
119
Misha Brukmanb1c93172005-04-21 23:48:37 +0000120#ifdef DEBUG_PATH_PROFILES
Anand Shuklad9a6af02002-09-16 05:24:49 +0000121 std::cerr<<"Original graph\n";
122 printGraph(g);
123#endif
Anand Shukla70a61382002-02-26 19:00:48 +0000124
Anand Shukla11f42622002-07-08 19:36:01 +0000125 BasicBlock *fr = &F.front();
Misha Brukmanb1c93172005-04-21 23:48:37 +0000126
Anand Shukla11f42622002-07-08 19:36:01 +0000127 // The graph is made acyclic: this is done
128 // by removing back edges for now, and adding them later on
Chris Lattner10a032a2003-09-10 20:35:33 +0000129 std::vector<Edge> be;
Anand Shuklafd61c602002-07-18 20:56:47 +0000130 std::map<Node *, int> nodePriority; //it ranks nodes in depth first order traversal
131 g.getBackEdges(be, nodePriority);
Misha Brukmanb1c93172005-04-21 23:48:37 +0000132
Anand Shuklad9a6af02002-09-16 05:24:49 +0000133#ifdef DEBUG_PATH_PROFILES
134 std::cerr<<"BackEdges-------------\n";
Chris Lattner10a032a2003-09-10 20:35:33 +0000135 for (std::vector<Edge>::iterator VI=be.begin(); VI!=be.end(); ++VI){
Anand Shuklad9a6af02002-09-16 05:24:49 +0000136 printEdge(*VI);
137 cerr<<"\n";
138 }
139 std::cerr<<"------\n";
140#endif
Anand Shukla21906892002-06-25 21:14:58 +0000141
142#ifdef DEBUG_PATH_PROFILES
Anand Shukla11f42622002-07-08 19:36:01 +0000143 cerr<<"Backedges:"<<be.size()<<endl;
Anand Shukla21906892002-06-25 21:14:58 +0000144#endif
Anand Shukla11f42622002-07-08 19:36:01 +0000145 //Now we need to reflect the effect of back edges
146 //This is done by adding dummy edges
147 //If a->b is a back edge
148 //Then we add 2 back edges for it:
149 //1. from root->b (in vector stDummy)
150 //and 2. from a->exit (in vector exDummy)
Chris Lattner10a032a2003-09-10 20:35:33 +0000151 std::vector<Edge> stDummy;
152 std::vector<Edge> exDummy;
Anand Shukla11f42622002-07-08 19:36:01 +0000153 addDummyEdges(stDummy, exDummy, g, be);
Anand Shukla21906892002-06-25 21:14:58 +0000154
Anand Shuklad9a6af02002-09-16 05:24:49 +0000155#ifdef DEBUG_PATH_PROFILES
156 std::cerr<<"After adding dummy edges\n";
157 printGraph(g);
158#endif
159
Anand Shukla11f42622002-07-08 19:36:01 +0000160 // Now, every edge in the graph is assigned a weight
161 // This weight later adds on to assign path
162 // numbers to different paths in the graph
163 // All paths for now are acyclic,
164 // since no back edges in the graph now
165 // numPaths is the number of acyclic paths in the graph
Anand Shuklad9a6af02002-09-16 05:24:49 +0000166 int numPaths=valueAssignmentToEdges(g, nodePriority, be);
Anand Shukla21906892002-06-25 21:14:58 +0000167
Anand Shuklaf8c09ee2003-02-14 20:41:53 +0000168 //if(numPaths<=1) return false;
169
Anand Shukla2fd8edd2003-06-05 06:02:46 +0000170 static GlobalVariable *threshold = NULL;
171 static bool insertedThreshold = false;
172
173 if(!insertedThreshold){
174 threshold = new GlobalVariable(Type::IntTy, false,
175 GlobalValue::ExternalLinkage, 0,
176 "reopt_threshold");
177
178 F.getParent()->getGlobalList().push_back(threshold);
179 insertedThreshold = true;
180 }
181
182 assert(threshold && "GlobalVariable threshold not defined!");
183
184
185 if(fr->getParent()->getName() == "main"){
Misha Brukman8b2bd4e2003-10-10 17:57:28 +0000186 //initialize threshold
Chris Lattner25bc3f82003-08-31 00:21:59 +0000187
188 // FIXME: THIS IS HORRIBLY BROKEN. FUNCTION PASSES CANNOT DO THIS, EXCEPT
189 // IN THEIR INITIALIZE METHOD!!
190 Function *initialize =
191 F.getParent()->getOrInsertFunction("reoptimizerInitialize", Type::VoidTy,
192 PointerType::get(Type::IntTy), 0);
Misha Brukmanb1c93172005-04-21 23:48:37 +0000193
Chris Lattner10a032a2003-09-10 20:35:33 +0000194 std::vector<Value *> trargs;
Anand Shukla2fd8edd2003-06-05 06:02:46 +0000195 trargs.push_back(threshold);
Chris Lattner25bc3f82003-08-31 00:21:59 +0000196 new CallInst(initialize, trargs, "", fr->begin());
Anand Shukla2fd8edd2003-06-05 06:02:46 +0000197 }
198
199
Anand Shuklafd61c602002-07-18 20:56:47 +0000200 if(numPaths<=1 || numPaths >5000) return false;
Misha Brukmanb1c93172005-04-21 23:48:37 +0000201
202#ifdef DEBUG_PATH_PROFILES
Anand Shuklad9a6af02002-09-16 05:24:49 +0000203 printGraph(g);
204#endif
205
Anand Shukla11f42622002-07-08 19:36:01 +0000206 //create instruction allocation r and count
207 //r is the variable that'll act like an accumulator
208 //all along the path, we just add edge values to r
209 //and at the end, r reflects the path number
210 //count is an array: count[x] would store
211 //the number of executions of path numbered x
Anand Shukla21906892002-06-25 21:14:58 +0000212
Misha Brukmanb1c93172005-04-21 23:48:37 +0000213 Instruction *rVar=new
214 AllocaInst(Type::IntTy,
Anand Shukla11f42622002-07-08 19:36:01 +0000215 ConstantUInt::get(Type::UIntTy,1),"R");
Anand Shuklad9a6af02002-09-16 05:24:49 +0000216
Misha Brukmanb1c93172005-04-21 23:48:37 +0000217 //Instruction *countVar=new
218 //AllocaInst(Type::IntTy,
Anand Shuklaf8c09ee2003-02-14 20:41:53 +0000219 // ConstantUInt::get(Type::UIntTy, numPaths), "Count");
220
221 //initialize counter array!
222 std::vector<Constant*> arrayInitialize;
223 for(int xi=0; xi<numPaths; xi++)
224 arrayInitialize.push_back(ConstantSInt::get(Type::IntTy, 0));
225
Chris Lattner379a8d22003-04-16 20:28:45 +0000226 const ArrayType *ATy = ArrayType::get(Type::IntTy, numPaths);
227 Constant *initializer = ConstantArray::get(ATy, arrayInitialize);
Anand Shukla2fd8edd2003-06-05 06:02:46 +0000228 char tempChar[20];
229 sprintf(tempChar, "Count%d", CountCounter);
230 CountCounter++;
231 std::string countStr = tempChar;
Chris Lattner379a8d22003-04-16 20:28:45 +0000232 GlobalVariable *countVar = new GlobalVariable(ATy, false,
Misha Brukmanb1c93172005-04-21 23:48:37 +0000233 GlobalValue::InternalLinkage,
Anand Shukla2fd8edd2003-06-05 06:02:46 +0000234 initializer, countStr,
Chris Lattner379a8d22003-04-16 20:28:45 +0000235 F.getParent());
Misha Brukmanb1c93172005-04-21 23:48:37 +0000236
Anand Shukla11f42622002-07-08 19:36:01 +0000237 // insert initialization code in first (entry) BB
238 // this includes initializing r and count
Chris Lattner5dac64f2003-09-20 14:39:18 +0000239 insertInTopBB(&F.getEntryBlock(), numPaths, rVar, threshold);
Misha Brukmanb1c93172005-04-21 23:48:37 +0000240
Anand Shukla11f42622002-07-08 19:36:01 +0000241 //now process the graph: get path numbers,
242 //get increments along different paths,
243 //and assign "increments" and "updates" (to r and count)
244 //"optimally". Finally, insert llvm code along various edges
Misha Brukmanb1c93172005-04-21 23:48:37 +0000245 processGraph(g, rVar, countVar, be, stDummy, exDummy, numPaths, mn,
246 threshold);
247
Chris Lattner62b7fd12002-04-07 20:49:59 +0000248 return true; // Always modifies function
Anand Shukla70a61382002-02-26 19:00:48 +0000249}
Brian Gaeke960707c2003-11-11 22:41:34 +0000250
251} // End llvm namespace