2002-02-26 20:00:48 +01:00
|
|
|
//===-- ProfilePaths.cpp - interface to insert instrumentation ---*- C++ -*--=//
|
|
|
|
//
|
|
|
|
// This inserts instrumentation for counting
|
2002-04-07 22:49:59 +02:00
|
|
|
// execution of paths through a given function
|
|
|
|
// It is implemented as a "Function" Pass, and called using opt
|
2002-02-26 20:00:48 +01:00
|
|
|
//
|
|
|
|
// This pass is implemented by using algorithms similar to
|
|
|
|
// 1."Efficient Path Profiling": Ball, T. and Larus, J. R.,
|
|
|
|
// Proceedings of Micro-29, Dec 1996, Paris, France.
|
|
|
|
// 2."Efficiently Counting Program events with support for on-line
|
|
|
|
// queries": Ball T., ACM Transactions on Programming Languages
|
|
|
|
// and systems, Sep 1994.
|
|
|
|
//
|
|
|
|
// The algorithms work on a Graph constructed over the nodes
|
|
|
|
// made from Basic Blocks: The transformations then take place on
|
|
|
|
// the constructed graph (implementation in Graph.cpp and GraphAuxillary.cpp)
|
|
|
|
// and finally, appropriate instrumentation is placed over suitable edges.
|
|
|
|
// (code inserted through EdgeCode.cpp).
|
|
|
|
//
|
|
|
|
// The algorithm inserts code such that every acyclic path in the CFG
|
2002-04-07 22:49:59 +02:00
|
|
|
// of a function is identified through a unique number. The code insertion
|
2002-02-26 20:00:48 +01:00
|
|
|
// is optimal in the sense that it is inserted over a minimal set of edges. Also,
|
|
|
|
// the algorithm makes sure that initialization, path increment and counter
|
|
|
|
// update can be collapsed into a minimum number of edges.
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "llvm/Transforms/Instrumentation/ProfilePaths.h"
|
2002-04-27 09:27:19 +02:00
|
|
|
#include "llvm/Transforms/UnifyFunctionExitNodes.h"
|
2002-02-26 20:00:48 +01:00
|
|
|
#include "llvm/Support/CFG.h"
|
2002-04-07 22:49:59 +02:00
|
|
|
#include "llvm/Function.h"
|
2002-02-26 20:00:48 +01:00
|
|
|
#include "llvm/BasicBlock.h"
|
|
|
|
#include "llvm/ConstantVals.h"
|
|
|
|
#include "llvm/DerivedTypes.h"
|
|
|
|
#include "llvm/iMemory.h"
|
2002-02-26 21:04:59 +01:00
|
|
|
#include "llvm/Pass.h"
|
2002-02-26 20:00:48 +01:00
|
|
|
#include "Graph.h"
|
|
|
|
|
|
|
|
using std::vector;
|
|
|
|
|
2002-04-27 08:56:12 +02:00
|
|
|
class ProfilePaths: public FunctionPass {
|
2002-02-26 21:04:59 +01:00
|
|
|
public:
|
2002-04-27 08:56:12 +02:00
|
|
|
bool runOnFunction(Function *F);
|
2002-02-26 21:04:59 +01:00
|
|
|
|
|
|
|
// Before this pass, make sure that there is only one
|
2002-04-07 22:49:59 +02:00
|
|
|
// entry and only one exit node for the function in the CFG of the function
|
2002-02-26 21:04:59 +01:00
|
|
|
//
|
2002-04-27 08:56:12 +02:00
|
|
|
void ProfilePaths::getAnalysisUsage(AnalysisUsage &AU) const {
|
2002-04-27 09:27:19 +02:00
|
|
|
AU.addRequired(UnifyFunctionExitNodes::ID);
|
2002-02-26 21:04:59 +01:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
// createProfilePathsPass - Create a new pass to add path profiling
|
|
|
|
//
|
|
|
|
Pass *createProfilePathsPass() {
|
|
|
|
return new ProfilePaths();
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2002-02-26 20:40:28 +01:00
|
|
|
// findBB - Walk the node set st looking for the node whose element is BB.
// Returns that node, or NULL when no node in the set wraps BB.
static Node *findBB(std::set<Node *> &st, BasicBlock *BB){
  std::set<Node *>::iterator cur = st.begin();
  const std::set<Node *>::iterator last = st.end();

  while (cur != last) {
    Node *candidate = *cur;
    if (candidate->getElement() == BB)
      return candidate;
    ++cur;
  }

  // Ran off the end of the set without a match
  return NULL;
}
|
|
|
|
|
2002-04-07 22:49:59 +02:00
|
|
|
//Per function pass for inserting counters and trigger code
|
2002-04-27 08:56:12 +02:00
|
|
|
bool ProfilePaths::runOnFunction(Function *M){
|
2002-04-27 09:27:19 +02:00
|
|
|
// Transform the cfg s.t. we have just one exit node
|
|
|
|
BasicBlock *ExitNode = getAnalysis<UnifyFunctionExitNodes>().getExitNode();
|
2002-02-26 20:00:48 +01:00
|
|
|
|
2002-04-27 09:27:19 +02:00
|
|
|
// iterating over BBs and making graph
|
2002-02-26 20:00:48 +01:00
|
|
|
std::set<Node *> nodes;
|
|
|
|
std::set<Edge> edges;
|
|
|
|
Node *tmp;
|
|
|
|
Node *exitNode, *startNode;
|
|
|
|
|
2002-04-27 09:27:19 +02:00
|
|
|
// The nodes must be uniquesly identified:
|
|
|
|
// That is, no two nodes must hav same BB*
|
2002-02-26 20:00:48 +01:00
|
|
|
|
2002-04-27 09:27:19 +02:00
|
|
|
// First enter just nodes: later enter edges
|
2002-04-07 22:49:59 +02:00
|
|
|
for (Function::iterator BB = M->begin(), BE=M->end(); BB != BE; ++BB){
|
2002-02-26 20:00:48 +01:00
|
|
|
Node *nd=new Node(*BB);
|
|
|
|
nodes.insert(nd);
|
|
|
|
if(*BB==ExitNode)
|
|
|
|
exitNode=nd;
|
|
|
|
if(*BB==M->front())
|
|
|
|
startNode=nd;
|
|
|
|
}
|
|
|
|
|
2002-04-27 09:27:19 +02:00
|
|
|
// now do it againto insert edges
|
2002-04-07 22:49:59 +02:00
|
|
|
for (Function::iterator BB = M->begin(), BE=M->end(); BB != BE; ++BB){
|
2002-02-26 20:00:48 +01:00
|
|
|
Node *nd=findBB(nodes, *BB);
|
|
|
|
assert(nd && "No node for this edge!");
|
|
|
|
for(BasicBlock::succ_iterator s=succ_begin(*BB), se=succ_end(*BB);
|
|
|
|
s!=se; ++s){
|
|
|
|
Node *nd2=findBB(nodes,*s);
|
|
|
|
assert(nd2 && "No node for this edge!");
|
|
|
|
Edge ed(nd,nd2,0);
|
|
|
|
edges.insert(ed);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
Graph g(nodes,edges, startNode, exitNode);
|
|
|
|
|
|
|
|
#ifdef DEBUG_PATH_PROFILES
|
|
|
|
printGraph(g);
|
|
|
|
#endif
|
|
|
|
|
|
|
|
BasicBlock *fr=M->front();
|
|
|
|
|
2002-04-27 09:27:19 +02:00
|
|
|
// If only one BB, don't instrument
|
2002-02-26 20:00:48 +01:00
|
|
|
if (M->getBasicBlocks().size() == 1) {
|
2002-04-27 09:27:19 +02:00
|
|
|
// The graph is made acyclic: this is done
|
|
|
|
// by removing back edges for now, and adding them later on
|
2002-02-26 20:40:28 +01:00
|
|
|
vector<Edge> be;
|
2002-02-26 20:00:48 +01:00
|
|
|
g.getBackEdges(be);
|
|
|
|
#ifdef DEBUG_PATH_PROFILES
|
|
|
|
cerr<<"Backedges:"<<be.size()<<endl;
|
|
|
|
#endif
|
2002-04-27 09:27:19 +02:00
|
|
|
// Now we need to reflect the effect of back edges
|
|
|
|
// This is done by adding dummy edges
|
|
|
|
// If a->b is a back edge
|
|
|
|
// Then we add 2 back edges for it:
|
|
|
|
// 1. from root->b (in vector stDummy)
|
|
|
|
// and 2. from a->exit (in vector exDummy)
|
2002-02-26 20:40:28 +01:00
|
|
|
vector<Edge> stDummy;
|
|
|
|
vector<Edge> exDummy;
|
2002-02-26 20:00:48 +01:00
|
|
|
addDummyEdges(stDummy, exDummy, g, be);
|
|
|
|
|
2002-04-27 09:27:19 +02:00
|
|
|
// Now, every edge in the graph is assigned a weight
|
|
|
|
// This weight later adds on to assign path
|
|
|
|
// numbers to different paths in the graph
|
|
|
|
// All paths for now are acyclic,
|
|
|
|
// since no back edges in the graph now
|
|
|
|
// numPaths is the number of acyclic paths in the graph
|
2002-02-26 20:00:48 +01:00
|
|
|
int numPaths=valueAssignmentToEdges(g);
|
|
|
|
|
2002-04-27 09:27:19 +02:00
|
|
|
// create instruction allocation r and count
|
|
|
|
// r is the variable that'll act like an accumulator
|
|
|
|
// all along the path, we just add edge values to r
|
|
|
|
// and at the end, r reflects the path number
|
|
|
|
// count is an array: count[x] would store
|
|
|
|
// the number of executions of path numbered x
|
2002-02-26 20:00:48 +01:00
|
|
|
Instruction *rVar=new
|
|
|
|
AllocaInst(PointerType::get(Type::IntTy),
|
|
|
|
ConstantUInt::get(Type::UIntTy,1),"R");
|
|
|
|
|
|
|
|
Instruction *countVar=new
|
|
|
|
AllocaInst(PointerType::get(Type::IntTy),
|
|
|
|
ConstantUInt::get(Type::UIntTy, numPaths), "Count");
|
|
|
|
|
2002-04-27 09:27:19 +02:00
|
|
|
// insert initialization code in first (entry) BB
|
|
|
|
// this includes initializing r and count
|
2002-02-26 20:00:48 +01:00
|
|
|
insertInTopBB(M->getEntryNode(),numPaths, rVar, countVar);
|
|
|
|
|
2002-04-27 09:27:19 +02:00
|
|
|
// now process the graph: get path numbers,
|
|
|
|
// get increments along different paths,
|
|
|
|
// and assign "increments" and "updates" (to r and count)
|
|
|
|
// "optimally". Finally, insert llvm code along various edges
|
2002-02-26 20:00:48 +01:00
|
|
|
processGraph(g, rVar, countVar, be, stDummy, exDummy);
|
|
|
|
}
|
|
|
|
|
2002-04-07 22:49:59 +02:00
|
|
|
return true; // Always modifies function
|
2002-02-26 20:00:48 +01:00
|
|
|
}
|