1 //===- PathNumbering.cpp --------------------------------------*- C++ -*---===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // Ball-Larus path numbers uniquely identify paths through a directed acyclic 11 // graph (DAG) [Ball96]. For a CFG backedges are removed and replaced by phony 12 // edges to obtain a DAG, and thus the unique path numbers [Ball96]. 13 // 14 // The purpose of this analysis is to enumerate the edges in a CFG in order 15 // to obtain paths from path numbers in a convenient manner. As described in 16 // [Ball96] edges can be enumerated such that given a path number by following 17 // the CFG and updating the path number, the path is obtained. 18 // 19 // [Ball96] 20 // T. Ball and J. R. Larus. "Efficient Path Profiling." 21 // International Symposium on Microarchitecture, pages 46-57, 1996. 22 // http://portal.acm.org/citation.cfm?id=243857 23 // 24 //===----------------------------------------------------------------------===// 25 #define DEBUG_TYPE "ball-larus-numbering" 26 27 #include "llvm/Analysis/PathNumbering.h" 28 #include "llvm/Constants.h" 29 #include "llvm/DerivedTypes.h" 30 #include "llvm/InstrTypes.h" 31 #include "llvm/Instructions.h" 32 #include "llvm/Module.h" 33 #include "llvm/Pass.h" 34 #include "llvm/Support/CFG.h" 35 #include "llvm/Support/CommandLine.h" 36 #include "llvm/Support/Compiler.h" 37 #include "llvm/Support/Debug.h" 38 #include "llvm/Support/TypeBuilder.h" 39 #include "llvm/Support/raw_ostream.h" 40 41 #include <queue> 42 #include <stack> 43 #include <string> 44 #include <utility> 45 #include <sstream> 46 47 using namespace llvm; 48 49 // Are we enabling early termination 50 static cl::opt<bool> ProcessEarlyTermination( 51 "path-profile-early-termination", cl::Hidden, 52 cl::desc("In path profiling, insert extra instrumentation to account for " 53 "unexpected function termination.")); 54 55 // Returns the basic block for the BallLarusNode 56 BasicBlock* BallLarusNode::getBlock() { 57 return(_basicBlock); 58 } 59 60 // Returns the number of paths to the exit starting at the node. 61 unsigned BallLarusNode::getNumberPaths() { 62 return(_numberPaths); 63 } 64 65 // Sets the number of paths to the exit starting at the node. 66 void BallLarusNode::setNumberPaths(unsigned numberPaths) { 67 _numberPaths = numberPaths; 68 } 69 70 // Gets the NodeColor used in graph algorithms. 71 BallLarusNode::NodeColor BallLarusNode::getColor() { 72 return(_color); 73 } 74 75 // Sets the NodeColor used in graph algorithms. 76 void BallLarusNode::setColor(BallLarusNode::NodeColor color) { 77 _color = color; 78 } 79 80 // Returns an iterator over predecessor edges. Includes phony and 81 // backedges. 82 BLEdgeIterator BallLarusNode::predBegin() { 83 return(_predEdges.begin()); 84 } 85 86 // Returns the end sentinel for the predecessor iterator. 87 BLEdgeIterator BallLarusNode::predEnd() { 88 return(_predEdges.end()); 89 } 90 91 // Returns the number of predecessor edges. Includes phony and 92 // backedges. 93 unsigned BallLarusNode::getNumberPredEdges() { 94 return(_predEdges.size()); 95 } 96 97 // Returns an iterator over successor edges. Includes phony and 98 // backedges. 99 BLEdgeIterator BallLarusNode::succBegin() { 100 return(_succEdges.begin()); 101 } 102 103 // Returns the end sentinel for the successor iterator. 104 BLEdgeIterator BallLarusNode::succEnd() { 105 return(_succEdges.end()); 106 } 107 108 // Returns the number of successor edges. Includes phony and 109 // backedges. 110 unsigned BallLarusNode::getNumberSuccEdges() { 111 return(_succEdges.size()); 112 } 113 114 // Add an edge to the predecessor list. 115 void BallLarusNode::addPredEdge(BallLarusEdge* edge) { 116 _predEdges.push_back(edge); 117 } 118 119 // Remove an edge from the predecessor list. 120 void BallLarusNode::removePredEdge(BallLarusEdge* edge) { 121 removeEdge(_predEdges, edge); 122 } 123 124 // Add an edge to the successor list. 125 void BallLarusNode::addSuccEdge(BallLarusEdge* edge) { 126 _succEdges.push_back(edge); 127 } 128 129 // Remove an edge from the successor list. 130 void BallLarusNode::removeSuccEdge(BallLarusEdge* edge) { 131 removeEdge(_succEdges, edge); 132 } 133 134 // Returns the name of the BasicBlock being represented. If BasicBlock 135 // is null then returns "<null>". If BasicBlock has no name, then 136 // "<unnamed>" is returned. Intended for use with debug output. 137 std::string BallLarusNode::getName() { 138 std::stringstream name; 139 140 if(getBlock() != NULL) { 141 if(getBlock()->hasName()) { 142 std::string tempName(getBlock()->getName()); 143 name << tempName.c_str() << " (" << _uid << ")"; 144 } else 145 name << "<unnamed> (" << _uid << ")"; 146 } else 147 name << "<null> (" << _uid << ")"; 148 149 return name.str(); 150 } 151 152 // Removes an edge from an edgeVector. Used by removePredEdge and 153 // removeSuccEdge. 154 void BallLarusNode::removeEdge(BLEdgeVector& v, BallLarusEdge* e) { 155 // TODO: Avoid linear scan by using a set instead 156 for(BLEdgeIterator i = v.begin(), 157 end = v.end(); 158 i != end; 159 ++i) { 160 if((*i) == e) { 161 v.erase(i); 162 break; 163 } 164 } 165 } 166 167 // Returns the source node of this edge. 168 BallLarusNode* BallLarusEdge::getSource() const { 169 return(_source); 170 } 171 172 // Returns the target node of this edge. 173 BallLarusNode* BallLarusEdge::getTarget() const { 174 return(_target); 175 } 176 177 // Sets the type of the edge. 178 BallLarusEdge::EdgeType BallLarusEdge::getType() const { 179 return _edgeType; 180 } 181 182 // Gets the type of the edge. 183 void BallLarusEdge::setType(EdgeType type) { 184 _edgeType = type; 185 } 186 187 // Returns the weight of this edge. Used to decode path numbers to sequences 188 // of basic blocks. 189 unsigned BallLarusEdge::getWeight() { 190 return(_weight); 191 } 192 193 // Sets the weight of the edge. Used during path numbering. 194 void BallLarusEdge::setWeight(unsigned weight) { 195 _weight = weight; 196 } 197 198 // Gets the phony edge originating at the root. 199 BallLarusEdge* BallLarusEdge::getPhonyRoot() { 200 return _phonyRoot; 201 } 202 203 // Sets the phony edge originating at the root. 204 void BallLarusEdge::setPhonyRoot(BallLarusEdge* phonyRoot) { 205 _phonyRoot = phonyRoot; 206 } 207 208 // Gets the phony edge terminating at the exit. 209 BallLarusEdge* BallLarusEdge::getPhonyExit() { 210 return _phonyExit; 211 } 212 213 // Sets the phony edge terminating at the exit. 214 void BallLarusEdge::setPhonyExit(BallLarusEdge* phonyExit) { 215 _phonyExit = phonyExit; 216 } 217 218 // Gets the associated real edge if this is a phony edge. 219 BallLarusEdge* BallLarusEdge::getRealEdge() { 220 return _realEdge; 221 } 222 223 // Sets the associated real edge if this is a phony edge. 224 void BallLarusEdge::setRealEdge(BallLarusEdge* realEdge) { 225 _realEdge = realEdge; 226 } 227 228 // Returns the duplicate number of the edge. 229 unsigned BallLarusEdge::getDuplicateNumber() { 230 return(_duplicateNumber); 231 } 232 233 // Initialization that requires virtual functions which are not fully 234 // functional in the constructor. 235 void BallLarusDag::init() { 236 BLBlockNodeMap inDag; 237 std::stack<BallLarusNode*> dfsStack; 238 239 _root = addNode(&(_function.getEntryBlock())); 240 _exit = addNode(NULL); 241 242 // start search from root 243 dfsStack.push(getRoot()); 244 245 // dfs to add each bb into the dag 246 while(dfsStack.size()) 247 buildNode(inDag, dfsStack); 248 249 // put in the final edge 250 addEdge(getExit(),getRoot(),0); 251 } 252 253 // Frees all memory associated with the DAG. 254 BallLarusDag::~BallLarusDag() { 255 for(BLEdgeIterator edge = _edges.begin(), end = _edges.end(); edge != end; 256 ++edge) 257 delete (*edge); 258 259 for(BLNodeIterator node = _nodes.begin(), end = _nodes.end(); node != end; 260 ++node) 261 delete (*node); 262 } 263 264 // Calculate the path numbers by assigning edge increments as prescribed 265 // in Ball-Larus path profiling. 266 void BallLarusDag::calculatePathNumbers() { 267 BallLarusNode* node; 268 std::queue<BallLarusNode*> bfsQueue; 269 bfsQueue.push(getExit()); 270 271 while(bfsQueue.size() > 0) { 272 node = bfsQueue.front(); 273 274 DEBUG(dbgs() << "calculatePathNumbers on " << node->getName() << "\n"); 275 276 bfsQueue.pop(); 277 unsigned prevPathNumber = node->getNumberPaths(); 278 calculatePathNumbersFrom(node); 279 280 // Check for DAG splitting 281 if( node->getNumberPaths() > 100000000 && node != getRoot() ) { 282 // Add new phony edge from the split-node to the DAG's exit 283 BallLarusEdge* exitEdge = addEdge(node, getExit(), 0); 284 exitEdge->setType(BallLarusEdge::SPLITEDGE_PHONY); 285 286 // Counters to handle the possibility of a multi-graph 287 BasicBlock* oldTarget = 0; 288 unsigned duplicateNumber = 0; 289 290 // Iterate through each successor edge, adding phony edges 291 for( BLEdgeIterator succ = node->succBegin(), end = node->succEnd(); 292 succ != end; oldTarget = (*succ)->getTarget()->getBlock(), succ++ ) { 293 294 if( (*succ)->getType() == BallLarusEdge::NORMAL ) { 295 // is this edge a duplicate? 296 if( oldTarget != (*succ)->getTarget()->getBlock() ) 297 duplicateNumber = 0; 298 299 // create the new phony edge: root -> succ 300 BallLarusEdge* rootEdge = 301 addEdge(getRoot(), (*succ)->getTarget(), duplicateNumber++); 302 rootEdge->setType(BallLarusEdge::SPLITEDGE_PHONY); 303 rootEdge->setRealEdge(*succ); 304 305 // split on this edge and reference it's exit/root phony edges 306 (*succ)->setType(BallLarusEdge::SPLITEDGE); 307 (*succ)->setPhonyRoot(rootEdge); 308 (*succ)->setPhonyExit(exitEdge); 309 (*succ)->setWeight(0); 310 } 311 } 312 313 calculatePathNumbersFrom(node); 314 } 315 316 DEBUG(dbgs() << "prev, new number paths " << prevPathNumber << ", " 317 << node->getNumberPaths() << ".\n"); 318 319 if(prevPathNumber == 0 && node->getNumberPaths() != 0) { 320 DEBUG(dbgs() << "node ready : " << node->getName() << "\n"); 321 for(BLEdgeIterator pred = node->predBegin(), end = node->predEnd(); 322 pred != end; pred++) { 323 if( (*pred)->getType() == BallLarusEdge::BACKEDGE || 324 (*pred)->getType() == BallLarusEdge::SPLITEDGE ) 325 continue; 326 327 BallLarusNode* nextNode = (*pred)->getSource(); 328 // not yet visited? 329 if(nextNode->getNumberPaths() == 0) 330 bfsQueue.push(nextNode); 331 } 332 } 333 } 334 335 DEBUG(dbgs() << "\tNumber of paths: " << getRoot()->getNumberPaths() << "\n"); 336 } 337 338 // Returns the number of paths for the Dag. 339 unsigned BallLarusDag::getNumberOfPaths() { 340 return(getRoot()->getNumberPaths()); 341 } 342 343 // Returns the root (i.e. entry) node for the DAG. 344 BallLarusNode* BallLarusDag::getRoot() { 345 return _root; 346 } 347 348 // Returns the exit node for the DAG. 349 BallLarusNode* BallLarusDag::getExit() { 350 return _exit; 351 } 352 353 // Returns the function for the DAG. 354 Function& BallLarusDag::getFunction() { 355 return(_function); 356 } 357 358 // Clears the node colors. 359 void BallLarusDag::clearColors(BallLarusNode::NodeColor color) { 360 for (BLNodeIterator nodeIt = _nodes.begin(); nodeIt != _nodes.end(); nodeIt++) 361 (*nodeIt)->setColor(color); 362 } 363 364 // Processes one node and its imediate edges for building the DAG. 365 void BallLarusDag::buildNode(BLBlockNodeMap& inDag, BLNodeStack& dfsStack) { 366 BallLarusNode* currentNode = dfsStack.top(); 367 BasicBlock* currentBlock = currentNode->getBlock(); 368 369 if(currentNode->getColor() != BallLarusNode::WHITE) { 370 // we have already visited this node 371 dfsStack.pop(); 372 currentNode->setColor(BallLarusNode::BLACK); 373 } else { 374 // are there any external procedure calls? 375 if( ProcessEarlyTermination ) { 376 for( BasicBlock::iterator bbCurrent = currentNode->getBlock()->begin(), 377 bbEnd = currentNode->getBlock()->end(); bbCurrent != bbEnd; 378 bbCurrent++ ) { 379 Instruction& instr = *bbCurrent; 380 if( instr.getOpcode() == Instruction::Call ) { 381 BallLarusEdge* callEdge = addEdge(currentNode, getExit(), 0); 382 callEdge->setType(BallLarusEdge::CALLEDGE_PHONY); 383 break; 384 } 385 } 386 } 387 388 TerminatorInst* terminator = currentNode->getBlock()->getTerminator(); 389 if(isa<ReturnInst>(terminator) || isa<UnreachableInst>(terminator) 390 || isa<UnwindInst>(terminator)) 391 addEdge(currentNode, getExit(),0); 392 393 currentNode->setColor(BallLarusNode::GRAY); 394 inDag[currentBlock] = currentNode; 395 396 BasicBlock* oldSuccessor = 0; 397 unsigned duplicateNumber = 0; 398 399 // iterate through this node's successors 400 for(succ_iterator successor = succ_begin(currentBlock), 401 succEnd = succ_end(currentBlock); successor != succEnd; 402 oldSuccessor = *successor, ++successor ) { 403 BasicBlock* succBB = *successor; 404 405 // is this edge a duplicate? 406 if (oldSuccessor == succBB) 407 duplicateNumber++; 408 else 409 duplicateNumber = 0; 410 411 buildEdge(inDag, dfsStack, currentNode, succBB, duplicateNumber); 412 } 413 } 414 } 415 416 // Process an edge in the CFG for DAG building. 417 void BallLarusDag::buildEdge(BLBlockNodeMap& inDag, std::stack<BallLarusNode*>& 418 dfsStack, BallLarusNode* currentNode, 419 BasicBlock* succBB, unsigned duplicateCount) { 420 BallLarusNode* succNode = inDag[succBB]; 421 422 if(succNode && succNode->getColor() == BallLarusNode::BLACK) { 423 // visited node and forward edge 424 addEdge(currentNode, succNode, duplicateCount); 425 } else if(succNode && succNode->getColor() == BallLarusNode::GRAY) { 426 // visited node and back edge 427 DEBUG(dbgs() << "Backedge detected.\n"); 428 addBackedge(currentNode, succNode, duplicateCount); 429 } else { 430 BallLarusNode* childNode; 431 // not visited node and forward edge 432 if(succNode) // an unvisited node that is child of a gray node 433 childNode = succNode; 434 else { // an unvisited node that is a child of a an unvisted node 435 childNode = addNode(succBB); 436 inDag[succBB] = childNode; 437 } 438 addEdge(currentNode, childNode, duplicateCount); 439 dfsStack.push(childNode); 440 } 441 } 442 443 // The weight on each edge is the increment required along any path that 444 // contains that edge. 445 void BallLarusDag::calculatePathNumbersFrom(BallLarusNode* node) { 446 if(node == getExit()) 447 // The Exit node must be base case 448 node->setNumberPaths(1); 449 else { 450 unsigned sumPaths = 0; 451 BallLarusNode* succNode; 452 453 for(BLEdgeIterator succ = node->succBegin(), end = node->succEnd(); 454 succ != end; succ++) { 455 if( (*succ)->getType() == BallLarusEdge::BACKEDGE || 456 (*succ)->getType() == BallLarusEdge::SPLITEDGE ) 457 continue; 458 459 (*succ)->setWeight(sumPaths); 460 succNode = (*succ)->getTarget(); 461 462 if( !succNode->getNumberPaths() ) 463 return; 464 sumPaths += succNode->getNumberPaths(); 465 } 466 467 node->setNumberPaths(sumPaths); 468 } 469 } 470 471 // Allows subclasses to determine which type of Node is created. 472 // Override this method to produce subclasses of BallLarusNode if 473 // necessary. The destructor of BallLarusDag will call free on each 474 // pointer created. 475 BallLarusNode* BallLarusDag::createNode(BasicBlock* BB) { 476 return( new BallLarusNode(BB) ); 477 } 478 479 // Allows subclasses to determine which type of Edge is created. 480 // Override this method to produce subclasses of BallLarusEdge if 481 // necessary. The destructor of BallLarusDag will call free on each 482 // pointer created. 483 BallLarusEdge* BallLarusDag::createEdge(BallLarusNode* source, 484 BallLarusNode* target, 485 unsigned duplicateCount) { 486 return( new BallLarusEdge(source, target, duplicateCount) ); 487 } 488 489 // Proxy to node's constructor. Updates the DAG state. 490 BallLarusNode* BallLarusDag::addNode(BasicBlock* BB) { 491 BallLarusNode* newNode = createNode(BB); 492 _nodes.push_back(newNode); 493 return( newNode ); 494 } 495 496 // Proxy to edge's constructor. Updates the DAG state. 497 BallLarusEdge* BallLarusDag::addEdge(BallLarusNode* source, 498 BallLarusNode* target, 499 unsigned duplicateCount) { 500 BallLarusEdge* newEdge = createEdge(source, target, duplicateCount); 501 _edges.push_back(newEdge); 502 source->addSuccEdge(newEdge); 503 target->addPredEdge(newEdge); 504 return(newEdge); 505 } 506 507 // Adds a backedge with its phony edges. Updates the DAG state. 508 void BallLarusDag::addBackedge(BallLarusNode* source, BallLarusNode* target, 509 unsigned duplicateCount) { 510 BallLarusEdge* childEdge = addEdge(source, target, duplicateCount); 511 childEdge->setType(BallLarusEdge::BACKEDGE); 512 513 childEdge->setPhonyRoot(addEdge(getRoot(), target,0)); 514 childEdge->setPhonyExit(addEdge(source, getExit(),0)); 515 516 childEdge->getPhonyRoot()->setRealEdge(childEdge); 517 childEdge->getPhonyRoot()->setType(BallLarusEdge::BACKEDGE_PHONY); 518 519 childEdge->getPhonyExit()->setRealEdge(childEdge); 520 childEdge->getPhonyExit()->setType(BallLarusEdge::BACKEDGE_PHONY); 521 _backEdges.push_back(childEdge); 522 } 523