1 //===-- StructurizeCFG.cpp ------------------------------------------------===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 10 #include "llvm/Transforms/Scalar.h" 11 #include "llvm/ADT/MapVector.h" 12 #include "llvm/ADT/PostOrderIterator.h" 13 #include "llvm/ADT/SCCIterator.h" 14 #include "llvm/Analysis/DivergenceAnalysis.h" 15 #include "llvm/Analysis/LoopInfo.h" 16 #include "llvm/Analysis/RegionInfo.h" 17 #include "llvm/Analysis/RegionIterator.h" 18 #include "llvm/Analysis/RegionPass.h" 19 #include "llvm/IR/Module.h" 20 #include "llvm/IR/PatternMatch.h" 21 #include "llvm/Support/Debug.h" 22 #include "llvm/Support/raw_ostream.h" 23 #include "llvm/Transforms/Utils/SSAUpdater.h" 24 25 using namespace llvm; 26 using namespace llvm::PatternMatch; 27 28 #define DEBUG_TYPE "structurizecfg" 29 30 namespace { 31 32 // Definition of the complex types used in this pass. 33 34 typedef std::pair<BasicBlock *, Value *> BBValuePair; 35 36 typedef SmallVector<RegionNode*, 8> RNVector; 37 typedef SmallVector<BasicBlock*, 8> BBVector; 38 typedef SmallVector<BranchInst*, 8> BranchVector; 39 typedef SmallVector<BBValuePair, 2> BBValueVector; 40 41 typedef SmallPtrSet<BasicBlock *, 8> BBSet; 42 43 typedef MapVector<PHINode *, BBValueVector> PhiMap; 44 typedef MapVector<BasicBlock *, BBVector> BB2BBVecMap; 45 46 typedef DenseMap<DomTreeNode *, unsigned> DTN2UnsignedMap; 47 typedef DenseMap<BasicBlock *, PhiMap> BBPhiMap; 48 typedef DenseMap<BasicBlock *, Value *> BBPredicates; 49 typedef DenseMap<BasicBlock *, BBPredicates> PredMap; 50 typedef DenseMap<BasicBlock *, BasicBlock*> BB2BBMap; 51 52 // The name for newly created blocks. 53 54 static const char *const FlowBlockName = "Flow"; 55 56 /// @brief Find the nearest common dominator for multiple BasicBlocks 57 /// 58 /// Helper class for StructurizeCFG 59 /// TODO: Maybe move into common code 60 class NearestCommonDominator { 61 DominatorTree *DT; 62 63 DTN2UnsignedMap IndexMap; 64 65 BasicBlock *Result; 66 unsigned ResultIndex; 67 bool ExplicitMentioned; 68 69 public: 70 /// \brief Start a new query 71 NearestCommonDominator(DominatorTree *DomTree) { 72 DT = DomTree; 73 Result = nullptr; 74 } 75 76 /// \brief Add BB to the resulting dominator 77 void addBlock(BasicBlock *BB, bool Remember = true) { 78 DomTreeNode *Node = DT->getNode(BB); 79 80 if (!Result) { 81 unsigned Numbering = 0; 82 for (;Node;Node = Node->getIDom()) 83 IndexMap[Node] = ++Numbering; 84 Result = BB; 85 ResultIndex = 1; 86 ExplicitMentioned = Remember; 87 return; 88 } 89 90 for (;Node;Node = Node->getIDom()) 91 if (IndexMap.count(Node)) 92 break; 93 else 94 IndexMap[Node] = 0; 95 96 assert(Node && "Dominator tree invalid!"); 97 98 unsigned Numbering = IndexMap[Node]; 99 if (Numbering > ResultIndex) { 100 Result = Node->getBlock(); 101 ResultIndex = Numbering; 102 ExplicitMentioned = Remember && (Result == BB); 103 } else if (Numbering == ResultIndex) { 104 ExplicitMentioned |= Remember; 105 } 106 } 107 108 /// \brief Is "Result" one of the BBs added with "Remember" = True? 109 bool wasResultExplicitMentioned() { 110 return ExplicitMentioned; 111 } 112 113 /// \brief Get the query result 114 BasicBlock *getResult() { 115 return Result; 116 } 117 }; 118 119 /// @brief Transforms the control flow graph on one single entry/exit region 120 /// at a time. 121 /// 122 /// After the transform all "If"/"Then"/"Else" style control flow looks like 123 /// this: 124 /// 125 /// \verbatim 126 /// 1 127 /// || 128 /// | | 129 /// 2 | 130 /// | / 131 /// |/ 132 /// 3 133 /// || Where: 134 /// | | 1 = "If" block, calculates the condition 135 /// 4 | 2 = "Then" subregion, runs if the condition is true 136 /// | / 3 = "Flow" blocks, newly inserted flow blocks, rejoins the flow 137 /// |/ 4 = "Else" optional subregion, runs if the condition is false 138 /// 5 5 = "End" block, also rejoins the control flow 139 /// \endverbatim 140 /// 141 /// Control flow is expressed as a branch where the true exit goes into the 142 /// "Then"/"Else" region, while the false exit skips the region 143 /// The condition for the optional "Else" region is expressed as a PHI node. 144 /// The incomming values of the PHI node are true for the "If" edge and false 145 /// for the "Then" edge. 146 /// 147 /// Additionally to that even complicated loops look like this: 148 /// 149 /// \verbatim 150 /// 1 151 /// || 152 /// | | 153 /// 2 ^ Where: 154 /// | / 1 = "Entry" block 155 /// |/ 2 = "Loop" optional subregion, with all exits at "Flow" block 156 /// 3 3 = "Flow" block, with back edge to entry block 157 /// | 158 /// \endverbatim 159 /// 160 /// The back edge of the "Flow" block is always on the false side of the branch 161 /// while the true side continues the general flow. So the loop condition 162 /// consist of a network of PHI nodes where the true incoming values expresses 163 /// breaks and the false values expresses continue states. 164 class StructurizeCFG : public RegionPass { 165 bool SkipUniformRegions; 166 DivergenceAnalysis *DA; 167 168 Type *Boolean; 169 ConstantInt *BoolTrue; 170 ConstantInt *BoolFalse; 171 UndefValue *BoolUndef; 172 173 Function *Func; 174 Region *ParentRegion; 175 176 DominatorTree *DT; 177 LoopInfo *LI; 178 179 RNVector Order; 180 BBSet Visited; 181 182 BBPhiMap DeletedPhis; 183 BB2BBVecMap AddedPhis; 184 185 PredMap Predicates; 186 BranchVector Conditions; 187 188 BB2BBMap Loops; 189 PredMap LoopPreds; 190 BranchVector LoopConds; 191 192 RegionNode *PrevNode; 193 194 void orderNodes(); 195 196 void analyzeLoops(RegionNode *N); 197 198 Value *invert(Value *Condition); 199 200 Value *buildCondition(BranchInst *Term, unsigned Idx, bool Invert); 201 202 void gatherPredicates(RegionNode *N); 203 204 void collectInfos(); 205 206 void insertConditions(bool Loops); 207 208 void delPhiValues(BasicBlock *From, BasicBlock *To); 209 210 void addPhiValues(BasicBlock *From, BasicBlock *To); 211 212 void setPhiValues(); 213 214 void killTerminator(BasicBlock *BB); 215 216 void changeExit(RegionNode *Node, BasicBlock *NewExit, 217 bool IncludeDominator); 218 219 BasicBlock *getNextFlow(BasicBlock *Dominator); 220 221 BasicBlock *needPrefix(bool NeedEmpty); 222 223 BasicBlock *needPostfix(BasicBlock *Flow, bool ExitUseAllowed); 224 225 void setPrevNode(BasicBlock *BB); 226 227 bool dominatesPredicates(BasicBlock *BB, RegionNode *Node); 228 229 bool isPredictableTrue(RegionNode *Node); 230 231 void wireFlow(bool ExitUseAllowed, BasicBlock *LoopEnd); 232 233 void handleLoops(bool ExitUseAllowed, BasicBlock *LoopEnd); 234 235 void createFlow(); 236 237 void rebuildSSA(); 238 239 bool hasOnlyUniformBranches(const Region *R); 240 241 public: 242 static char ID; 243 244 StructurizeCFG() : 245 RegionPass(ID), SkipUniformRegions(false) { 246 initializeStructurizeCFGPass(*PassRegistry::getPassRegistry()); 247 } 248 249 StructurizeCFG(bool SkipUniformRegions) : 250 RegionPass(ID), SkipUniformRegions(SkipUniformRegions) { 251 initializeStructurizeCFGPass(*PassRegistry::getPassRegistry()); 252 } 253 254 using Pass::doInitialization; 255 bool doInitialization(Region *R, RGPassManager &RGM) override; 256 257 bool runOnRegion(Region *R, RGPassManager &RGM) override; 258 259 const char *getPassName() const override { 260 return "Structurize control flow"; 261 } 262 263 void getAnalysisUsage(AnalysisUsage &AU) const override { 264 if (SkipUniformRegions) 265 AU.addRequired<DivergenceAnalysis>(); 266 AU.addRequiredID(LowerSwitchID); 267 AU.addRequired<DominatorTreeWrapperPass>(); 268 AU.addRequired<LoopInfoWrapperPass>(); 269 AU.addPreserved<DominatorTreeWrapperPass>(); 270 RegionPass::getAnalysisUsage(AU); 271 } 272 }; 273 274 } // end anonymous namespace 275 276 char StructurizeCFG::ID = 0; 277 278 INITIALIZE_PASS_BEGIN(StructurizeCFG, "structurizecfg", "Structurize the CFG", 279 false, false) 280 INITIALIZE_PASS_DEPENDENCY(DivergenceAnalysis) 281 INITIALIZE_PASS_DEPENDENCY(LowerSwitch) 282 INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) 283 INITIALIZE_PASS_DEPENDENCY(RegionInfoPass) 284 INITIALIZE_PASS_END(StructurizeCFG, "structurizecfg", "Structurize the CFG", 285 false, false) 286 287 /// \brief Initialize the types and constants used in the pass 288 bool StructurizeCFG::doInitialization(Region *R, RGPassManager &RGM) { 289 LLVMContext &Context = R->getEntry()->getContext(); 290 291 Boolean = Type::getInt1Ty(Context); 292 BoolTrue = ConstantInt::getTrue(Context); 293 BoolFalse = ConstantInt::getFalse(Context); 294 BoolUndef = UndefValue::get(Boolean); 295 296 return false; 297 } 298 299 /// \brief Build up the general order of nodes 300 void StructurizeCFG::orderNodes() { 301 RNVector TempOrder; 302 ReversePostOrderTraversal<Region*> RPOT(ParentRegion); 303 TempOrder.append(RPOT.begin(), RPOT.end()); 304 305 std::map<Loop*, unsigned> LoopBlocks; 306 307 308 // The reverse post-order traversal of the list gives us an ordering close 309 // to what we want. The only problem with it is that sometimes backedges 310 // for outer loops will be visited before backedges for inner loops. 311 for (RegionNode *RN : TempOrder) { 312 BasicBlock *BB = RN->getEntry(); 313 Loop *Loop = LI->getLoopFor(BB); 314 ++LoopBlocks[Loop]; 315 } 316 317 unsigned CurrentLoopDepth = 0; 318 Loop *CurrentLoop = nullptr; 319 BBSet TempVisited; 320 for (RNVector::iterator I = TempOrder.begin(), E = TempOrder.end(); I != E; ++I) { 321 BasicBlock *BB = (*I)->getEntry(); 322 unsigned LoopDepth = LI->getLoopDepth(BB); 323 324 if (std::find(Order.begin(), Order.end(), *I) != Order.end()) 325 continue; 326 327 if (LoopDepth < CurrentLoopDepth) { 328 // Make sure we have visited all blocks in this loop before moving back to 329 // the outer loop. 330 331 RNVector::iterator LoopI = I; 332 while (unsigned &BlockCount = LoopBlocks[CurrentLoop]) { 333 LoopI++; 334 BasicBlock *LoopBB = (*LoopI)->getEntry(); 335 if (LI->getLoopFor(LoopBB) == CurrentLoop) { 336 --BlockCount; 337 Order.push_back(*LoopI); 338 } 339 } 340 } 341 342 CurrentLoop = LI->getLoopFor(BB); 343 if (CurrentLoop) { 344 LoopBlocks[CurrentLoop]--; 345 } 346 347 CurrentLoopDepth = LoopDepth; 348 Order.push_back(*I); 349 } 350 351 // This pass originally used a post-order traversal and then operated on 352 // the list in reverse. Now that we are using a reverse post-order traversal 353 // rather than re-working the whole pass to operate on the list in order, 354 // we just reverse the list and continue to operate on it in reverse. 355 std::reverse(Order.begin(), Order.end()); 356 } 357 358 /// \brief Determine the end of the loops 359 void StructurizeCFG::analyzeLoops(RegionNode *N) { 360 if (N->isSubRegion()) { 361 // Test for exit as back edge 362 BasicBlock *Exit = N->getNodeAs<Region>()->getExit(); 363 if (Visited.count(Exit)) 364 Loops[Exit] = N->getEntry(); 365 366 } else { 367 // Test for sucessors as back edge 368 BasicBlock *BB = N->getNodeAs<BasicBlock>(); 369 BranchInst *Term = cast<BranchInst>(BB->getTerminator()); 370 371 for (BasicBlock *Succ : Term->successors()) 372 if (Visited.count(Succ)) 373 Loops[Succ] = BB; 374 } 375 } 376 377 /// \brief Invert the given condition 378 Value *StructurizeCFG::invert(Value *Condition) { 379 // First: Check if it's a constant 380 if (Condition == BoolTrue) 381 return BoolFalse; 382 383 if (Condition == BoolFalse) 384 return BoolTrue; 385 386 if (Condition == BoolUndef) 387 return BoolUndef; 388 389 // Second: If the condition is already inverted, return the original value 390 if (match(Condition, m_Not(m_Value(Condition)))) 391 return Condition; 392 393 if (Instruction *Inst = dyn_cast<Instruction>(Condition)) { 394 // Third: Check all the users for an invert 395 BasicBlock *Parent = Inst->getParent(); 396 for (User *U : Condition->users()) 397 if (Instruction *I = dyn_cast<Instruction>(U)) 398 if (I->getParent() == Parent && match(I, m_Not(m_Specific(Condition)))) 399 return I; 400 401 // Last option: Create a new instruction 402 return BinaryOperator::CreateNot(Condition, "", Parent->getTerminator()); 403 } 404 405 if (Argument *Arg = dyn_cast<Argument>(Condition)) { 406 BasicBlock &EntryBlock = Arg->getParent()->getEntryBlock(); 407 return BinaryOperator::CreateNot(Condition, 408 Arg->getName() + ".inv", 409 EntryBlock.getTerminator()); 410 } 411 412 llvm_unreachable("Unhandled condition to invert"); 413 } 414 415 /// \brief Build the condition for one edge 416 Value *StructurizeCFG::buildCondition(BranchInst *Term, unsigned Idx, 417 bool Invert) { 418 Value *Cond = Invert ? BoolFalse : BoolTrue; 419 if (Term->isConditional()) { 420 Cond = Term->getCondition(); 421 422 if (Idx != (unsigned)Invert) 423 Cond = invert(Cond); 424 } 425 return Cond; 426 } 427 428 /// \brief Analyze the predecessors of each block and build up predicates 429 void StructurizeCFG::gatherPredicates(RegionNode *N) { 430 RegionInfo *RI = ParentRegion->getRegionInfo(); 431 BasicBlock *BB = N->getEntry(); 432 BBPredicates &Pred = Predicates[BB]; 433 BBPredicates &LPred = LoopPreds[BB]; 434 435 for (pred_iterator PI = pred_begin(BB), PE = pred_end(BB); 436 PI != PE; ++PI) { 437 438 // Ignore it if it's a branch from outside into our region entry 439 if (!ParentRegion->contains(*PI)) 440 continue; 441 442 Region *R = RI->getRegionFor(*PI); 443 if (R == ParentRegion) { 444 445 // It's a top level block in our region 446 BranchInst *Term = cast<BranchInst>((*PI)->getTerminator()); 447 for (unsigned i = 0, e = Term->getNumSuccessors(); i != e; ++i) { 448 BasicBlock *Succ = Term->getSuccessor(i); 449 if (Succ != BB) 450 continue; 451 452 if (Visited.count(*PI)) { 453 // Normal forward edge 454 if (Term->isConditional()) { 455 // Try to treat it like an ELSE block 456 BasicBlock *Other = Term->getSuccessor(!i); 457 if (Visited.count(Other) && !Loops.count(Other) && 458 !Pred.count(Other) && !Pred.count(*PI)) { 459 460 Pred[Other] = BoolFalse; 461 Pred[*PI] = BoolTrue; 462 continue; 463 } 464 } 465 Pred[*PI] = buildCondition(Term, i, false); 466 467 } else { 468 // Back edge 469 LPred[*PI] = buildCondition(Term, i, true); 470 } 471 } 472 473 } else { 474 475 // It's an exit from a sub region 476 while (R->getParent() != ParentRegion) 477 R = R->getParent(); 478 479 // Edge from inside a subregion to its entry, ignore it 480 if (*R == *N) 481 continue; 482 483 BasicBlock *Entry = R->getEntry(); 484 if (Visited.count(Entry)) 485 Pred[Entry] = BoolTrue; 486 else 487 LPred[Entry] = BoolFalse; 488 } 489 } 490 } 491 492 /// \brief Collect various loop and predicate infos 493 void StructurizeCFG::collectInfos() { 494 // Reset predicate 495 Predicates.clear(); 496 497 // and loop infos 498 Loops.clear(); 499 LoopPreds.clear(); 500 501 // Reset the visited nodes 502 Visited.clear(); 503 504 for (RegionNode *RN : reverse(Order)) { 505 506 DEBUG(dbgs() << "Visiting: " 507 << (RN->isSubRegion() ? "SubRegion with entry: " : "") 508 << RN->getEntry()->getName() << " Loop Depth: " 509 << LI->getLoopDepth(RN->getEntry()) << "\n"); 510 511 // Analyze all the conditions leading to a node 512 gatherPredicates(RN); 513 514 // Remember that we've seen this node 515 Visited.insert(RN->getEntry()); 516 517 // Find the last back edges 518 analyzeLoops(RN); 519 } 520 } 521 522 /// \brief Insert the missing branch conditions 523 void StructurizeCFG::insertConditions(bool Loops) { 524 BranchVector &Conds = Loops ? LoopConds : Conditions; 525 Value *Default = Loops ? BoolTrue : BoolFalse; 526 SSAUpdater PhiInserter; 527 528 for (BranchInst *Term : Conds) { 529 assert(Term->isConditional()); 530 531 BasicBlock *Parent = Term->getParent(); 532 BasicBlock *SuccTrue = Term->getSuccessor(0); 533 BasicBlock *SuccFalse = Term->getSuccessor(1); 534 535 PhiInserter.Initialize(Boolean, ""); 536 PhiInserter.AddAvailableValue(&Func->getEntryBlock(), Default); 537 PhiInserter.AddAvailableValue(Loops ? SuccFalse : Parent, Default); 538 539 BBPredicates &Preds = Loops ? LoopPreds[SuccFalse] : Predicates[SuccTrue]; 540 541 NearestCommonDominator Dominator(DT); 542 Dominator.addBlock(Parent, false); 543 544 Value *ParentValue = nullptr; 545 for (BBPredicates::iterator PI = Preds.begin(), PE = Preds.end(); 546 PI != PE; ++PI) { 547 548 if (PI->first == Parent) { 549 ParentValue = PI->second; 550 break; 551 } 552 PhiInserter.AddAvailableValue(PI->first, PI->second); 553 Dominator.addBlock(PI->first); 554 } 555 556 if (ParentValue) { 557 Term->setCondition(ParentValue); 558 } else { 559 if (!Dominator.wasResultExplicitMentioned()) 560 PhiInserter.AddAvailableValue(Dominator.getResult(), Default); 561 562 Term->setCondition(PhiInserter.GetValueInMiddleOfBlock(Parent)); 563 } 564 } 565 } 566 567 /// \brief Remove all PHI values coming from "From" into "To" and remember 568 /// them in DeletedPhis 569 void StructurizeCFG::delPhiValues(BasicBlock *From, BasicBlock *To) { 570 PhiMap &Map = DeletedPhis[To]; 571 for (BasicBlock::iterator I = To->begin(), E = To->end(); 572 I != E && isa<PHINode>(*I);) { 573 574 PHINode &Phi = cast<PHINode>(*I++); 575 while (Phi.getBasicBlockIndex(From) != -1) { 576 Value *Deleted = Phi.removeIncomingValue(From, false); 577 Map[&Phi].push_back(std::make_pair(From, Deleted)); 578 } 579 } 580 } 581 582 /// \brief Add a dummy PHI value as soon as we knew the new predecessor 583 void StructurizeCFG::addPhiValues(BasicBlock *From, BasicBlock *To) { 584 for (BasicBlock::iterator I = To->begin(), E = To->end(); 585 I != E && isa<PHINode>(*I);) { 586 587 PHINode &Phi = cast<PHINode>(*I++); 588 Value *Undef = UndefValue::get(Phi.getType()); 589 Phi.addIncoming(Undef, From); 590 } 591 AddedPhis[To].push_back(From); 592 } 593 594 /// \brief Add the real PHI value as soon as everything is set up 595 void StructurizeCFG::setPhiValues() { 596 SSAUpdater Updater; 597 for (BB2BBVecMap::iterator AI = AddedPhis.begin(), AE = AddedPhis.end(); 598 AI != AE; ++AI) { 599 600 BasicBlock *To = AI->first; 601 BBVector &From = AI->second; 602 603 if (!DeletedPhis.count(To)) 604 continue; 605 606 PhiMap &Map = DeletedPhis[To]; 607 for (PhiMap::iterator PI = Map.begin(), PE = Map.end(); 608 PI != PE; ++PI) { 609 610 PHINode *Phi = PI->first; 611 Value *Undef = UndefValue::get(Phi->getType()); 612 Updater.Initialize(Phi->getType(), ""); 613 Updater.AddAvailableValue(&Func->getEntryBlock(), Undef); 614 Updater.AddAvailableValue(To, Undef); 615 616 NearestCommonDominator Dominator(DT); 617 Dominator.addBlock(To, false); 618 for (BBValueVector::iterator VI = PI->second.begin(), 619 VE = PI->second.end(); VI != VE; ++VI) { 620 621 Updater.AddAvailableValue(VI->first, VI->second); 622 Dominator.addBlock(VI->first); 623 } 624 625 if (!Dominator.wasResultExplicitMentioned()) 626 Updater.AddAvailableValue(Dominator.getResult(), Undef); 627 628 for (BBVector::iterator FI = From.begin(), FE = From.end(); 629 FI != FE; ++FI) { 630 631 int Idx = Phi->getBasicBlockIndex(*FI); 632 assert(Idx != -1); 633 Phi->setIncomingValue(Idx, Updater.GetValueAtEndOfBlock(*FI)); 634 } 635 } 636 637 DeletedPhis.erase(To); 638 } 639 assert(DeletedPhis.empty()); 640 } 641 642 /// \brief Remove phi values from all successors and then remove the terminator. 643 void StructurizeCFG::killTerminator(BasicBlock *BB) { 644 TerminatorInst *Term = BB->getTerminator(); 645 if (!Term) 646 return; 647 648 for (succ_iterator SI = succ_begin(BB), SE = succ_end(BB); 649 SI != SE; ++SI) { 650 651 delPhiValues(BB, *SI); 652 } 653 654 Term->eraseFromParent(); 655 } 656 657 /// \brief Let node exit(s) point to NewExit 658 void StructurizeCFG::changeExit(RegionNode *Node, BasicBlock *NewExit, 659 bool IncludeDominator) { 660 if (Node->isSubRegion()) { 661 Region *SubRegion = Node->getNodeAs<Region>(); 662 BasicBlock *OldExit = SubRegion->getExit(); 663 BasicBlock *Dominator = nullptr; 664 665 // Find all the edges from the sub region to the exit 666 for (pred_iterator I = pred_begin(OldExit), E = pred_end(OldExit); 667 I != E;) { 668 669 BasicBlock *BB = *I++; 670 if (!SubRegion->contains(BB)) 671 continue; 672 673 // Modify the edges to point to the new exit 674 delPhiValues(BB, OldExit); 675 BB->getTerminator()->replaceUsesOfWith(OldExit, NewExit); 676 addPhiValues(BB, NewExit); 677 678 // Find the new dominator (if requested) 679 if (IncludeDominator) { 680 if (!Dominator) 681 Dominator = BB; 682 else 683 Dominator = DT->findNearestCommonDominator(Dominator, BB); 684 } 685 } 686 687 // Change the dominator (if requested) 688 if (Dominator) 689 DT->changeImmediateDominator(NewExit, Dominator); 690 691 // Update the region info 692 SubRegion->replaceExit(NewExit); 693 694 } else { 695 BasicBlock *BB = Node->getNodeAs<BasicBlock>(); 696 killTerminator(BB); 697 BranchInst::Create(NewExit, BB); 698 addPhiValues(BB, NewExit); 699 if (IncludeDominator) 700 DT->changeImmediateDominator(NewExit, BB); 701 } 702 } 703 704 /// \brief Create a new flow node and update dominator tree and region info 705 BasicBlock *StructurizeCFG::getNextFlow(BasicBlock *Dominator) { 706 LLVMContext &Context = Func->getContext(); 707 BasicBlock *Insert = Order.empty() ? ParentRegion->getExit() : 708 Order.back()->getEntry(); 709 BasicBlock *Flow = BasicBlock::Create(Context, FlowBlockName, 710 Func, Insert); 711 DT->addNewBlock(Flow, Dominator); 712 ParentRegion->getRegionInfo()->setRegionFor(Flow, ParentRegion); 713 return Flow; 714 } 715 716 /// \brief Create a new or reuse the previous node as flow node 717 BasicBlock *StructurizeCFG::needPrefix(bool NeedEmpty) { 718 BasicBlock *Entry = PrevNode->getEntry(); 719 720 if (!PrevNode->isSubRegion()) { 721 killTerminator(Entry); 722 if (!NeedEmpty || Entry->getFirstInsertionPt() == Entry->end()) 723 return Entry; 724 725 } 726 727 // create a new flow node 728 BasicBlock *Flow = getNextFlow(Entry); 729 730 // and wire it up 731 changeExit(PrevNode, Flow, true); 732 PrevNode = ParentRegion->getBBNode(Flow); 733 return Flow; 734 } 735 736 /// \brief Returns the region exit if possible, otherwise just a new flow node 737 BasicBlock *StructurizeCFG::needPostfix(BasicBlock *Flow, 738 bool ExitUseAllowed) { 739 if (Order.empty() && ExitUseAllowed) { 740 BasicBlock *Exit = ParentRegion->getExit(); 741 DT->changeImmediateDominator(Exit, Flow); 742 addPhiValues(Flow, Exit); 743 return Exit; 744 } 745 return getNextFlow(Flow); 746 } 747 748 /// \brief Set the previous node 749 void StructurizeCFG::setPrevNode(BasicBlock *BB) { 750 PrevNode = ParentRegion->contains(BB) ? ParentRegion->getBBNode(BB) 751 : nullptr; 752 } 753 754 /// \brief Does BB dominate all the predicates of Node ? 755 bool StructurizeCFG::dominatesPredicates(BasicBlock *BB, RegionNode *Node) { 756 BBPredicates &Preds = Predicates[Node->getEntry()]; 757 for (BBPredicates::iterator PI = Preds.begin(), PE = Preds.end(); 758 PI != PE; ++PI) { 759 760 if (!DT->dominates(BB, PI->first)) 761 return false; 762 } 763 return true; 764 } 765 766 /// \brief Can we predict that this node will always be called? 767 bool StructurizeCFG::isPredictableTrue(RegionNode *Node) { 768 BBPredicates &Preds = Predicates[Node->getEntry()]; 769 bool Dominated = false; 770 771 // Regionentry is always true 772 if (!PrevNode) 773 return true; 774 775 for (BBPredicates::iterator I = Preds.begin(), E = Preds.end(); 776 I != E; ++I) { 777 778 if (I->second != BoolTrue) 779 return false; 780 781 if (!Dominated && DT->dominates(I->first, PrevNode->getEntry())) 782 Dominated = true; 783 } 784 785 // TODO: The dominator check is too strict 786 return Dominated; 787 } 788 789 /// Take one node from the order vector and wire it up 790 void StructurizeCFG::wireFlow(bool ExitUseAllowed, 791 BasicBlock *LoopEnd) { 792 RegionNode *Node = Order.pop_back_val(); 793 Visited.insert(Node->getEntry()); 794 795 if (isPredictableTrue(Node)) { 796 // Just a linear flow 797 if (PrevNode) { 798 changeExit(PrevNode, Node->getEntry(), true); 799 } 800 PrevNode = Node; 801 802 } else { 803 // Insert extra prefix node (or reuse last one) 804 BasicBlock *Flow = needPrefix(false); 805 806 // Insert extra postfix node (or use exit instead) 807 BasicBlock *Entry = Node->getEntry(); 808 BasicBlock *Next = needPostfix(Flow, ExitUseAllowed); 809 810 // let it point to entry and next block 811 Conditions.push_back(BranchInst::Create(Entry, Next, BoolUndef, Flow)); 812 addPhiValues(Flow, Entry); 813 DT->changeImmediateDominator(Entry, Flow); 814 815 PrevNode = Node; 816 while (!Order.empty() && !Visited.count(LoopEnd) && 817 dominatesPredicates(Entry, Order.back())) { 818 handleLoops(false, LoopEnd); 819 } 820 821 changeExit(PrevNode, Next, false); 822 setPrevNode(Next); 823 } 824 } 825 826 void StructurizeCFG::handleLoops(bool ExitUseAllowed, 827 BasicBlock *LoopEnd) { 828 RegionNode *Node = Order.back(); 829 BasicBlock *LoopStart = Node->getEntry(); 830 831 if (!Loops.count(LoopStart)) { 832 wireFlow(ExitUseAllowed, LoopEnd); 833 return; 834 } 835 836 if (!isPredictableTrue(Node)) 837 LoopStart = needPrefix(true); 838 839 LoopEnd = Loops[Node->getEntry()]; 840 wireFlow(false, LoopEnd); 841 while (!Visited.count(LoopEnd)) { 842 handleLoops(false, LoopEnd); 843 } 844 845 // If the start of the loop is the entry block, we can't branch to it so 846 // insert a new dummy entry block. 847 Function *LoopFunc = LoopStart->getParent(); 848 if (LoopStart == &LoopFunc->getEntryBlock()) { 849 LoopStart->setName("entry.orig"); 850 851 BasicBlock *NewEntry = 852 BasicBlock::Create(LoopStart->getContext(), 853 "entry", 854 LoopFunc, 855 LoopStart); 856 BranchInst::Create(LoopStart, NewEntry); 857 } 858 859 // Create an extra loop end node 860 LoopEnd = needPrefix(false); 861 BasicBlock *Next = needPostfix(LoopEnd, ExitUseAllowed); 862 LoopConds.push_back(BranchInst::Create(Next, LoopStart, 863 BoolUndef, LoopEnd)); 864 addPhiValues(LoopEnd, LoopStart); 865 setPrevNode(Next); 866 } 867 868 /// After this function control flow looks like it should be, but 869 /// branches and PHI nodes only have undefined conditions. 870 void StructurizeCFG::createFlow() { 871 BasicBlock *Exit = ParentRegion->getExit(); 872 bool EntryDominatesExit = DT->dominates(ParentRegion->getEntry(), Exit); 873 874 DeletedPhis.clear(); 875 AddedPhis.clear(); 876 Conditions.clear(); 877 LoopConds.clear(); 878 879 PrevNode = nullptr; 880 Visited.clear(); 881 882 while (!Order.empty()) { 883 handleLoops(EntryDominatesExit, nullptr); 884 } 885 886 if (PrevNode) 887 changeExit(PrevNode, Exit, EntryDominatesExit); 888 else 889 assert(EntryDominatesExit); 890 } 891 892 /// Handle a rare case where the disintegrated nodes instructions 893 /// no longer dominate all their uses. Not sure if this is really nessasary 894 void StructurizeCFG::rebuildSSA() { 895 SSAUpdater Updater; 896 for (auto *BB : ParentRegion->blocks()) 897 for (BasicBlock::iterator II = BB->begin(), IE = BB->end(); 898 II != IE; ++II) { 899 900 bool Initialized = false; 901 for (auto I = II->use_begin(), E = II->use_end(); I != E;) { 902 Use &U = *I++; 903 Instruction *User = cast<Instruction>(U.getUser()); 904 if (User->getParent() == BB) { 905 continue; 906 907 } else if (PHINode *UserPN = dyn_cast<PHINode>(User)) { 908 if (UserPN->getIncomingBlock(U) == BB) 909 continue; 910 } 911 912 if (DT->dominates(&*II, User)) 913 continue; 914 915 if (!Initialized) { 916 Value *Undef = UndefValue::get(II->getType()); 917 Updater.Initialize(II->getType(), ""); 918 Updater.AddAvailableValue(&Func->getEntryBlock(), Undef); 919 Updater.AddAvailableValue(BB, &*II); 920 Initialized = true; 921 } 922 Updater.RewriteUseAfterInsertions(U); 923 } 924 } 925 } 926 927 bool StructurizeCFG::hasOnlyUniformBranches(const Region *R) { 928 for (const BasicBlock *BB : R->blocks()) { 929 const BranchInst *Br = dyn_cast<BranchInst>(BB->getTerminator()); 930 if (!Br || !Br->isConditional()) 931 continue; 932 933 if (!DA->isUniform(Br->getCondition())) 934 return false; 935 DEBUG(dbgs() << "BB: " << BB->getName() << " has uniform terminator\n"); 936 } 937 return true; 938 } 939 940 /// \brief Run the transformation for each region found 941 bool StructurizeCFG::runOnRegion(Region *R, RGPassManager &RGM) { 942 if (R->isTopLevelRegion()) 943 return false; 944 945 if (SkipUniformRegions) { 946 DA = &getAnalysis<DivergenceAnalysis>(); 947 // TODO: We could probably be smarter here with how we handle sub-regions. 948 if (hasOnlyUniformBranches(R)) { 949 DEBUG(dbgs() << "Skipping region with uniform control flow: " << *R << '\n'); 950 951 // Mark all direct child block terminators as having been treated as 952 // uniform. To account for a possible future in which non-uniform 953 // sub-regions are treated more cleverly, indirect children are not 954 // marked as uniform. 955 MDNode *MD = MDNode::get(R->getEntry()->getParent()->getContext(), {}); 956 Region::element_iterator E = R->element_end(); 957 for (Region::element_iterator I = R->element_begin(); I != E; ++I) { 958 if (I->isSubRegion()) 959 continue; 960 961 if (Instruction *Term = I->getEntry()->getTerminator()) 962 Term->setMetadata("structurizecfg.uniform", MD); 963 } 964 965 return false; 966 } 967 } 968 969 Func = R->getEntry()->getParent(); 970 ParentRegion = R; 971 972 DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree(); 973 LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo(); 974 975 orderNodes(); 976 collectInfos(); 977 createFlow(); 978 insertConditions(false); 979 insertConditions(true); 980 setPhiValues(); 981 rebuildSSA(); 982 983 // Cleanup 984 Order.clear(); 985 Visited.clear(); 986 DeletedPhis.clear(); 987 AddedPhis.clear(); 988 Predicates.clear(); 989 Conditions.clear(); 990 Loops.clear(); 991 LoopPreds.clear(); 992 LoopConds.clear(); 993 994 return true; 995 } 996 997 Pass *llvm::createStructurizeCFGPass(bool SkipUniformRegions) { 998 return new StructurizeCFG(SkipUniformRegions); 999 } 1000