xref: /openbsd-src/gnu/llvm/llvm/lib/Transforms/Utils/LowerSwitch.cpp (revision d415bd752c734aee168c4ee86ff32e8cc249eb16)
109467b48Spatrick //===- LowerSwitch.cpp - Eliminate Switch instructions --------------------===//
209467b48Spatrick //
309467b48Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
409467b48Spatrick // See https://llvm.org/LICENSE.txt for license information.
509467b48Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
609467b48Spatrick //
709467b48Spatrick //===----------------------------------------------------------------------===//
809467b48Spatrick //
909467b48Spatrick // The LowerSwitch transformation rewrites switch instructions with a sequence
1009467b48Spatrick // of branches, which allows targets to get away with not implementing the
1109467b48Spatrick // switch instruction until it is convenient.
1209467b48Spatrick //
1309467b48Spatrick //===----------------------------------------------------------------------===//
1409467b48Spatrick 
1573471bf0Spatrick #include "llvm/Transforms/Utils/LowerSwitch.h"
1609467b48Spatrick #include "llvm/ADT/DenseMap.h"
1709467b48Spatrick #include "llvm/ADT/STLExtras.h"
1809467b48Spatrick #include "llvm/ADT/SmallPtrSet.h"
1909467b48Spatrick #include "llvm/ADT/SmallVector.h"
2009467b48Spatrick #include "llvm/Analysis/AssumptionCache.h"
2109467b48Spatrick #include "llvm/Analysis/LazyValueInfo.h"
2209467b48Spatrick #include "llvm/Analysis/ValueTracking.h"
2309467b48Spatrick #include "llvm/IR/BasicBlock.h"
2409467b48Spatrick #include "llvm/IR/CFG.h"
2509467b48Spatrick #include "llvm/IR/ConstantRange.h"
2609467b48Spatrick #include "llvm/IR/Constants.h"
2709467b48Spatrick #include "llvm/IR/Function.h"
2809467b48Spatrick #include "llvm/IR/InstrTypes.h"
2909467b48Spatrick #include "llvm/IR/Instructions.h"
3073471bf0Spatrick #include "llvm/IR/PassManager.h"
3109467b48Spatrick #include "llvm/IR/Value.h"
3209467b48Spatrick #include "llvm/InitializePasses.h"
3309467b48Spatrick #include "llvm/Pass.h"
3409467b48Spatrick #include "llvm/Support/Casting.h"
3509467b48Spatrick #include "llvm/Support/Compiler.h"
3609467b48Spatrick #include "llvm/Support/Debug.h"
3709467b48Spatrick #include "llvm/Support/KnownBits.h"
3809467b48Spatrick #include "llvm/Support/raw_ostream.h"
3909467b48Spatrick #include "llvm/Transforms/Utils.h"
4009467b48Spatrick #include "llvm/Transforms/Utils/BasicBlockUtils.h"
4109467b48Spatrick #include <algorithm>
4209467b48Spatrick #include <cassert>
4309467b48Spatrick #include <cstdint>
4409467b48Spatrick #include <iterator>
4509467b48Spatrick #include <limits>
4609467b48Spatrick #include <vector>
4709467b48Spatrick 
4809467b48Spatrick using namespace llvm;
4909467b48Spatrick 
5009467b48Spatrick #define DEBUG_TYPE "lower-switch"
5109467b48Spatrick 
5209467b48Spatrick namespace {
5309467b48Spatrick 
5409467b48Spatrick struct IntRange {
55*d415bd75Srobert   APInt Low, High;
5609467b48Spatrick };
5709467b48Spatrick 
5809467b48Spatrick } // end anonymous namespace
5909467b48Spatrick 
6073471bf0Spatrick namespace {
6109467b48Spatrick // Return true iff R is covered by Ranges.
IsInRanges(const IntRange & R,const std::vector<IntRange> & Ranges)6273471bf0Spatrick bool IsInRanges(const IntRange &R, const std::vector<IntRange> &Ranges) {
6309467b48Spatrick   // Note: Ranges must be sorted, non-overlapping and non-adjacent.
6409467b48Spatrick 
6509467b48Spatrick   // Find the first range whose High field is >= R.High,
6609467b48Spatrick   // then check if the Low field is <= R.Low. If so, we
6709467b48Spatrick   // have a Range that covers R.
6809467b48Spatrick   auto I = llvm::lower_bound(
69*d415bd75Srobert       Ranges, R, [](IntRange A, IntRange B) { return A.High.slt(B.High); });
70*d415bd75Srobert   return I != Ranges.end() && I->Low.sle(R.Low);
7109467b48Spatrick }
7209467b48Spatrick 
7309467b48Spatrick struct CaseRange {
7409467b48Spatrick   ConstantInt *Low;
7509467b48Spatrick   ConstantInt *High;
7609467b48Spatrick   BasicBlock *BB;
7709467b48Spatrick 
CaseRange__anon9f57d2800211::CaseRange7809467b48Spatrick   CaseRange(ConstantInt *low, ConstantInt *high, BasicBlock *bb)
7909467b48Spatrick       : Low(low), High(high), BB(bb) {}
8009467b48Spatrick };
8109467b48Spatrick 
8209467b48Spatrick using CaseVector = std::vector<CaseRange>;
8309467b48Spatrick using CaseItr = std::vector<CaseRange>::iterator;
8409467b48Spatrick 
8509467b48Spatrick /// The comparison function for sorting the switch case values in the vector.
8609467b48Spatrick /// WARNING: Case ranges should be disjoint!
8709467b48Spatrick struct CaseCmp {
operator ()__anon9f57d2800211::CaseCmp8873471bf0Spatrick   bool operator()(const CaseRange &C1, const CaseRange &C2) {
8909467b48Spatrick     const ConstantInt *CI1 = cast<const ConstantInt>(C1.Low);
9009467b48Spatrick     const ConstantInt *CI2 = cast<const ConstantInt>(C2.High);
9109467b48Spatrick     return CI1->getValue().slt(CI2->getValue());
9209467b48Spatrick   }
9309467b48Spatrick };
9409467b48Spatrick 
9509467b48Spatrick /// Used for debugging purposes.
9609467b48Spatrick LLVM_ATTRIBUTE_USED
operator <<(raw_ostream & O,const CaseVector & C)9773471bf0Spatrick raw_ostream &operator<<(raw_ostream &O, const CaseVector &C) {
9809467b48Spatrick   O << "[";
9909467b48Spatrick 
10073471bf0Spatrick   for (CaseVector::const_iterator B = C.begin(), E = C.end(); B != E;) {
10109467b48Spatrick     O << "[" << B->Low->getValue() << ", " << B->High->getValue() << "]";
10209467b48Spatrick     if (++B != E)
10309467b48Spatrick       O << ", ";
10409467b48Spatrick   }
10509467b48Spatrick 
10609467b48Spatrick   return O << "]";
10709467b48Spatrick }
10809467b48Spatrick 
10909467b48Spatrick /// Update the first occurrence of the "switch statement" BB in the PHI
11009467b48Spatrick /// node with the "new" BB. The other occurrences will:
11109467b48Spatrick ///
11209467b48Spatrick /// 1) Be updated by subsequent calls to this function.  Switch statements may
11309467b48Spatrick /// have more than one outcoming edge into the same BB if they all have the same
11409467b48Spatrick /// value. When the switch statement is converted these incoming edges are now
11509467b48Spatrick /// coming from multiple BBs.
11609467b48Spatrick /// 2) Removed if subsequent incoming values now share the same case, i.e.,
11709467b48Spatrick /// multiple outcome edges are condensed into one. This is necessary to keep the
11809467b48Spatrick /// number of phi values equal to the number of branches to SuccBB.
FixPhis(BasicBlock * SuccBB,BasicBlock * OrigBB,BasicBlock * NewBB,const APInt & NumMergedCases)119*d415bd75Srobert void FixPhis(BasicBlock *SuccBB, BasicBlock *OrigBB, BasicBlock *NewBB,
120*d415bd75Srobert              const APInt &NumMergedCases) {
121*d415bd75Srobert   for (auto &I : SuccBB->phis()) {
122*d415bd75Srobert     PHINode *PN = cast<PHINode>(&I);
12309467b48Spatrick 
124*d415bd75Srobert     // Only update the first occurrence if NewBB exists.
12509467b48Spatrick     unsigned Idx = 0, E = PN->getNumIncomingValues();
126*d415bd75Srobert     APInt LocalNumMergedCases = NumMergedCases;
127*d415bd75Srobert     for (; Idx != E && NewBB; ++Idx) {
12809467b48Spatrick       if (PN->getIncomingBlock(Idx) == OrigBB) {
12909467b48Spatrick         PN->setIncomingBlock(Idx, NewBB);
13009467b48Spatrick         break;
13109467b48Spatrick       }
13209467b48Spatrick     }
13309467b48Spatrick 
134*d415bd75Srobert     // Skip the updated incoming block so that it will not be removed.
135*d415bd75Srobert     if (NewBB)
136*d415bd75Srobert       ++Idx;
137*d415bd75Srobert 
13809467b48Spatrick     // Remove additional occurrences coming from condensed cases and keep the
13909467b48Spatrick     // number of incoming values equal to the number of branches to SuccBB.
14009467b48Spatrick     SmallVector<unsigned, 8> Indices;
141*d415bd75Srobert     for (; LocalNumMergedCases.ugt(0) && Idx < E; ++Idx)
14209467b48Spatrick       if (PN->getIncomingBlock(Idx) == OrigBB) {
14309467b48Spatrick         Indices.push_back(Idx);
144*d415bd75Srobert         LocalNumMergedCases -= 1;
14509467b48Spatrick       }
14609467b48Spatrick     // Remove incoming values in the reverse order to prevent invalidating
14709467b48Spatrick     // *successive* index.
14809467b48Spatrick     for (unsigned III : llvm::reverse(Indices))
14909467b48Spatrick       PN->removeIncomingValue(III);
15009467b48Spatrick   }
15109467b48Spatrick }
15209467b48Spatrick 
15373471bf0Spatrick /// Create a new leaf block for the binary lookup tree. It checks if the
15473471bf0Spatrick /// switch's value == the case's value. If not, then it jumps to the default
15573471bf0Spatrick /// branch. At this point in the tree, the value can't be another valid case
15673471bf0Spatrick /// value, so the jump to the "default" branch is warranted.
NewLeafBlock(CaseRange & Leaf,Value * Val,ConstantInt * LowerBound,ConstantInt * UpperBound,BasicBlock * OrigBlock,BasicBlock * Default)15773471bf0Spatrick BasicBlock *NewLeafBlock(CaseRange &Leaf, Value *Val, ConstantInt *LowerBound,
15873471bf0Spatrick                          ConstantInt *UpperBound, BasicBlock *OrigBlock,
15973471bf0Spatrick                          BasicBlock *Default) {
16073471bf0Spatrick   Function *F = OrigBlock->getParent();
16173471bf0Spatrick   BasicBlock *NewLeaf = BasicBlock::Create(Val->getContext(), "LeafBlock");
162*d415bd75Srobert   F->insert(++OrigBlock->getIterator(), NewLeaf);
16373471bf0Spatrick 
16473471bf0Spatrick   // Emit comparison
16573471bf0Spatrick   ICmpInst *Comp = nullptr;
16673471bf0Spatrick   if (Leaf.Low == Leaf.High) {
16773471bf0Spatrick     // Make the seteq instruction...
16873471bf0Spatrick     Comp =
16973471bf0Spatrick         new ICmpInst(*NewLeaf, ICmpInst::ICMP_EQ, Val, Leaf.Low, "SwitchLeaf");
17073471bf0Spatrick   } else {
17173471bf0Spatrick     // Make range comparison
17273471bf0Spatrick     if (Leaf.Low == LowerBound) {
17373471bf0Spatrick       // Val >= Min && Val <= Hi --> Val <= Hi
17473471bf0Spatrick       Comp = new ICmpInst(*NewLeaf, ICmpInst::ICMP_SLE, Val, Leaf.High,
17573471bf0Spatrick                           "SwitchLeaf");
17673471bf0Spatrick     } else if (Leaf.High == UpperBound) {
17773471bf0Spatrick       // Val <= Max && Val >= Lo --> Val >= Lo
17873471bf0Spatrick       Comp = new ICmpInst(*NewLeaf, ICmpInst::ICMP_SGE, Val, Leaf.Low,
17973471bf0Spatrick                           "SwitchLeaf");
18073471bf0Spatrick     } else if (Leaf.Low->isZero()) {
18173471bf0Spatrick       // Val >= 0 && Val <= Hi --> Val <=u Hi
18273471bf0Spatrick       Comp = new ICmpInst(*NewLeaf, ICmpInst::ICMP_ULE, Val, Leaf.High,
18373471bf0Spatrick                           "SwitchLeaf");
18473471bf0Spatrick     } else {
18573471bf0Spatrick       // Emit V-Lo <=u Hi-Lo
18673471bf0Spatrick       Constant *NegLo = ConstantExpr::getNeg(Leaf.Low);
18773471bf0Spatrick       Instruction *Add = BinaryOperator::CreateAdd(
18873471bf0Spatrick           Val, NegLo, Val->getName() + ".off", NewLeaf);
18973471bf0Spatrick       Constant *UpperBound = ConstantExpr::getAdd(NegLo, Leaf.High);
19073471bf0Spatrick       Comp = new ICmpInst(*NewLeaf, ICmpInst::ICMP_ULE, Add, UpperBound,
19173471bf0Spatrick                           "SwitchLeaf");
19273471bf0Spatrick     }
19373471bf0Spatrick   }
19473471bf0Spatrick 
19573471bf0Spatrick   // Make the conditional branch...
19673471bf0Spatrick   BasicBlock *Succ = Leaf.BB;
19773471bf0Spatrick   BranchInst::Create(Succ, Default, Comp, NewLeaf);
19873471bf0Spatrick 
199*d415bd75Srobert   // Update the PHI incoming value/block for the default.
200*d415bd75Srobert   for (auto &I : Default->phis()) {
201*d415bd75Srobert     PHINode *PN = cast<PHINode>(&I);
202*d415bd75Srobert     auto *V = PN->getIncomingValueForBlock(OrigBlock);
203*d415bd75Srobert     PN->addIncoming(V, NewLeaf);
204*d415bd75Srobert   }
205*d415bd75Srobert 
20673471bf0Spatrick   // If there were any PHI nodes in this successor, rewrite one entry
20773471bf0Spatrick   // from OrigBlock to come from NewLeaf.
20873471bf0Spatrick   for (BasicBlock::iterator I = Succ->begin(); isa<PHINode>(I); ++I) {
20973471bf0Spatrick     PHINode *PN = cast<PHINode>(I);
21073471bf0Spatrick     // Remove all but one incoming entries from the cluster
211*d415bd75Srobert     APInt Range = Leaf.High->getValue() - Leaf.Low->getValue();
212*d415bd75Srobert     for (APInt j(Range.getBitWidth(), 0, true); j.slt(Range); ++j) {
21373471bf0Spatrick       PN->removeIncomingValue(OrigBlock);
21473471bf0Spatrick     }
21573471bf0Spatrick 
21673471bf0Spatrick     int BlockIdx = PN->getBasicBlockIndex(OrigBlock);
21773471bf0Spatrick     assert(BlockIdx != -1 && "Switch didn't go to this successor??");
21873471bf0Spatrick     PN->setIncomingBlock((unsigned)BlockIdx, NewLeaf);
21973471bf0Spatrick   }
22073471bf0Spatrick 
22173471bf0Spatrick   return NewLeaf;
22273471bf0Spatrick }
22373471bf0Spatrick 
22409467b48Spatrick /// Convert the switch statement into a binary lookup of the case values.
22509467b48Spatrick /// The function recursively builds this tree. LowerBound and UpperBound are
22609467b48Spatrick /// used to keep track of the bounds for Val that have already been checked by
22709467b48Spatrick /// a block emitted by one of the previous calls to switchConvert in the call
22809467b48Spatrick /// stack.
SwitchConvert(CaseItr Begin,CaseItr End,ConstantInt * LowerBound,ConstantInt * UpperBound,Value * Val,BasicBlock * Predecessor,BasicBlock * OrigBlock,BasicBlock * Default,const std::vector<IntRange> & UnreachableRanges)22973471bf0Spatrick BasicBlock *SwitchConvert(CaseItr Begin, CaseItr End, ConstantInt *LowerBound,
23009467b48Spatrick                           ConstantInt *UpperBound, Value *Val,
23109467b48Spatrick                           BasicBlock *Predecessor, BasicBlock *OrigBlock,
23209467b48Spatrick                           BasicBlock *Default,
23309467b48Spatrick                           const std::vector<IntRange> &UnreachableRanges) {
23409467b48Spatrick   assert(LowerBound && UpperBound && "Bounds must be initialized");
23509467b48Spatrick   unsigned Size = End - Begin;
23609467b48Spatrick 
23709467b48Spatrick   if (Size == 1) {
23809467b48Spatrick     // Check if the Case Range is perfectly squeezed in between
23909467b48Spatrick     // already checked Upper and Lower bounds. If it is then we can avoid
24009467b48Spatrick     // emitting the code that checks if the value actually falls in the range
24109467b48Spatrick     // because the bounds already tell us so.
24209467b48Spatrick     if (Begin->Low == LowerBound && Begin->High == UpperBound) {
243*d415bd75Srobert       APInt NumMergedCases = UpperBound->getValue() - LowerBound->getValue();
24473471bf0Spatrick       FixPhis(Begin->BB, OrigBlock, Predecessor, NumMergedCases);
24509467b48Spatrick       return Begin->BB;
24609467b48Spatrick     }
24773471bf0Spatrick     return NewLeafBlock(*Begin, Val, LowerBound, UpperBound, OrigBlock,
24809467b48Spatrick                         Default);
24909467b48Spatrick   }
25009467b48Spatrick 
25109467b48Spatrick   unsigned Mid = Size / 2;
25209467b48Spatrick   std::vector<CaseRange> LHS(Begin, Begin + Mid);
25309467b48Spatrick   LLVM_DEBUG(dbgs() << "LHS: " << LHS << "\n");
25409467b48Spatrick   std::vector<CaseRange> RHS(Begin + Mid, End);
25509467b48Spatrick   LLVM_DEBUG(dbgs() << "RHS: " << RHS << "\n");
25609467b48Spatrick 
25709467b48Spatrick   CaseRange &Pivot = *(Begin + Mid);
25809467b48Spatrick   LLVM_DEBUG(dbgs() << "Pivot ==> [" << Pivot.Low->getValue() << ", "
25909467b48Spatrick                     << Pivot.High->getValue() << "]\n");
26009467b48Spatrick 
26109467b48Spatrick   // NewLowerBound here should never be the integer minimal value.
26209467b48Spatrick   // This is because it is computed from a case range that is never
26309467b48Spatrick   // the smallest, so there is always a case range that has at least
26409467b48Spatrick   // a smaller value.
26509467b48Spatrick   ConstantInt *NewLowerBound = Pivot.Low;
26609467b48Spatrick 
26709467b48Spatrick   // Because NewLowerBound is never the smallest representable integer
26809467b48Spatrick   // it is safe here to subtract one.
26909467b48Spatrick   ConstantInt *NewUpperBound = ConstantInt::get(NewLowerBound->getContext(),
27009467b48Spatrick                                                 NewLowerBound->getValue() - 1);
27109467b48Spatrick 
27209467b48Spatrick   if (!UnreachableRanges.empty()) {
27309467b48Spatrick     // Check if the gap between LHS's highest and NewLowerBound is unreachable.
274*d415bd75Srobert     APInt GapLow = LHS.back().High->getValue() + 1;
275*d415bd75Srobert     APInt GapHigh = NewLowerBound->getValue() - 1;
27609467b48Spatrick     IntRange Gap = {GapLow, GapHigh};
277*d415bd75Srobert     if (GapHigh.sge(GapLow) && IsInRanges(Gap, UnreachableRanges))
27809467b48Spatrick       NewUpperBound = LHS.back().High;
27909467b48Spatrick   }
28009467b48Spatrick 
281*d415bd75Srobert   LLVM_DEBUG(dbgs() << "LHS Bounds ==> [" << LowerBound->getValue() << ", "
282*d415bd75Srobert                     << NewUpperBound->getValue() << "]\n"
283*d415bd75Srobert                     << "RHS Bounds ==> [" << NewLowerBound->getValue() << ", "
284*d415bd75Srobert                     << UpperBound->getValue() << "]\n");
28509467b48Spatrick 
28609467b48Spatrick   // Create a new node that checks if the value is < pivot. Go to the
28709467b48Spatrick   // left branch if it is and right branch if not.
28809467b48Spatrick   Function *F = OrigBlock->getParent();
28909467b48Spatrick   BasicBlock *NewNode = BasicBlock::Create(Val->getContext(), "NodeBlock");
29009467b48Spatrick 
291*d415bd75Srobert   ICmpInst *Comp = new ICmpInst(ICmpInst::ICMP_SLT, Val, Pivot.Low, "Pivot");
29209467b48Spatrick 
29373471bf0Spatrick   BasicBlock *LBranch =
29473471bf0Spatrick       SwitchConvert(LHS.begin(), LHS.end(), LowerBound, NewUpperBound, Val,
29573471bf0Spatrick                     NewNode, OrigBlock, Default, UnreachableRanges);
29673471bf0Spatrick   BasicBlock *RBranch =
29773471bf0Spatrick       SwitchConvert(RHS.begin(), RHS.end(), NewLowerBound, UpperBound, Val,
29873471bf0Spatrick                     NewNode, OrigBlock, Default, UnreachableRanges);
29909467b48Spatrick 
300*d415bd75Srobert   F->insert(++OrigBlock->getIterator(), NewNode);
301*d415bd75Srobert   Comp->insertInto(NewNode, NewNode->end());
30209467b48Spatrick 
30309467b48Spatrick   BranchInst::Create(LBranch, RBranch, Comp, NewNode);
30409467b48Spatrick   return NewNode;
30509467b48Spatrick }
30609467b48Spatrick 
30709467b48Spatrick /// Transform simple list of \p SI's cases into list of CaseRange's \p Cases.
30809467b48Spatrick /// \post \p Cases wouldn't contain references to \p SI's default BB.
30909467b48Spatrick /// \returns Number of \p SI's cases that do not reference \p SI's default BB.
Clusterify(CaseVector & Cases,SwitchInst * SI)31073471bf0Spatrick unsigned Clusterify(CaseVector &Cases, SwitchInst *SI) {
31109467b48Spatrick   unsigned NumSimpleCases = 0;
31209467b48Spatrick 
31309467b48Spatrick   // Start with "simple" cases
31409467b48Spatrick   for (auto Case : SI->cases()) {
31509467b48Spatrick     if (Case.getCaseSuccessor() == SI->getDefaultDest())
31609467b48Spatrick       continue;
31709467b48Spatrick     Cases.push_back(CaseRange(Case.getCaseValue(), Case.getCaseValue(),
31809467b48Spatrick                               Case.getCaseSuccessor()));
31909467b48Spatrick     ++NumSimpleCases;
32009467b48Spatrick   }
32109467b48Spatrick 
32209467b48Spatrick   llvm::sort(Cases, CaseCmp());
32309467b48Spatrick 
32409467b48Spatrick   // Merge case into clusters
32509467b48Spatrick   if (Cases.size() >= 2) {
32609467b48Spatrick     CaseItr I = Cases.begin();
32709467b48Spatrick     for (CaseItr J = std::next(I), E = Cases.end(); J != E; ++J) {
328*d415bd75Srobert       const APInt &nextValue = J->Low->getValue();
329*d415bd75Srobert       const APInt &currentValue = I->High->getValue();
33009467b48Spatrick       BasicBlock *nextBB = J->BB;
33109467b48Spatrick       BasicBlock *currentBB = I->BB;
33209467b48Spatrick 
33309467b48Spatrick       // If the two neighboring cases go to the same destination, merge them
33409467b48Spatrick       // into a single case.
335*d415bd75Srobert       assert(nextValue.sgt(currentValue) &&
336*d415bd75Srobert              "Cases should be strictly ascending");
33709467b48Spatrick       if ((nextValue == currentValue + 1) && (currentBB == nextBB)) {
33809467b48Spatrick         I->High = J->High;
33909467b48Spatrick         // FIXME: Combine branch weights.
34009467b48Spatrick       } else if (++I != J) {
34109467b48Spatrick         *I = *J;
34209467b48Spatrick       }
34309467b48Spatrick     }
34409467b48Spatrick     Cases.erase(std::next(I), Cases.end());
34509467b48Spatrick   }
34609467b48Spatrick 
34709467b48Spatrick   return NumSimpleCases;
34809467b48Spatrick }
34909467b48Spatrick 
35009467b48Spatrick /// Replace the specified switch instruction with a sequence of chained if-then
35109467b48Spatrick /// insts in a balanced binary search.
ProcessSwitchInst(SwitchInst * SI,SmallPtrSetImpl<BasicBlock * > & DeleteList,AssumptionCache * AC,LazyValueInfo * LVI)35273471bf0Spatrick void ProcessSwitchInst(SwitchInst *SI,
35309467b48Spatrick                        SmallPtrSetImpl<BasicBlock *> &DeleteList,
35409467b48Spatrick                        AssumptionCache *AC, LazyValueInfo *LVI) {
35509467b48Spatrick   BasicBlock *OrigBlock = SI->getParent();
35609467b48Spatrick   Function *F = OrigBlock->getParent();
35709467b48Spatrick   Value *Val = SI->getCondition(); // The value we are switching on...
35809467b48Spatrick   BasicBlock *Default = SI->getDefaultDest();
35909467b48Spatrick 
36009467b48Spatrick   // Don't handle unreachable blocks. If there are successors with phis, this
36109467b48Spatrick   // would leave them behind with missing predecessors.
36209467b48Spatrick   if ((OrigBlock != &F->getEntryBlock() && pred_empty(OrigBlock)) ||
36309467b48Spatrick       OrigBlock->getSinglePredecessor() == OrigBlock) {
36409467b48Spatrick     DeleteList.insert(OrigBlock);
36509467b48Spatrick     return;
36609467b48Spatrick   }
36709467b48Spatrick 
36809467b48Spatrick   // Prepare cases vector.
36909467b48Spatrick   CaseVector Cases;
37009467b48Spatrick   const unsigned NumSimpleCases = Clusterify(Cases, SI);
371*d415bd75Srobert   IntegerType *IT = cast<IntegerType>(SI->getCondition()->getType());
372*d415bd75Srobert   const unsigned BitWidth = IT->getBitWidth();
373*d415bd75Srobert   // Explictly use higher precision to prevent unsigned overflow where
374*d415bd75Srobert   // `UnsignedMax - 0 + 1 == 0`
375*d415bd75Srobert   APInt UnsignedZero(BitWidth + 1, 0);
376*d415bd75Srobert   APInt UnsignedMax = APInt::getMaxValue(BitWidth);
37709467b48Spatrick   LLVM_DEBUG(dbgs() << "Clusterify finished. Total clusters: " << Cases.size()
37809467b48Spatrick                     << ". Total non-default cases: " << NumSimpleCases
37909467b48Spatrick                     << "\nCase clusters: " << Cases << "\n");
38009467b48Spatrick 
38109467b48Spatrick   // If there is only the default destination, just branch.
38209467b48Spatrick   if (Cases.empty()) {
38309467b48Spatrick     BranchInst::Create(Default, OrigBlock);
38409467b48Spatrick     // Remove all the references from Default's PHIs to OrigBlock, but one.
385*d415bd75Srobert     FixPhis(Default, OrigBlock, OrigBlock, UnsignedMax);
38609467b48Spatrick     SI->eraseFromParent();
38709467b48Spatrick     return;
38809467b48Spatrick   }
38909467b48Spatrick 
39009467b48Spatrick   ConstantInt *LowerBound = nullptr;
39109467b48Spatrick   ConstantInt *UpperBound = nullptr;
39209467b48Spatrick   bool DefaultIsUnreachableFromSwitch = false;
39309467b48Spatrick 
39409467b48Spatrick   if (isa<UnreachableInst>(Default->getFirstNonPHIOrDbg())) {
39509467b48Spatrick     // Make the bounds tightly fitted around the case value range, because we
39609467b48Spatrick     // know that the value passed to the switch must be exactly one of the case
39709467b48Spatrick     // values.
39809467b48Spatrick     LowerBound = Cases.front().Low;
39909467b48Spatrick     UpperBound = Cases.back().High;
40009467b48Spatrick     DefaultIsUnreachableFromSwitch = true;
40109467b48Spatrick   } else {
40209467b48Spatrick     // Constraining the range of the value being switched over helps eliminating
40309467b48Spatrick     // unreachable BBs and minimizing the number of `add` instructions
40409467b48Spatrick     // newLeafBlock ends up emitting. Running CorrelatedValuePropagation after
40509467b48Spatrick     // LowerSwitch isn't as good, and also much more expensive in terms of
40609467b48Spatrick     // compile time for the following reasons:
40709467b48Spatrick     // 1. it processes many kinds of instructions, not just switches;
40809467b48Spatrick     // 2. even if limited to icmp instructions only, it will have to process
40909467b48Spatrick     //    roughly C icmp's per switch, where C is the number of cases in the
41009467b48Spatrick     //    switch, while LowerSwitch only needs to call LVI once per switch.
41109467b48Spatrick     const DataLayout &DL = F->getParent()->getDataLayout();
41209467b48Spatrick     KnownBits Known = computeKnownBits(Val, DL, /*Depth=*/0, AC, SI);
41309467b48Spatrick     // TODO Shouldn't this create a signed range?
41409467b48Spatrick     ConstantRange KnownBitsRange =
41509467b48Spatrick         ConstantRange::fromKnownBits(Known, /*IsSigned=*/false);
41673471bf0Spatrick     const ConstantRange LVIRange = LVI->getConstantRange(Val, SI);
41709467b48Spatrick     ConstantRange ValRange = KnownBitsRange.intersectWith(LVIRange);
41809467b48Spatrick     // We delegate removal of unreachable non-default cases to other passes. In
41909467b48Spatrick     // the unlikely event that some of them survived, we just conservatively
42009467b48Spatrick     // maintain the invariant that all the cases lie between the bounds. This
42109467b48Spatrick     // may, however, still render the default case effectively unreachable.
422*d415bd75Srobert     const APInt &Low = Cases.front().Low->getValue();
423*d415bd75Srobert     const APInt &High = Cases.back().High->getValue();
42409467b48Spatrick     APInt Min = APIntOps::smin(ValRange.getSignedMin(), Low);
42509467b48Spatrick     APInt Max = APIntOps::smax(ValRange.getSignedMax(), High);
42609467b48Spatrick 
42709467b48Spatrick     LowerBound = ConstantInt::get(SI->getContext(), Min);
42809467b48Spatrick     UpperBound = ConstantInt::get(SI->getContext(), Max);
42909467b48Spatrick     DefaultIsUnreachableFromSwitch = (Min + (NumSimpleCases - 1) == Max);
43009467b48Spatrick   }
43109467b48Spatrick 
43209467b48Spatrick   std::vector<IntRange> UnreachableRanges;
43309467b48Spatrick 
43409467b48Spatrick   if (DefaultIsUnreachableFromSwitch) {
435*d415bd75Srobert     DenseMap<BasicBlock *, APInt> Popularity;
436*d415bd75Srobert     APInt MaxPop(UnsignedZero);
43709467b48Spatrick     BasicBlock *PopSucc = nullptr;
43809467b48Spatrick 
439*d415bd75Srobert     APInt SignedMax = APInt::getSignedMaxValue(BitWidth);
440*d415bd75Srobert     APInt SignedMin = APInt::getSignedMinValue(BitWidth);
441*d415bd75Srobert     IntRange R = {SignedMin, SignedMax};
44209467b48Spatrick     UnreachableRanges.push_back(R);
44309467b48Spatrick     for (const auto &I : Cases) {
444*d415bd75Srobert       const APInt &Low = I.Low->getValue();
445*d415bd75Srobert       const APInt &High = I.High->getValue();
44609467b48Spatrick 
44709467b48Spatrick       IntRange &LastRange = UnreachableRanges.back();
448*d415bd75Srobert       if (LastRange.Low.eq(Low)) {
44909467b48Spatrick         // There is nothing left of the previous range.
45009467b48Spatrick         UnreachableRanges.pop_back();
45109467b48Spatrick       } else {
45209467b48Spatrick         // Terminate the previous range.
453*d415bd75Srobert         assert(Low.sgt(LastRange.Low));
45409467b48Spatrick         LastRange.High = Low - 1;
45509467b48Spatrick       }
456*d415bd75Srobert       if (High.ne(SignedMax)) {
457*d415bd75Srobert         IntRange R = {High + 1, SignedMax};
45809467b48Spatrick         UnreachableRanges.push_back(R);
45909467b48Spatrick       }
46009467b48Spatrick 
46109467b48Spatrick       // Count popularity.
462*d415bd75Srobert       assert(High.sge(Low) && "Popularity shouldn't be negative.");
463*d415bd75Srobert       APInt N = High.sext(BitWidth + 1) - Low.sext(BitWidth + 1) + 1;
464*d415bd75Srobert       // Explict insert to make sure the bitwidth of APInts match
465*d415bd75Srobert       APInt &Pop = Popularity.insert({I.BB, APInt(UnsignedZero)}).first->second;
466*d415bd75Srobert       if ((Pop += N).ugt(MaxPop)) {
46709467b48Spatrick         MaxPop = Pop;
46809467b48Spatrick         PopSucc = I.BB;
46909467b48Spatrick       }
47009467b48Spatrick     }
47109467b48Spatrick #ifndef NDEBUG
47209467b48Spatrick     /* UnreachableRanges should be sorted and the ranges non-adjacent. */
47309467b48Spatrick     for (auto I = UnreachableRanges.begin(), E = UnreachableRanges.end();
47409467b48Spatrick          I != E; ++I) {
475*d415bd75Srobert       assert(I->Low.sle(I->High));
47609467b48Spatrick       auto Next = I + 1;
47709467b48Spatrick       if (Next != E) {
478*d415bd75Srobert         assert(Next->Low.sgt(I->High));
47909467b48Spatrick       }
48009467b48Spatrick     }
48109467b48Spatrick #endif
48209467b48Spatrick 
48309467b48Spatrick     // As the default block in the switch is unreachable, update the PHI nodes
48409467b48Spatrick     // (remove all of the references to the default block) to reflect this.
48509467b48Spatrick     const unsigned NumDefaultEdges = SI->getNumCases() + 1 - NumSimpleCases;
48609467b48Spatrick     for (unsigned I = 0; I < NumDefaultEdges; ++I)
48709467b48Spatrick       Default->removePredecessor(OrigBlock);
48809467b48Spatrick 
48909467b48Spatrick     // Use the most popular block as the new default, reducing the number of
49009467b48Spatrick     // cases.
49109467b48Spatrick     Default = PopSucc;
49273471bf0Spatrick     llvm::erase_if(Cases,
49373471bf0Spatrick                    [PopSucc](const CaseRange &R) { return R.BB == PopSucc; });
49409467b48Spatrick 
49509467b48Spatrick     // If there are no cases left, just branch.
49609467b48Spatrick     if (Cases.empty()) {
49709467b48Spatrick       BranchInst::Create(Default, OrigBlock);
49809467b48Spatrick       SI->eraseFromParent();
49909467b48Spatrick       // As all the cases have been replaced with a single branch, only keep
50009467b48Spatrick       // one entry in the PHI nodes.
501*d415bd75Srobert       if (!MaxPop.isZero())
502*d415bd75Srobert         for (APInt I(UnsignedZero); I.ult(MaxPop - 1); ++I)
50309467b48Spatrick           PopSucc->removePredecessor(OrigBlock);
50409467b48Spatrick       return;
50509467b48Spatrick     }
50609467b48Spatrick 
50709467b48Spatrick     // If the condition was a PHI node with the switch block as a predecessor
50809467b48Spatrick     // removing predecessors may have caused the condition to be erased.
50909467b48Spatrick     // Getting the condition value again here protects against that.
51009467b48Spatrick     Val = SI->getCondition();
51109467b48Spatrick   }
51209467b48Spatrick 
51309467b48Spatrick   BasicBlock *SwitchBlock =
51473471bf0Spatrick       SwitchConvert(Cases.begin(), Cases.end(), LowerBound, UpperBound, Val,
515*d415bd75Srobert                     OrigBlock, OrigBlock, Default, UnreachableRanges);
51609467b48Spatrick 
517*d415bd75Srobert   // We have added incoming values for newly-created predecessors in
518*d415bd75Srobert   // NewLeafBlock(). The only meaningful work we offload to FixPhis() is to
519*d415bd75Srobert   // remove the incoming values from OrigBlock. There might be a special case
520*d415bd75Srobert   // that SwitchBlock is the same as Default, under which the PHIs in Default
521*d415bd75Srobert   // are fixed inside SwitchConvert().
522*d415bd75Srobert   if (SwitchBlock != Default)
523*d415bd75Srobert     FixPhis(Default, OrigBlock, nullptr, UnsignedMax);
52409467b48Spatrick 
52509467b48Spatrick   // Branch to our shiny new if-then stuff...
52609467b48Spatrick   BranchInst::Create(SwitchBlock, OrigBlock);
52709467b48Spatrick 
52809467b48Spatrick   // We are now done with the switch instruction, delete it.
52909467b48Spatrick   BasicBlock *OldDefault = SI->getDefaultDest();
530*d415bd75Srobert   SI->eraseFromParent();
53109467b48Spatrick 
53209467b48Spatrick   // If the Default block has no more predecessors just add it to DeleteList.
53373471bf0Spatrick   if (pred_empty(OldDefault))
53409467b48Spatrick     DeleteList.insert(OldDefault);
53509467b48Spatrick }
53673471bf0Spatrick 
LowerSwitch(Function & F,LazyValueInfo * LVI,AssumptionCache * AC)53773471bf0Spatrick bool LowerSwitch(Function &F, LazyValueInfo *LVI, AssumptionCache *AC) {
53873471bf0Spatrick   bool Changed = false;
53973471bf0Spatrick   SmallPtrSet<BasicBlock *, 8> DeleteList;
54073471bf0Spatrick 
541*d415bd75Srobert   // We use make_early_inc_range here so that we don't traverse new blocks.
542*d415bd75Srobert   for (BasicBlock &Cur : llvm::make_early_inc_range(F)) {
54373471bf0Spatrick     // If the block is a dead Default block that will be deleted later, don't
54473471bf0Spatrick     // waste time processing it.
545*d415bd75Srobert     if (DeleteList.count(&Cur))
54673471bf0Spatrick       continue;
54773471bf0Spatrick 
548*d415bd75Srobert     if (SwitchInst *SI = dyn_cast<SwitchInst>(Cur.getTerminator())) {
54973471bf0Spatrick       Changed = true;
55073471bf0Spatrick       ProcessSwitchInst(SI, DeleteList, AC, LVI);
55173471bf0Spatrick     }
55273471bf0Spatrick   }
55373471bf0Spatrick 
55473471bf0Spatrick   for (BasicBlock *BB : DeleteList) {
55573471bf0Spatrick     LVI->eraseBlock(BB);
55673471bf0Spatrick     DeleteDeadBlock(BB);
55773471bf0Spatrick   }
55873471bf0Spatrick 
55973471bf0Spatrick   return Changed;
56073471bf0Spatrick }
56173471bf0Spatrick 
56273471bf0Spatrick /// Replace all SwitchInst instructions with chained branch instructions.
56373471bf0Spatrick class LowerSwitchLegacyPass : public FunctionPass {
56473471bf0Spatrick public:
56573471bf0Spatrick   // Pass identification, replacement for typeid
56673471bf0Spatrick   static char ID;
56773471bf0Spatrick 
LowerSwitchLegacyPass()56873471bf0Spatrick   LowerSwitchLegacyPass() : FunctionPass(ID) {
56973471bf0Spatrick     initializeLowerSwitchLegacyPassPass(*PassRegistry::getPassRegistry());
57073471bf0Spatrick   }
57173471bf0Spatrick 
57273471bf0Spatrick   bool runOnFunction(Function &F) override;
57373471bf0Spatrick 
getAnalysisUsage(AnalysisUsage & AU) const57473471bf0Spatrick   void getAnalysisUsage(AnalysisUsage &AU) const override {
57573471bf0Spatrick     AU.addRequired<LazyValueInfoWrapperPass>();
57673471bf0Spatrick   }
57773471bf0Spatrick };
57873471bf0Spatrick 
57973471bf0Spatrick } // end anonymous namespace
58073471bf0Spatrick 
58173471bf0Spatrick char LowerSwitchLegacyPass::ID = 0;
58273471bf0Spatrick 
58373471bf0Spatrick // Publicly exposed interface to pass...
58473471bf0Spatrick char &llvm::LowerSwitchID = LowerSwitchLegacyPass::ID;
58573471bf0Spatrick 
58673471bf0Spatrick INITIALIZE_PASS_BEGIN(LowerSwitchLegacyPass, "lowerswitch",
58773471bf0Spatrick                       "Lower SwitchInst's to branches", false, false)
INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)58873471bf0Spatrick INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)
58973471bf0Spatrick INITIALIZE_PASS_DEPENDENCY(LazyValueInfoWrapperPass)
59073471bf0Spatrick INITIALIZE_PASS_END(LowerSwitchLegacyPass, "lowerswitch",
59173471bf0Spatrick                     "Lower SwitchInst's to branches", false, false)
59273471bf0Spatrick 
59373471bf0Spatrick // createLowerSwitchPass - Interface to this file...
59473471bf0Spatrick FunctionPass *llvm::createLowerSwitchPass() {
59573471bf0Spatrick   return new LowerSwitchLegacyPass();
59673471bf0Spatrick }
59773471bf0Spatrick 
runOnFunction(Function & F)59873471bf0Spatrick bool LowerSwitchLegacyPass::runOnFunction(Function &F) {
59973471bf0Spatrick   LazyValueInfo *LVI = &getAnalysis<LazyValueInfoWrapperPass>().getLVI();
60073471bf0Spatrick   auto *ACT = getAnalysisIfAvailable<AssumptionCacheTracker>();
60173471bf0Spatrick   AssumptionCache *AC = ACT ? &ACT->getAssumptionCache(F) : nullptr;
60273471bf0Spatrick   return LowerSwitch(F, LVI, AC);
60373471bf0Spatrick }
60473471bf0Spatrick 
run(Function & F,FunctionAnalysisManager & AM)60573471bf0Spatrick PreservedAnalyses LowerSwitchPass::run(Function &F,
60673471bf0Spatrick                                        FunctionAnalysisManager &AM) {
60773471bf0Spatrick   LazyValueInfo *LVI = &AM.getResult<LazyValueAnalysis>(F);
60873471bf0Spatrick   AssumptionCache *AC = AM.getCachedResult<AssumptionAnalysis>(F);
60973471bf0Spatrick   return LowerSwitch(F, LVI, AC) ? PreservedAnalyses::none()
61073471bf0Spatrick                                  : PreservedAnalyses::all();
61173471bf0Spatrick }
612