109467b48Spatrick //===- LowerSwitch.cpp - Eliminate Switch instructions --------------------===//
209467b48Spatrick //
309467b48Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
409467b48Spatrick // See https://llvm.org/LICENSE.txt for license information.
509467b48Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
609467b48Spatrick //
709467b48Spatrick //===----------------------------------------------------------------------===//
809467b48Spatrick //
909467b48Spatrick // The LowerSwitch transformation rewrites switch instructions with a sequence
1009467b48Spatrick // of branches, which allows targets to get away with not implementing the
1109467b48Spatrick // switch instruction until it is convenient.
1209467b48Spatrick //
1309467b48Spatrick //===----------------------------------------------------------------------===//
1409467b48Spatrick
1573471bf0Spatrick #include "llvm/Transforms/Utils/LowerSwitch.h"
1609467b48Spatrick #include "llvm/ADT/DenseMap.h"
1709467b48Spatrick #include "llvm/ADT/STLExtras.h"
1809467b48Spatrick #include "llvm/ADT/SmallPtrSet.h"
1909467b48Spatrick #include "llvm/ADT/SmallVector.h"
2009467b48Spatrick #include "llvm/Analysis/AssumptionCache.h"
2109467b48Spatrick #include "llvm/Analysis/LazyValueInfo.h"
2209467b48Spatrick #include "llvm/Analysis/ValueTracking.h"
2309467b48Spatrick #include "llvm/IR/BasicBlock.h"
2409467b48Spatrick #include "llvm/IR/CFG.h"
2509467b48Spatrick #include "llvm/IR/ConstantRange.h"
2609467b48Spatrick #include "llvm/IR/Constants.h"
2709467b48Spatrick #include "llvm/IR/Function.h"
2809467b48Spatrick #include "llvm/IR/InstrTypes.h"
2909467b48Spatrick #include "llvm/IR/Instructions.h"
3073471bf0Spatrick #include "llvm/IR/PassManager.h"
3109467b48Spatrick #include "llvm/IR/Value.h"
3209467b48Spatrick #include "llvm/InitializePasses.h"
3309467b48Spatrick #include "llvm/Pass.h"
3409467b48Spatrick #include "llvm/Support/Casting.h"
3509467b48Spatrick #include "llvm/Support/Compiler.h"
3609467b48Spatrick #include "llvm/Support/Debug.h"
3709467b48Spatrick #include "llvm/Support/KnownBits.h"
3809467b48Spatrick #include "llvm/Support/raw_ostream.h"
3909467b48Spatrick #include "llvm/Transforms/Utils.h"
4009467b48Spatrick #include "llvm/Transforms/Utils/BasicBlockUtils.h"
4109467b48Spatrick #include <algorithm>
4209467b48Spatrick #include <cassert>
4309467b48Spatrick #include <cstdint>
4409467b48Spatrick #include <iterator>
4509467b48Spatrick #include <limits>
4609467b48Spatrick #include <vector>
4709467b48Spatrick
4809467b48Spatrick using namespace llvm;
4909467b48Spatrick
5009467b48Spatrick #define DEBUG_TYPE "lower-switch"
5109467b48Spatrick
5209467b48Spatrick namespace {
5309467b48Spatrick
5409467b48Spatrick struct IntRange {
55*d415bd75Srobert APInt Low, High;
5609467b48Spatrick };
5709467b48Spatrick
5809467b48Spatrick } // end anonymous namespace
5909467b48Spatrick
6073471bf0Spatrick namespace {
6109467b48Spatrick // Return true iff R is covered by Ranges.
IsInRanges(const IntRange & R,const std::vector<IntRange> & Ranges)6273471bf0Spatrick bool IsInRanges(const IntRange &R, const std::vector<IntRange> &Ranges) {
6309467b48Spatrick // Note: Ranges must be sorted, non-overlapping and non-adjacent.
6409467b48Spatrick
6509467b48Spatrick // Find the first range whose High field is >= R.High,
6609467b48Spatrick // then check if the Low field is <= R.Low. If so, we
6709467b48Spatrick // have a Range that covers R.
6809467b48Spatrick auto I = llvm::lower_bound(
69*d415bd75Srobert Ranges, R, [](IntRange A, IntRange B) { return A.High.slt(B.High); });
70*d415bd75Srobert return I != Ranges.end() && I->Low.sle(R.Low);
7109467b48Spatrick }
7209467b48Spatrick
7309467b48Spatrick struct CaseRange {
7409467b48Spatrick ConstantInt *Low;
7509467b48Spatrick ConstantInt *High;
7609467b48Spatrick BasicBlock *BB;
7709467b48Spatrick
CaseRange__anon9f57d2800211::CaseRange7809467b48Spatrick CaseRange(ConstantInt *low, ConstantInt *high, BasicBlock *bb)
7909467b48Spatrick : Low(low), High(high), BB(bb) {}
8009467b48Spatrick };
8109467b48Spatrick
8209467b48Spatrick using CaseVector = std::vector<CaseRange>;
8309467b48Spatrick using CaseItr = std::vector<CaseRange>::iterator;
8409467b48Spatrick
8509467b48Spatrick /// The comparison function for sorting the switch case values in the vector.
8609467b48Spatrick /// WARNING: Case ranges should be disjoint!
8709467b48Spatrick struct CaseCmp {
operator ()__anon9f57d2800211::CaseCmp8873471bf0Spatrick bool operator()(const CaseRange &C1, const CaseRange &C2) {
8909467b48Spatrick const ConstantInt *CI1 = cast<const ConstantInt>(C1.Low);
9009467b48Spatrick const ConstantInt *CI2 = cast<const ConstantInt>(C2.High);
9109467b48Spatrick return CI1->getValue().slt(CI2->getValue());
9209467b48Spatrick }
9309467b48Spatrick };
9409467b48Spatrick
9509467b48Spatrick /// Used for debugging purposes.
9609467b48Spatrick LLVM_ATTRIBUTE_USED
operator <<(raw_ostream & O,const CaseVector & C)9773471bf0Spatrick raw_ostream &operator<<(raw_ostream &O, const CaseVector &C) {
9809467b48Spatrick O << "[";
9909467b48Spatrick
10073471bf0Spatrick for (CaseVector::const_iterator B = C.begin(), E = C.end(); B != E;) {
10109467b48Spatrick O << "[" << B->Low->getValue() << ", " << B->High->getValue() << "]";
10209467b48Spatrick if (++B != E)
10309467b48Spatrick O << ", ";
10409467b48Spatrick }
10509467b48Spatrick
10609467b48Spatrick return O << "]";
10709467b48Spatrick }
10809467b48Spatrick
10909467b48Spatrick /// Update the first occurrence of the "switch statement" BB in the PHI
11009467b48Spatrick /// node with the "new" BB. The other occurrences will:
11109467b48Spatrick ///
11209467b48Spatrick /// 1) Be updated by subsequent calls to this function. Switch statements may
11309467b48Spatrick /// have more than one outcoming edge into the same BB if they all have the same
11409467b48Spatrick /// value. When the switch statement is converted these incoming edges are now
11509467b48Spatrick /// coming from multiple BBs.
11609467b48Spatrick /// 2) Removed if subsequent incoming values now share the same case, i.e.,
11709467b48Spatrick /// multiple outcome edges are condensed into one. This is necessary to keep the
11809467b48Spatrick /// number of phi values equal to the number of branches to SuccBB.
FixPhis(BasicBlock * SuccBB,BasicBlock * OrigBB,BasicBlock * NewBB,const APInt & NumMergedCases)119*d415bd75Srobert void FixPhis(BasicBlock *SuccBB, BasicBlock *OrigBB, BasicBlock *NewBB,
120*d415bd75Srobert const APInt &NumMergedCases) {
121*d415bd75Srobert for (auto &I : SuccBB->phis()) {
122*d415bd75Srobert PHINode *PN = cast<PHINode>(&I);
12309467b48Spatrick
124*d415bd75Srobert // Only update the first occurrence if NewBB exists.
12509467b48Spatrick unsigned Idx = 0, E = PN->getNumIncomingValues();
126*d415bd75Srobert APInt LocalNumMergedCases = NumMergedCases;
127*d415bd75Srobert for (; Idx != E && NewBB; ++Idx) {
12809467b48Spatrick if (PN->getIncomingBlock(Idx) == OrigBB) {
12909467b48Spatrick PN->setIncomingBlock(Idx, NewBB);
13009467b48Spatrick break;
13109467b48Spatrick }
13209467b48Spatrick }
13309467b48Spatrick
134*d415bd75Srobert // Skip the updated incoming block so that it will not be removed.
135*d415bd75Srobert if (NewBB)
136*d415bd75Srobert ++Idx;
137*d415bd75Srobert
13809467b48Spatrick // Remove additional occurrences coming from condensed cases and keep the
13909467b48Spatrick // number of incoming values equal to the number of branches to SuccBB.
14009467b48Spatrick SmallVector<unsigned, 8> Indices;
141*d415bd75Srobert for (; LocalNumMergedCases.ugt(0) && Idx < E; ++Idx)
14209467b48Spatrick if (PN->getIncomingBlock(Idx) == OrigBB) {
14309467b48Spatrick Indices.push_back(Idx);
144*d415bd75Srobert LocalNumMergedCases -= 1;
14509467b48Spatrick }
14609467b48Spatrick // Remove incoming values in the reverse order to prevent invalidating
14709467b48Spatrick // *successive* index.
14809467b48Spatrick for (unsigned III : llvm::reverse(Indices))
14909467b48Spatrick PN->removeIncomingValue(III);
15009467b48Spatrick }
15109467b48Spatrick }
15209467b48Spatrick
15373471bf0Spatrick /// Create a new leaf block for the binary lookup tree. It checks if the
15473471bf0Spatrick /// switch's value == the case's value. If not, then it jumps to the default
15573471bf0Spatrick /// branch. At this point in the tree, the value can't be another valid case
15673471bf0Spatrick /// value, so the jump to the "default" branch is warranted.
NewLeafBlock(CaseRange & Leaf,Value * Val,ConstantInt * LowerBound,ConstantInt * UpperBound,BasicBlock * OrigBlock,BasicBlock * Default)15773471bf0Spatrick BasicBlock *NewLeafBlock(CaseRange &Leaf, Value *Val, ConstantInt *LowerBound,
15873471bf0Spatrick ConstantInt *UpperBound, BasicBlock *OrigBlock,
15973471bf0Spatrick BasicBlock *Default) {
16073471bf0Spatrick Function *F = OrigBlock->getParent();
16173471bf0Spatrick BasicBlock *NewLeaf = BasicBlock::Create(Val->getContext(), "LeafBlock");
162*d415bd75Srobert F->insert(++OrigBlock->getIterator(), NewLeaf);
16373471bf0Spatrick
16473471bf0Spatrick // Emit comparison
16573471bf0Spatrick ICmpInst *Comp = nullptr;
16673471bf0Spatrick if (Leaf.Low == Leaf.High) {
16773471bf0Spatrick // Make the seteq instruction...
16873471bf0Spatrick Comp =
16973471bf0Spatrick new ICmpInst(*NewLeaf, ICmpInst::ICMP_EQ, Val, Leaf.Low, "SwitchLeaf");
17073471bf0Spatrick } else {
17173471bf0Spatrick // Make range comparison
17273471bf0Spatrick if (Leaf.Low == LowerBound) {
17373471bf0Spatrick // Val >= Min && Val <= Hi --> Val <= Hi
17473471bf0Spatrick Comp = new ICmpInst(*NewLeaf, ICmpInst::ICMP_SLE, Val, Leaf.High,
17573471bf0Spatrick "SwitchLeaf");
17673471bf0Spatrick } else if (Leaf.High == UpperBound) {
17773471bf0Spatrick // Val <= Max && Val >= Lo --> Val >= Lo
17873471bf0Spatrick Comp = new ICmpInst(*NewLeaf, ICmpInst::ICMP_SGE, Val, Leaf.Low,
17973471bf0Spatrick "SwitchLeaf");
18073471bf0Spatrick } else if (Leaf.Low->isZero()) {
18173471bf0Spatrick // Val >= 0 && Val <= Hi --> Val <=u Hi
18273471bf0Spatrick Comp = new ICmpInst(*NewLeaf, ICmpInst::ICMP_ULE, Val, Leaf.High,
18373471bf0Spatrick "SwitchLeaf");
18473471bf0Spatrick } else {
18573471bf0Spatrick // Emit V-Lo <=u Hi-Lo
18673471bf0Spatrick Constant *NegLo = ConstantExpr::getNeg(Leaf.Low);
18773471bf0Spatrick Instruction *Add = BinaryOperator::CreateAdd(
18873471bf0Spatrick Val, NegLo, Val->getName() + ".off", NewLeaf);
18973471bf0Spatrick Constant *UpperBound = ConstantExpr::getAdd(NegLo, Leaf.High);
19073471bf0Spatrick Comp = new ICmpInst(*NewLeaf, ICmpInst::ICMP_ULE, Add, UpperBound,
19173471bf0Spatrick "SwitchLeaf");
19273471bf0Spatrick }
19373471bf0Spatrick }
19473471bf0Spatrick
19573471bf0Spatrick // Make the conditional branch...
19673471bf0Spatrick BasicBlock *Succ = Leaf.BB;
19773471bf0Spatrick BranchInst::Create(Succ, Default, Comp, NewLeaf);
19873471bf0Spatrick
199*d415bd75Srobert // Update the PHI incoming value/block for the default.
200*d415bd75Srobert for (auto &I : Default->phis()) {
201*d415bd75Srobert PHINode *PN = cast<PHINode>(&I);
202*d415bd75Srobert auto *V = PN->getIncomingValueForBlock(OrigBlock);
203*d415bd75Srobert PN->addIncoming(V, NewLeaf);
204*d415bd75Srobert }
205*d415bd75Srobert
20673471bf0Spatrick // If there were any PHI nodes in this successor, rewrite one entry
20773471bf0Spatrick // from OrigBlock to come from NewLeaf.
20873471bf0Spatrick for (BasicBlock::iterator I = Succ->begin(); isa<PHINode>(I); ++I) {
20973471bf0Spatrick PHINode *PN = cast<PHINode>(I);
21073471bf0Spatrick // Remove all but one incoming entries from the cluster
211*d415bd75Srobert APInt Range = Leaf.High->getValue() - Leaf.Low->getValue();
212*d415bd75Srobert for (APInt j(Range.getBitWidth(), 0, true); j.slt(Range); ++j) {
21373471bf0Spatrick PN->removeIncomingValue(OrigBlock);
21473471bf0Spatrick }
21573471bf0Spatrick
21673471bf0Spatrick int BlockIdx = PN->getBasicBlockIndex(OrigBlock);
21773471bf0Spatrick assert(BlockIdx != -1 && "Switch didn't go to this successor??");
21873471bf0Spatrick PN->setIncomingBlock((unsigned)BlockIdx, NewLeaf);
21973471bf0Spatrick }
22073471bf0Spatrick
22173471bf0Spatrick return NewLeaf;
22273471bf0Spatrick }
22373471bf0Spatrick
22409467b48Spatrick /// Convert the switch statement into a binary lookup of the case values.
22509467b48Spatrick /// The function recursively builds this tree. LowerBound and UpperBound are
22609467b48Spatrick /// used to keep track of the bounds for Val that have already been checked by
22709467b48Spatrick /// a block emitted by one of the previous calls to switchConvert in the call
22809467b48Spatrick /// stack.
SwitchConvert(CaseItr Begin,CaseItr End,ConstantInt * LowerBound,ConstantInt * UpperBound,Value * Val,BasicBlock * Predecessor,BasicBlock * OrigBlock,BasicBlock * Default,const std::vector<IntRange> & UnreachableRanges)22973471bf0Spatrick BasicBlock *SwitchConvert(CaseItr Begin, CaseItr End, ConstantInt *LowerBound,
23009467b48Spatrick ConstantInt *UpperBound, Value *Val,
23109467b48Spatrick BasicBlock *Predecessor, BasicBlock *OrigBlock,
23209467b48Spatrick BasicBlock *Default,
23309467b48Spatrick const std::vector<IntRange> &UnreachableRanges) {
23409467b48Spatrick assert(LowerBound && UpperBound && "Bounds must be initialized");
23509467b48Spatrick unsigned Size = End - Begin;
23609467b48Spatrick
23709467b48Spatrick if (Size == 1) {
23809467b48Spatrick // Check if the Case Range is perfectly squeezed in between
23909467b48Spatrick // already checked Upper and Lower bounds. If it is then we can avoid
24009467b48Spatrick // emitting the code that checks if the value actually falls in the range
24109467b48Spatrick // because the bounds already tell us so.
24209467b48Spatrick if (Begin->Low == LowerBound && Begin->High == UpperBound) {
243*d415bd75Srobert APInt NumMergedCases = UpperBound->getValue() - LowerBound->getValue();
24473471bf0Spatrick FixPhis(Begin->BB, OrigBlock, Predecessor, NumMergedCases);
24509467b48Spatrick return Begin->BB;
24609467b48Spatrick }
24773471bf0Spatrick return NewLeafBlock(*Begin, Val, LowerBound, UpperBound, OrigBlock,
24809467b48Spatrick Default);
24909467b48Spatrick }
25009467b48Spatrick
25109467b48Spatrick unsigned Mid = Size / 2;
25209467b48Spatrick std::vector<CaseRange> LHS(Begin, Begin + Mid);
25309467b48Spatrick LLVM_DEBUG(dbgs() << "LHS: " << LHS << "\n");
25409467b48Spatrick std::vector<CaseRange> RHS(Begin + Mid, End);
25509467b48Spatrick LLVM_DEBUG(dbgs() << "RHS: " << RHS << "\n");
25609467b48Spatrick
25709467b48Spatrick CaseRange &Pivot = *(Begin + Mid);
25809467b48Spatrick LLVM_DEBUG(dbgs() << "Pivot ==> [" << Pivot.Low->getValue() << ", "
25909467b48Spatrick << Pivot.High->getValue() << "]\n");
26009467b48Spatrick
26109467b48Spatrick // NewLowerBound here should never be the integer minimal value.
26209467b48Spatrick // This is because it is computed from a case range that is never
26309467b48Spatrick // the smallest, so there is always a case range that has at least
26409467b48Spatrick // a smaller value.
26509467b48Spatrick ConstantInt *NewLowerBound = Pivot.Low;
26609467b48Spatrick
26709467b48Spatrick // Because NewLowerBound is never the smallest representable integer
26809467b48Spatrick // it is safe here to subtract one.
26909467b48Spatrick ConstantInt *NewUpperBound = ConstantInt::get(NewLowerBound->getContext(),
27009467b48Spatrick NewLowerBound->getValue() - 1);
27109467b48Spatrick
27209467b48Spatrick if (!UnreachableRanges.empty()) {
27309467b48Spatrick // Check if the gap between LHS's highest and NewLowerBound is unreachable.
274*d415bd75Srobert APInt GapLow = LHS.back().High->getValue() + 1;
275*d415bd75Srobert APInt GapHigh = NewLowerBound->getValue() - 1;
27609467b48Spatrick IntRange Gap = {GapLow, GapHigh};
277*d415bd75Srobert if (GapHigh.sge(GapLow) && IsInRanges(Gap, UnreachableRanges))
27809467b48Spatrick NewUpperBound = LHS.back().High;
27909467b48Spatrick }
28009467b48Spatrick
281*d415bd75Srobert LLVM_DEBUG(dbgs() << "LHS Bounds ==> [" << LowerBound->getValue() << ", "
282*d415bd75Srobert << NewUpperBound->getValue() << "]\n"
283*d415bd75Srobert << "RHS Bounds ==> [" << NewLowerBound->getValue() << ", "
284*d415bd75Srobert << UpperBound->getValue() << "]\n");
28509467b48Spatrick
28609467b48Spatrick // Create a new node that checks if the value is < pivot. Go to the
28709467b48Spatrick // left branch if it is and right branch if not.
28809467b48Spatrick Function *F = OrigBlock->getParent();
28909467b48Spatrick BasicBlock *NewNode = BasicBlock::Create(Val->getContext(), "NodeBlock");
29009467b48Spatrick
291*d415bd75Srobert ICmpInst *Comp = new ICmpInst(ICmpInst::ICMP_SLT, Val, Pivot.Low, "Pivot");
29209467b48Spatrick
29373471bf0Spatrick BasicBlock *LBranch =
29473471bf0Spatrick SwitchConvert(LHS.begin(), LHS.end(), LowerBound, NewUpperBound, Val,
29573471bf0Spatrick NewNode, OrigBlock, Default, UnreachableRanges);
29673471bf0Spatrick BasicBlock *RBranch =
29773471bf0Spatrick SwitchConvert(RHS.begin(), RHS.end(), NewLowerBound, UpperBound, Val,
29873471bf0Spatrick NewNode, OrigBlock, Default, UnreachableRanges);
29909467b48Spatrick
300*d415bd75Srobert F->insert(++OrigBlock->getIterator(), NewNode);
301*d415bd75Srobert Comp->insertInto(NewNode, NewNode->end());
30209467b48Spatrick
30309467b48Spatrick BranchInst::Create(LBranch, RBranch, Comp, NewNode);
30409467b48Spatrick return NewNode;
30509467b48Spatrick }
30609467b48Spatrick
30709467b48Spatrick /// Transform simple list of \p SI's cases into list of CaseRange's \p Cases.
30809467b48Spatrick /// \post \p Cases wouldn't contain references to \p SI's default BB.
30909467b48Spatrick /// \returns Number of \p SI's cases that do not reference \p SI's default BB.
Clusterify(CaseVector & Cases,SwitchInst * SI)31073471bf0Spatrick unsigned Clusterify(CaseVector &Cases, SwitchInst *SI) {
31109467b48Spatrick unsigned NumSimpleCases = 0;
31209467b48Spatrick
31309467b48Spatrick // Start with "simple" cases
31409467b48Spatrick for (auto Case : SI->cases()) {
31509467b48Spatrick if (Case.getCaseSuccessor() == SI->getDefaultDest())
31609467b48Spatrick continue;
31709467b48Spatrick Cases.push_back(CaseRange(Case.getCaseValue(), Case.getCaseValue(),
31809467b48Spatrick Case.getCaseSuccessor()));
31909467b48Spatrick ++NumSimpleCases;
32009467b48Spatrick }
32109467b48Spatrick
32209467b48Spatrick llvm::sort(Cases, CaseCmp());
32309467b48Spatrick
32409467b48Spatrick // Merge case into clusters
32509467b48Spatrick if (Cases.size() >= 2) {
32609467b48Spatrick CaseItr I = Cases.begin();
32709467b48Spatrick for (CaseItr J = std::next(I), E = Cases.end(); J != E; ++J) {
328*d415bd75Srobert const APInt &nextValue = J->Low->getValue();
329*d415bd75Srobert const APInt ¤tValue = I->High->getValue();
33009467b48Spatrick BasicBlock *nextBB = J->BB;
33109467b48Spatrick BasicBlock *currentBB = I->BB;
33209467b48Spatrick
33309467b48Spatrick // If the two neighboring cases go to the same destination, merge them
33409467b48Spatrick // into a single case.
335*d415bd75Srobert assert(nextValue.sgt(currentValue) &&
336*d415bd75Srobert "Cases should be strictly ascending");
33709467b48Spatrick if ((nextValue == currentValue + 1) && (currentBB == nextBB)) {
33809467b48Spatrick I->High = J->High;
33909467b48Spatrick // FIXME: Combine branch weights.
34009467b48Spatrick } else if (++I != J) {
34109467b48Spatrick *I = *J;
34209467b48Spatrick }
34309467b48Spatrick }
34409467b48Spatrick Cases.erase(std::next(I), Cases.end());
34509467b48Spatrick }
34609467b48Spatrick
34709467b48Spatrick return NumSimpleCases;
34809467b48Spatrick }
34909467b48Spatrick
35009467b48Spatrick /// Replace the specified switch instruction with a sequence of chained if-then
35109467b48Spatrick /// insts in a balanced binary search.
ProcessSwitchInst(SwitchInst * SI,SmallPtrSetImpl<BasicBlock * > & DeleteList,AssumptionCache * AC,LazyValueInfo * LVI)35273471bf0Spatrick void ProcessSwitchInst(SwitchInst *SI,
35309467b48Spatrick SmallPtrSetImpl<BasicBlock *> &DeleteList,
35409467b48Spatrick AssumptionCache *AC, LazyValueInfo *LVI) {
35509467b48Spatrick BasicBlock *OrigBlock = SI->getParent();
35609467b48Spatrick Function *F = OrigBlock->getParent();
35709467b48Spatrick Value *Val = SI->getCondition(); // The value we are switching on...
35809467b48Spatrick BasicBlock *Default = SI->getDefaultDest();
35909467b48Spatrick
36009467b48Spatrick // Don't handle unreachable blocks. If there are successors with phis, this
36109467b48Spatrick // would leave them behind with missing predecessors.
36209467b48Spatrick if ((OrigBlock != &F->getEntryBlock() && pred_empty(OrigBlock)) ||
36309467b48Spatrick OrigBlock->getSinglePredecessor() == OrigBlock) {
36409467b48Spatrick DeleteList.insert(OrigBlock);
36509467b48Spatrick return;
36609467b48Spatrick }
36709467b48Spatrick
36809467b48Spatrick // Prepare cases vector.
36909467b48Spatrick CaseVector Cases;
37009467b48Spatrick const unsigned NumSimpleCases = Clusterify(Cases, SI);
371*d415bd75Srobert IntegerType *IT = cast<IntegerType>(SI->getCondition()->getType());
372*d415bd75Srobert const unsigned BitWidth = IT->getBitWidth();
373*d415bd75Srobert // Explictly use higher precision to prevent unsigned overflow where
374*d415bd75Srobert // `UnsignedMax - 0 + 1 == 0`
375*d415bd75Srobert APInt UnsignedZero(BitWidth + 1, 0);
376*d415bd75Srobert APInt UnsignedMax = APInt::getMaxValue(BitWidth);
37709467b48Spatrick LLVM_DEBUG(dbgs() << "Clusterify finished. Total clusters: " << Cases.size()
37809467b48Spatrick << ". Total non-default cases: " << NumSimpleCases
37909467b48Spatrick << "\nCase clusters: " << Cases << "\n");
38009467b48Spatrick
38109467b48Spatrick // If there is only the default destination, just branch.
38209467b48Spatrick if (Cases.empty()) {
38309467b48Spatrick BranchInst::Create(Default, OrigBlock);
38409467b48Spatrick // Remove all the references from Default's PHIs to OrigBlock, but one.
385*d415bd75Srobert FixPhis(Default, OrigBlock, OrigBlock, UnsignedMax);
38609467b48Spatrick SI->eraseFromParent();
38709467b48Spatrick return;
38809467b48Spatrick }
38909467b48Spatrick
39009467b48Spatrick ConstantInt *LowerBound = nullptr;
39109467b48Spatrick ConstantInt *UpperBound = nullptr;
39209467b48Spatrick bool DefaultIsUnreachableFromSwitch = false;
39309467b48Spatrick
39409467b48Spatrick if (isa<UnreachableInst>(Default->getFirstNonPHIOrDbg())) {
39509467b48Spatrick // Make the bounds tightly fitted around the case value range, because we
39609467b48Spatrick // know that the value passed to the switch must be exactly one of the case
39709467b48Spatrick // values.
39809467b48Spatrick LowerBound = Cases.front().Low;
39909467b48Spatrick UpperBound = Cases.back().High;
40009467b48Spatrick DefaultIsUnreachableFromSwitch = true;
40109467b48Spatrick } else {
40209467b48Spatrick // Constraining the range of the value being switched over helps eliminating
40309467b48Spatrick // unreachable BBs and minimizing the number of `add` instructions
40409467b48Spatrick // newLeafBlock ends up emitting. Running CorrelatedValuePropagation after
40509467b48Spatrick // LowerSwitch isn't as good, and also much more expensive in terms of
40609467b48Spatrick // compile time for the following reasons:
40709467b48Spatrick // 1. it processes many kinds of instructions, not just switches;
40809467b48Spatrick // 2. even if limited to icmp instructions only, it will have to process
40909467b48Spatrick // roughly C icmp's per switch, where C is the number of cases in the
41009467b48Spatrick // switch, while LowerSwitch only needs to call LVI once per switch.
41109467b48Spatrick const DataLayout &DL = F->getParent()->getDataLayout();
41209467b48Spatrick KnownBits Known = computeKnownBits(Val, DL, /*Depth=*/0, AC, SI);
41309467b48Spatrick // TODO Shouldn't this create a signed range?
41409467b48Spatrick ConstantRange KnownBitsRange =
41509467b48Spatrick ConstantRange::fromKnownBits(Known, /*IsSigned=*/false);
41673471bf0Spatrick const ConstantRange LVIRange = LVI->getConstantRange(Val, SI);
41709467b48Spatrick ConstantRange ValRange = KnownBitsRange.intersectWith(LVIRange);
41809467b48Spatrick // We delegate removal of unreachable non-default cases to other passes. In
41909467b48Spatrick // the unlikely event that some of them survived, we just conservatively
42009467b48Spatrick // maintain the invariant that all the cases lie between the bounds. This
42109467b48Spatrick // may, however, still render the default case effectively unreachable.
422*d415bd75Srobert const APInt &Low = Cases.front().Low->getValue();
423*d415bd75Srobert const APInt &High = Cases.back().High->getValue();
42409467b48Spatrick APInt Min = APIntOps::smin(ValRange.getSignedMin(), Low);
42509467b48Spatrick APInt Max = APIntOps::smax(ValRange.getSignedMax(), High);
42609467b48Spatrick
42709467b48Spatrick LowerBound = ConstantInt::get(SI->getContext(), Min);
42809467b48Spatrick UpperBound = ConstantInt::get(SI->getContext(), Max);
42909467b48Spatrick DefaultIsUnreachableFromSwitch = (Min + (NumSimpleCases - 1) == Max);
43009467b48Spatrick }
43109467b48Spatrick
43209467b48Spatrick std::vector<IntRange> UnreachableRanges;
43309467b48Spatrick
43409467b48Spatrick if (DefaultIsUnreachableFromSwitch) {
435*d415bd75Srobert DenseMap<BasicBlock *, APInt> Popularity;
436*d415bd75Srobert APInt MaxPop(UnsignedZero);
43709467b48Spatrick BasicBlock *PopSucc = nullptr;
43809467b48Spatrick
439*d415bd75Srobert APInt SignedMax = APInt::getSignedMaxValue(BitWidth);
440*d415bd75Srobert APInt SignedMin = APInt::getSignedMinValue(BitWidth);
441*d415bd75Srobert IntRange R = {SignedMin, SignedMax};
44209467b48Spatrick UnreachableRanges.push_back(R);
44309467b48Spatrick for (const auto &I : Cases) {
444*d415bd75Srobert const APInt &Low = I.Low->getValue();
445*d415bd75Srobert const APInt &High = I.High->getValue();
44609467b48Spatrick
44709467b48Spatrick IntRange &LastRange = UnreachableRanges.back();
448*d415bd75Srobert if (LastRange.Low.eq(Low)) {
44909467b48Spatrick // There is nothing left of the previous range.
45009467b48Spatrick UnreachableRanges.pop_back();
45109467b48Spatrick } else {
45209467b48Spatrick // Terminate the previous range.
453*d415bd75Srobert assert(Low.sgt(LastRange.Low));
45409467b48Spatrick LastRange.High = Low - 1;
45509467b48Spatrick }
456*d415bd75Srobert if (High.ne(SignedMax)) {
457*d415bd75Srobert IntRange R = {High + 1, SignedMax};
45809467b48Spatrick UnreachableRanges.push_back(R);
45909467b48Spatrick }
46009467b48Spatrick
46109467b48Spatrick // Count popularity.
462*d415bd75Srobert assert(High.sge(Low) && "Popularity shouldn't be negative.");
463*d415bd75Srobert APInt N = High.sext(BitWidth + 1) - Low.sext(BitWidth + 1) + 1;
464*d415bd75Srobert // Explict insert to make sure the bitwidth of APInts match
465*d415bd75Srobert APInt &Pop = Popularity.insert({I.BB, APInt(UnsignedZero)}).first->second;
466*d415bd75Srobert if ((Pop += N).ugt(MaxPop)) {
46709467b48Spatrick MaxPop = Pop;
46809467b48Spatrick PopSucc = I.BB;
46909467b48Spatrick }
47009467b48Spatrick }
47109467b48Spatrick #ifndef NDEBUG
47209467b48Spatrick /* UnreachableRanges should be sorted and the ranges non-adjacent. */
47309467b48Spatrick for (auto I = UnreachableRanges.begin(), E = UnreachableRanges.end();
47409467b48Spatrick I != E; ++I) {
475*d415bd75Srobert assert(I->Low.sle(I->High));
47609467b48Spatrick auto Next = I + 1;
47709467b48Spatrick if (Next != E) {
478*d415bd75Srobert assert(Next->Low.sgt(I->High));
47909467b48Spatrick }
48009467b48Spatrick }
48109467b48Spatrick #endif
48209467b48Spatrick
48309467b48Spatrick // As the default block in the switch is unreachable, update the PHI nodes
48409467b48Spatrick // (remove all of the references to the default block) to reflect this.
48509467b48Spatrick const unsigned NumDefaultEdges = SI->getNumCases() + 1 - NumSimpleCases;
48609467b48Spatrick for (unsigned I = 0; I < NumDefaultEdges; ++I)
48709467b48Spatrick Default->removePredecessor(OrigBlock);
48809467b48Spatrick
48909467b48Spatrick // Use the most popular block as the new default, reducing the number of
49009467b48Spatrick // cases.
49109467b48Spatrick Default = PopSucc;
49273471bf0Spatrick llvm::erase_if(Cases,
49373471bf0Spatrick [PopSucc](const CaseRange &R) { return R.BB == PopSucc; });
49409467b48Spatrick
49509467b48Spatrick // If there are no cases left, just branch.
49609467b48Spatrick if (Cases.empty()) {
49709467b48Spatrick BranchInst::Create(Default, OrigBlock);
49809467b48Spatrick SI->eraseFromParent();
49909467b48Spatrick // As all the cases have been replaced with a single branch, only keep
50009467b48Spatrick // one entry in the PHI nodes.
501*d415bd75Srobert if (!MaxPop.isZero())
502*d415bd75Srobert for (APInt I(UnsignedZero); I.ult(MaxPop - 1); ++I)
50309467b48Spatrick PopSucc->removePredecessor(OrigBlock);
50409467b48Spatrick return;
50509467b48Spatrick }
50609467b48Spatrick
50709467b48Spatrick // If the condition was a PHI node with the switch block as a predecessor
50809467b48Spatrick // removing predecessors may have caused the condition to be erased.
50909467b48Spatrick // Getting the condition value again here protects against that.
51009467b48Spatrick Val = SI->getCondition();
51109467b48Spatrick }
51209467b48Spatrick
51309467b48Spatrick BasicBlock *SwitchBlock =
51473471bf0Spatrick SwitchConvert(Cases.begin(), Cases.end(), LowerBound, UpperBound, Val,
515*d415bd75Srobert OrigBlock, OrigBlock, Default, UnreachableRanges);
51609467b48Spatrick
517*d415bd75Srobert // We have added incoming values for newly-created predecessors in
518*d415bd75Srobert // NewLeafBlock(). The only meaningful work we offload to FixPhis() is to
519*d415bd75Srobert // remove the incoming values from OrigBlock. There might be a special case
520*d415bd75Srobert // that SwitchBlock is the same as Default, under which the PHIs in Default
521*d415bd75Srobert // are fixed inside SwitchConvert().
522*d415bd75Srobert if (SwitchBlock != Default)
523*d415bd75Srobert FixPhis(Default, OrigBlock, nullptr, UnsignedMax);
52409467b48Spatrick
52509467b48Spatrick // Branch to our shiny new if-then stuff...
52609467b48Spatrick BranchInst::Create(SwitchBlock, OrigBlock);
52709467b48Spatrick
52809467b48Spatrick // We are now done with the switch instruction, delete it.
52909467b48Spatrick BasicBlock *OldDefault = SI->getDefaultDest();
530*d415bd75Srobert SI->eraseFromParent();
53109467b48Spatrick
53209467b48Spatrick // If the Default block has no more predecessors just add it to DeleteList.
53373471bf0Spatrick if (pred_empty(OldDefault))
53409467b48Spatrick DeleteList.insert(OldDefault);
53509467b48Spatrick }
53673471bf0Spatrick
LowerSwitch(Function & F,LazyValueInfo * LVI,AssumptionCache * AC)53773471bf0Spatrick bool LowerSwitch(Function &F, LazyValueInfo *LVI, AssumptionCache *AC) {
53873471bf0Spatrick bool Changed = false;
53973471bf0Spatrick SmallPtrSet<BasicBlock *, 8> DeleteList;
54073471bf0Spatrick
541*d415bd75Srobert // We use make_early_inc_range here so that we don't traverse new blocks.
542*d415bd75Srobert for (BasicBlock &Cur : llvm::make_early_inc_range(F)) {
54373471bf0Spatrick // If the block is a dead Default block that will be deleted later, don't
54473471bf0Spatrick // waste time processing it.
545*d415bd75Srobert if (DeleteList.count(&Cur))
54673471bf0Spatrick continue;
54773471bf0Spatrick
548*d415bd75Srobert if (SwitchInst *SI = dyn_cast<SwitchInst>(Cur.getTerminator())) {
54973471bf0Spatrick Changed = true;
55073471bf0Spatrick ProcessSwitchInst(SI, DeleteList, AC, LVI);
55173471bf0Spatrick }
55273471bf0Spatrick }
55373471bf0Spatrick
55473471bf0Spatrick for (BasicBlock *BB : DeleteList) {
55573471bf0Spatrick LVI->eraseBlock(BB);
55673471bf0Spatrick DeleteDeadBlock(BB);
55773471bf0Spatrick }
55873471bf0Spatrick
55973471bf0Spatrick return Changed;
56073471bf0Spatrick }
56173471bf0Spatrick
56273471bf0Spatrick /// Replace all SwitchInst instructions with chained branch instructions.
56373471bf0Spatrick class LowerSwitchLegacyPass : public FunctionPass {
56473471bf0Spatrick public:
56573471bf0Spatrick // Pass identification, replacement for typeid
56673471bf0Spatrick static char ID;
56773471bf0Spatrick
LowerSwitchLegacyPass()56873471bf0Spatrick LowerSwitchLegacyPass() : FunctionPass(ID) {
56973471bf0Spatrick initializeLowerSwitchLegacyPassPass(*PassRegistry::getPassRegistry());
57073471bf0Spatrick }
57173471bf0Spatrick
57273471bf0Spatrick bool runOnFunction(Function &F) override;
57373471bf0Spatrick
getAnalysisUsage(AnalysisUsage & AU) const57473471bf0Spatrick void getAnalysisUsage(AnalysisUsage &AU) const override {
57573471bf0Spatrick AU.addRequired<LazyValueInfoWrapperPass>();
57673471bf0Spatrick }
57773471bf0Spatrick };
57873471bf0Spatrick
57973471bf0Spatrick } // end anonymous namespace
58073471bf0Spatrick
58173471bf0Spatrick char LowerSwitchLegacyPass::ID = 0;
58273471bf0Spatrick
58373471bf0Spatrick // Publicly exposed interface to pass...
58473471bf0Spatrick char &llvm::LowerSwitchID = LowerSwitchLegacyPass::ID;
58573471bf0Spatrick
58673471bf0Spatrick INITIALIZE_PASS_BEGIN(LowerSwitchLegacyPass, "lowerswitch",
58773471bf0Spatrick "Lower SwitchInst's to branches", false, false)
INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)58873471bf0Spatrick INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)
58973471bf0Spatrick INITIALIZE_PASS_DEPENDENCY(LazyValueInfoWrapperPass)
59073471bf0Spatrick INITIALIZE_PASS_END(LowerSwitchLegacyPass, "lowerswitch",
59173471bf0Spatrick "Lower SwitchInst's to branches", false, false)
59273471bf0Spatrick
59373471bf0Spatrick // createLowerSwitchPass - Interface to this file...
59473471bf0Spatrick FunctionPass *llvm::createLowerSwitchPass() {
59573471bf0Spatrick return new LowerSwitchLegacyPass();
59673471bf0Spatrick }
59773471bf0Spatrick
runOnFunction(Function & F)59873471bf0Spatrick bool LowerSwitchLegacyPass::runOnFunction(Function &F) {
59973471bf0Spatrick LazyValueInfo *LVI = &getAnalysis<LazyValueInfoWrapperPass>().getLVI();
60073471bf0Spatrick auto *ACT = getAnalysisIfAvailable<AssumptionCacheTracker>();
60173471bf0Spatrick AssumptionCache *AC = ACT ? &ACT->getAssumptionCache(F) : nullptr;
60273471bf0Spatrick return LowerSwitch(F, LVI, AC);
60373471bf0Spatrick }
60473471bf0Spatrick
run(Function & F,FunctionAnalysisManager & AM)60573471bf0Spatrick PreservedAnalyses LowerSwitchPass::run(Function &F,
60673471bf0Spatrick FunctionAnalysisManager &AM) {
60773471bf0Spatrick LazyValueInfo *LVI = &AM.getResult<LazyValueAnalysis>(F);
60873471bf0Spatrick AssumptionCache *AC = AM.getCachedResult<AssumptionAnalysis>(F);
60973471bf0Spatrick return LowerSwitch(F, LVI, AC) ? PreservedAnalyses::none()
61073471bf0Spatrick : PreservedAnalyses::all();
61173471bf0Spatrick }
612