xref: /freebsd-src/contrib/llvm-project/llvm/lib/Target/AMDGPU/R600MachineCFGStructurizer.cpp (revision 81ad626541db97eb356e2c1d4a20eb2a26a766ab)
1*81ad6265SDimitry Andric //===- R600MachineCFGStructurizer.cpp - CFG Structurizer ------------------===//
2*81ad6265SDimitry Andric //
3*81ad6265SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*81ad6265SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5*81ad6265SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*81ad6265SDimitry Andric //
7*81ad6265SDimitry Andric //==-----------------------------------------------------------------------===//
8*81ad6265SDimitry Andric 
9*81ad6265SDimitry Andric #include "MCTargetDesc/R600MCTargetDesc.h"
10*81ad6265SDimitry Andric #include "R600.h"
11*81ad6265SDimitry Andric #include "R600RegisterInfo.h"
12*81ad6265SDimitry Andric #include "R600Subtarget.h"
13*81ad6265SDimitry Andric #include "llvm/ADT/DepthFirstIterator.h"
14*81ad6265SDimitry Andric #include "llvm/ADT/SCCIterator.h"
15*81ad6265SDimitry Andric #include "llvm/ADT/Statistic.h"
16*81ad6265SDimitry Andric #include "llvm/CodeGen/MachineFunction.h"
17*81ad6265SDimitry Andric #include "llvm/CodeGen/MachineFunctionPass.h"
18*81ad6265SDimitry Andric #include "llvm/CodeGen/MachineJumpTableInfo.h"
19*81ad6265SDimitry Andric #include "llvm/CodeGen/MachineLoopInfo.h"
20*81ad6265SDimitry Andric #include "llvm/CodeGen/MachinePostDominators.h"
21*81ad6265SDimitry Andric #include "llvm/InitializePasses.h"
22*81ad6265SDimitry Andric 
23*81ad6265SDimitry Andric using namespace llvm;
24*81ad6265SDimitry Andric 
25*81ad6265SDimitry Andric #define DEBUG_TYPE "structcfg"
26*81ad6265SDimitry Andric 
27*81ad6265SDimitry Andric #define DEFAULT_VEC_SLOTS 8
28*81ad6265SDimitry Andric 
29*81ad6265SDimitry Andric // TODO: move-begin.
30*81ad6265SDimitry Andric 
31*81ad6265SDimitry Andric //===----------------------------------------------------------------------===//
32*81ad6265SDimitry Andric //
33*81ad6265SDimitry Andric // Statistics for CFGStructurizer.
34*81ad6265SDimitry Andric //
35*81ad6265SDimitry Andric //===----------------------------------------------------------------------===//
36*81ad6265SDimitry Andric 
37*81ad6265SDimitry Andric STATISTIC(numSerialPatternMatch,    "CFGStructurizer number of serial pattern "
38*81ad6265SDimitry Andric     "matched");
39*81ad6265SDimitry Andric STATISTIC(numIfPatternMatch,        "CFGStructurizer number of if pattern "
40*81ad6265SDimitry Andric     "matched");
41*81ad6265SDimitry Andric STATISTIC(numClonedBlock,           "CFGStructurizer cloned blocks");
42*81ad6265SDimitry Andric STATISTIC(numClonedInstr,           "CFGStructurizer cloned instructions");
43*81ad6265SDimitry Andric 
44*81ad6265SDimitry Andric namespace llvm {
45*81ad6265SDimitry Andric 
46*81ad6265SDimitry Andric void initializeR600MachineCFGStructurizerPass(PassRegistry &);
47*81ad6265SDimitry Andric 
48*81ad6265SDimitry Andric } // end namespace llvm
49*81ad6265SDimitry Andric 
50*81ad6265SDimitry Andric namespace {
51*81ad6265SDimitry Andric 
52*81ad6265SDimitry Andric //===----------------------------------------------------------------------===//
53*81ad6265SDimitry Andric //
54*81ad6265SDimitry Andric // Miscellaneous utility for CFGStructurizer.
55*81ad6265SDimitry Andric //
56*81ad6265SDimitry Andric //===----------------------------------------------------------------------===//
57*81ad6265SDimitry Andric 
58*81ad6265SDimitry Andric #define SHOWNEWINSTR(i) LLVM_DEBUG(dbgs() << "New instr: " << *i << "\n");
59*81ad6265SDimitry Andric 
60*81ad6265SDimitry Andric #define SHOWNEWBLK(b, msg)                                                     \
61*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << msg << "BB" << b->getNumber() << "size " << b->size();  \
62*81ad6265SDimitry Andric              dbgs() << "\n";);
63*81ad6265SDimitry Andric 
64*81ad6265SDimitry Andric #define SHOWBLK_DETAIL(b, msg)                                                 \
65*81ad6265SDimitry Andric   LLVM_DEBUG(if (b) {                                                          \
66*81ad6265SDimitry Andric     dbgs() << msg << "BB" << b->getNumber() << "size " << b->size();           \
67*81ad6265SDimitry Andric     b->print(dbgs());                                                          \
68*81ad6265SDimitry Andric     dbgs() << "\n";                                                            \
69*81ad6265SDimitry Andric   });
70*81ad6265SDimitry Andric 
71*81ad6265SDimitry Andric #define INVALIDSCCNUM -1
72*81ad6265SDimitry Andric 
73*81ad6265SDimitry Andric //===----------------------------------------------------------------------===//
74*81ad6265SDimitry Andric //
75*81ad6265SDimitry Andric // supporting data structure for CFGStructurizer
76*81ad6265SDimitry Andric //
77*81ad6265SDimitry Andric //===----------------------------------------------------------------------===//
78*81ad6265SDimitry Andric 
79*81ad6265SDimitry Andric class BlockInformation {
80*81ad6265SDimitry Andric public:
81*81ad6265SDimitry Andric   bool IsRetired = false;
82*81ad6265SDimitry Andric   int SccNum = INVALIDSCCNUM;
83*81ad6265SDimitry Andric 
84*81ad6265SDimitry Andric   BlockInformation() = default;
85*81ad6265SDimitry Andric };
86*81ad6265SDimitry Andric 
87*81ad6265SDimitry Andric //===----------------------------------------------------------------------===//
88*81ad6265SDimitry Andric //
89*81ad6265SDimitry Andric // CFGStructurizer
90*81ad6265SDimitry Andric //
91*81ad6265SDimitry Andric //===----------------------------------------------------------------------===//
92*81ad6265SDimitry Andric 
93*81ad6265SDimitry Andric class R600MachineCFGStructurizer : public MachineFunctionPass {
94*81ad6265SDimitry Andric public:
95*81ad6265SDimitry Andric   using MBBVector = SmallVector<MachineBasicBlock *, 32>;
96*81ad6265SDimitry Andric   using MBBInfoMap = std::map<MachineBasicBlock *, BlockInformation *>;
97*81ad6265SDimitry Andric   using LoopLandInfoMap = std::map<MachineLoop *, MachineBasicBlock *>;
98*81ad6265SDimitry Andric 
99*81ad6265SDimitry Andric   enum PathToKind {
100*81ad6265SDimitry Andric     Not_SinglePath = 0,
101*81ad6265SDimitry Andric     SinglePath_InPath = 1,
102*81ad6265SDimitry Andric     SinglePath_NotInPath = 2
103*81ad6265SDimitry Andric   };
104*81ad6265SDimitry Andric 
105*81ad6265SDimitry Andric   static char ID;
106*81ad6265SDimitry Andric 
107*81ad6265SDimitry Andric   R600MachineCFGStructurizer() : MachineFunctionPass(ID) {
108*81ad6265SDimitry Andric     initializeR600MachineCFGStructurizerPass(*PassRegistry::getPassRegistry());
109*81ad6265SDimitry Andric   }
110*81ad6265SDimitry Andric 
111*81ad6265SDimitry Andric   StringRef getPassName() const override {
112*81ad6265SDimitry Andric     return "AMDGPU Control Flow Graph structurizer Pass";
113*81ad6265SDimitry Andric   }
114*81ad6265SDimitry Andric 
115*81ad6265SDimitry Andric   void getAnalysisUsage(AnalysisUsage &AU) const override {
116*81ad6265SDimitry Andric     AU.addRequired<MachineDominatorTree>();
117*81ad6265SDimitry Andric     AU.addRequired<MachinePostDominatorTree>();
118*81ad6265SDimitry Andric     AU.addRequired<MachineLoopInfo>();
119*81ad6265SDimitry Andric     MachineFunctionPass::getAnalysisUsage(AU);
120*81ad6265SDimitry Andric   }
121*81ad6265SDimitry Andric 
122*81ad6265SDimitry Andric   /// Perform the CFG structurization
123*81ad6265SDimitry Andric   bool run();
124*81ad6265SDimitry Andric 
125*81ad6265SDimitry Andric   /// Perform the CFG preparation
126*81ad6265SDimitry Andric   /// This step will remove every unconditionnal/dead jump instructions and make
127*81ad6265SDimitry Andric   /// sure all loops have an exit block
128*81ad6265SDimitry Andric   bool prepare();
129*81ad6265SDimitry Andric 
130*81ad6265SDimitry Andric   bool runOnMachineFunction(MachineFunction &MF) override {
131*81ad6265SDimitry Andric     // FIXME: This pass causes verification failures.
132*81ad6265SDimitry Andric     MF.getProperties().set(
133*81ad6265SDimitry Andric         MachineFunctionProperties::Property::FailsVerification);
134*81ad6265SDimitry Andric 
135*81ad6265SDimitry Andric     TII = MF.getSubtarget<R600Subtarget>().getInstrInfo();
136*81ad6265SDimitry Andric     TRI = &TII->getRegisterInfo();
137*81ad6265SDimitry Andric     LLVM_DEBUG(MF.dump(););
138*81ad6265SDimitry Andric     OrderedBlks.clear();
139*81ad6265SDimitry Andric     Visited.clear();
140*81ad6265SDimitry Andric     FuncRep = &MF;
141*81ad6265SDimitry Andric     MLI = &getAnalysis<MachineLoopInfo>();
142*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << "LoopInfo:\n"; PrintLoopinfo(*MLI););
143*81ad6265SDimitry Andric     MDT = &getAnalysis<MachineDominatorTree>();
144*81ad6265SDimitry Andric     LLVM_DEBUG(MDT->print(dbgs(), (const Module *)nullptr););
145*81ad6265SDimitry Andric     PDT = &getAnalysis<MachinePostDominatorTree>();
146*81ad6265SDimitry Andric     LLVM_DEBUG(PDT->print(dbgs()););
147*81ad6265SDimitry Andric     prepare();
148*81ad6265SDimitry Andric     run();
149*81ad6265SDimitry Andric     LLVM_DEBUG(MF.dump(););
150*81ad6265SDimitry Andric     return true;
151*81ad6265SDimitry Andric   }
152*81ad6265SDimitry Andric 
153*81ad6265SDimitry Andric protected:
154*81ad6265SDimitry Andric   MachineDominatorTree *MDT;
155*81ad6265SDimitry Andric   MachinePostDominatorTree *PDT;
156*81ad6265SDimitry Andric   MachineLoopInfo *MLI;
157*81ad6265SDimitry Andric   const R600InstrInfo *TII = nullptr;
158*81ad6265SDimitry Andric   const R600RegisterInfo *TRI = nullptr;
159*81ad6265SDimitry Andric 
160*81ad6265SDimitry Andric   // PRINT FUNCTIONS
161*81ad6265SDimitry Andric   /// Print the ordered Blocks.
162*81ad6265SDimitry Andric   void printOrderedBlocks() const {
163*81ad6265SDimitry Andric     size_t i = 0;
164*81ad6265SDimitry Andric     for (MBBVector::const_iterator iterBlk = OrderedBlks.begin(),
165*81ad6265SDimitry Andric         iterBlkEnd = OrderedBlks.end(); iterBlk != iterBlkEnd; ++iterBlk, ++i) {
166*81ad6265SDimitry Andric       dbgs() << "BB" << (*iterBlk)->getNumber();
167*81ad6265SDimitry Andric       dbgs() << "(" << getSCCNum(*iterBlk) << "," << (*iterBlk)->size() << ")";
168*81ad6265SDimitry Andric       if (i != 0 && i % 10 == 0) {
169*81ad6265SDimitry Andric         dbgs() << "\n";
170*81ad6265SDimitry Andric       } else {
171*81ad6265SDimitry Andric         dbgs() << " ";
172*81ad6265SDimitry Andric       }
173*81ad6265SDimitry Andric     }
174*81ad6265SDimitry Andric   }
175*81ad6265SDimitry Andric 
176*81ad6265SDimitry Andric   static void PrintLoopinfo(const MachineLoopInfo &LoopInfo) {
177*81ad6265SDimitry Andric     for (const MachineLoop *L : LoopInfo)
178*81ad6265SDimitry Andric       L->print(dbgs());
179*81ad6265SDimitry Andric   }
180*81ad6265SDimitry Andric 
181*81ad6265SDimitry Andric   // UTILITY FUNCTIONS
182*81ad6265SDimitry Andric   int getSCCNum(MachineBasicBlock *MBB) const;
183*81ad6265SDimitry Andric   MachineBasicBlock *getLoopLandInfo(MachineLoop *LoopRep) const;
184*81ad6265SDimitry Andric   bool hasBackEdge(MachineBasicBlock *MBB) const;
185*81ad6265SDimitry Andric   bool isRetiredBlock(MachineBasicBlock *MBB) const;
186*81ad6265SDimitry Andric   bool isActiveLoophead(MachineBasicBlock *MBB) const;
187*81ad6265SDimitry Andric   PathToKind singlePathTo(MachineBasicBlock *SrcMBB, MachineBasicBlock *DstMBB,
188*81ad6265SDimitry Andric       bool AllowSideEntry = true) const;
189*81ad6265SDimitry Andric   int countActiveBlock(MBBVector::const_iterator It,
190*81ad6265SDimitry Andric       MBBVector::const_iterator E) const;
191*81ad6265SDimitry Andric   bool needMigrateBlock(MachineBasicBlock *MBB) const;
192*81ad6265SDimitry Andric 
193*81ad6265SDimitry Andric   // Utility Functions
194*81ad6265SDimitry Andric   void reversePredicateSetter(MachineBasicBlock::iterator I,
195*81ad6265SDimitry Andric                               MachineBasicBlock &MBB);
196*81ad6265SDimitry Andric   /// Compute the reversed DFS post order of Blocks
197*81ad6265SDimitry Andric   void orderBlocks(MachineFunction *MF);
198*81ad6265SDimitry Andric 
199*81ad6265SDimitry Andric   // Function originally from CFGStructTraits
200*81ad6265SDimitry Andric   void insertInstrEnd(MachineBasicBlock *MBB, int NewOpcode,
201*81ad6265SDimitry Andric                       const DebugLoc &DL = DebugLoc());
202*81ad6265SDimitry Andric   MachineInstr *insertInstrBefore(MachineBasicBlock *MBB, int NewOpcode,
203*81ad6265SDimitry Andric                                   const DebugLoc &DL = DebugLoc());
204*81ad6265SDimitry Andric   MachineInstr *insertInstrBefore(MachineBasicBlock::iterator I, int NewOpcode);
205*81ad6265SDimitry Andric   void insertCondBranchBefore(MachineBasicBlock::iterator I, int NewOpcode,
206*81ad6265SDimitry Andric                               const DebugLoc &DL);
207*81ad6265SDimitry Andric   void insertCondBranchBefore(MachineBasicBlock *MBB,
208*81ad6265SDimitry Andric                               MachineBasicBlock::iterator I, int NewOpcode,
209*81ad6265SDimitry Andric                               int RegNum, const DebugLoc &DL);
210*81ad6265SDimitry Andric 
211*81ad6265SDimitry Andric   static int getBranchNzeroOpcode(int OldOpcode);
212*81ad6265SDimitry Andric   static int getBranchZeroOpcode(int OldOpcode);
213*81ad6265SDimitry Andric   static int getContinueNzeroOpcode(int OldOpcode);
214*81ad6265SDimitry Andric   static int getContinueZeroOpcode(int OldOpcode);
215*81ad6265SDimitry Andric   static MachineBasicBlock *getTrueBranch(MachineInstr *MI);
216*81ad6265SDimitry Andric   static void setTrueBranch(MachineInstr *MI, MachineBasicBlock *MBB);
217*81ad6265SDimitry Andric   static MachineBasicBlock *getFalseBranch(MachineBasicBlock *MBB,
218*81ad6265SDimitry Andric       MachineInstr *MI);
219*81ad6265SDimitry Andric   static bool isCondBranch(MachineInstr *MI);
220*81ad6265SDimitry Andric   static bool isUncondBranch(MachineInstr *MI);
221*81ad6265SDimitry Andric   static DebugLoc getLastDebugLocInBB(MachineBasicBlock *MBB);
222*81ad6265SDimitry Andric   static MachineInstr *getNormalBlockBranchInstr(MachineBasicBlock *MBB);
223*81ad6265SDimitry Andric 
224*81ad6265SDimitry Andric   /// The correct naming for this is getPossibleLoopendBlockBranchInstr.
225*81ad6265SDimitry Andric   ///
226*81ad6265SDimitry Andric   /// BB with backward-edge could have move instructions after the branch
227*81ad6265SDimitry Andric   /// instruction.  Such move instruction "belong to" the loop backward-edge.
228*81ad6265SDimitry Andric   MachineInstr *getLoopendBlockBranchInstr(MachineBasicBlock *MBB);
229*81ad6265SDimitry Andric 
230*81ad6265SDimitry Andric   static MachineInstr *getReturnInstr(MachineBasicBlock *MBB);
231*81ad6265SDimitry Andric   static bool isReturnBlock(MachineBasicBlock *MBB);
232*81ad6265SDimitry Andric   static void cloneSuccessorList(MachineBasicBlock *DstMBB,
233*81ad6265SDimitry Andric       MachineBasicBlock *SrcMBB);
234*81ad6265SDimitry Andric   static MachineBasicBlock *clone(MachineBasicBlock *MBB);
235*81ad6265SDimitry Andric 
236*81ad6265SDimitry Andric   /// MachineBasicBlock::ReplaceUsesOfBlockWith doesn't serve the purpose
237*81ad6265SDimitry Andric   /// because the AMDGPU instruction is not recognized as terminator fix this
238*81ad6265SDimitry Andric   /// and retire this routine
239*81ad6265SDimitry Andric   void replaceInstrUseOfBlockWith(MachineBasicBlock *SrcMBB,
240*81ad6265SDimitry Andric       MachineBasicBlock *OldMBB, MachineBasicBlock *NewBlk);
241*81ad6265SDimitry Andric 
242*81ad6265SDimitry Andric   static void wrapup(MachineBasicBlock *MBB);
243*81ad6265SDimitry Andric 
244*81ad6265SDimitry Andric   int patternMatch(MachineBasicBlock *MBB);
245*81ad6265SDimitry Andric   int patternMatchGroup(MachineBasicBlock *MBB);
246*81ad6265SDimitry Andric   int serialPatternMatch(MachineBasicBlock *MBB);
247*81ad6265SDimitry Andric   int ifPatternMatch(MachineBasicBlock *MBB);
248*81ad6265SDimitry Andric   int loopendPatternMatch();
249*81ad6265SDimitry Andric   int mergeLoop(MachineLoop *LoopRep);
250*81ad6265SDimitry Andric 
251*81ad6265SDimitry Andric   /// return true iff src1Blk->succ_empty() && src1Blk and src2Blk are in
252*81ad6265SDimitry Andric   /// the same loop with LoopLandInfo without explicitly keeping track of
253*81ad6265SDimitry Andric   /// loopContBlks and loopBreakBlks, this is a method to get the information.
254*81ad6265SDimitry Andric   bool isSameloopDetachedContbreak(MachineBasicBlock *Src1MBB,
255*81ad6265SDimitry Andric       MachineBasicBlock *Src2MBB);
256*81ad6265SDimitry Andric   int handleJumpintoIf(MachineBasicBlock *HeadMBB,
257*81ad6265SDimitry Andric       MachineBasicBlock *TrueMBB, MachineBasicBlock *FalseMBB);
258*81ad6265SDimitry Andric   int handleJumpintoIfImp(MachineBasicBlock *HeadMBB,
259*81ad6265SDimitry Andric       MachineBasicBlock *TrueMBB, MachineBasicBlock *FalseMBB);
260*81ad6265SDimitry Andric   int improveSimpleJumpintoIf(MachineBasicBlock *HeadMBB,
261*81ad6265SDimitry Andric       MachineBasicBlock *TrueMBB, MachineBasicBlock *FalseMBB,
262*81ad6265SDimitry Andric       MachineBasicBlock **LandMBBPtr);
263*81ad6265SDimitry Andric   void showImproveSimpleJumpintoIf(MachineBasicBlock *HeadMBB,
264*81ad6265SDimitry Andric       MachineBasicBlock *TrueMBB, MachineBasicBlock *FalseMBB,
265*81ad6265SDimitry Andric       MachineBasicBlock *LandMBB, bool Detail = false);
266*81ad6265SDimitry Andric   int cloneOnSideEntryTo(MachineBasicBlock *PreMBB,
267*81ad6265SDimitry Andric       MachineBasicBlock *SrcMBB, MachineBasicBlock *DstMBB);
268*81ad6265SDimitry Andric   void mergeSerialBlock(MachineBasicBlock *DstMBB,
269*81ad6265SDimitry Andric       MachineBasicBlock *SrcMBB);
270*81ad6265SDimitry Andric 
271*81ad6265SDimitry Andric   void mergeIfthenelseBlock(MachineInstr *BranchMI,
272*81ad6265SDimitry Andric       MachineBasicBlock *MBB, MachineBasicBlock *TrueMBB,
273*81ad6265SDimitry Andric       MachineBasicBlock *FalseMBB, MachineBasicBlock *LandMBB);
274*81ad6265SDimitry Andric   void mergeLooplandBlock(MachineBasicBlock *DstMBB,
275*81ad6265SDimitry Andric       MachineBasicBlock *LandMBB);
276*81ad6265SDimitry Andric   void mergeLoopbreakBlock(MachineBasicBlock *ExitingMBB,
277*81ad6265SDimitry Andric       MachineBasicBlock *LandMBB);
278*81ad6265SDimitry Andric   void settleLoopcontBlock(MachineBasicBlock *ContingMBB,
279*81ad6265SDimitry Andric       MachineBasicBlock *ContMBB);
280*81ad6265SDimitry Andric 
281*81ad6265SDimitry Andric   /// normalizeInfiniteLoopExit change
282*81ad6265SDimitry Andric   ///   B1:
283*81ad6265SDimitry Andric   ///        uncond_br LoopHeader
284*81ad6265SDimitry Andric   ///
285*81ad6265SDimitry Andric   /// to
286*81ad6265SDimitry Andric   ///   B1:
287*81ad6265SDimitry Andric   ///        cond_br 1 LoopHeader dummyExit
288*81ad6265SDimitry Andric   /// and return the newly added dummy exit block
289*81ad6265SDimitry Andric   MachineBasicBlock *normalizeInfiniteLoopExit(MachineLoop *LoopRep);
290*81ad6265SDimitry Andric   void removeUnconditionalBranch(MachineBasicBlock *MBB);
291*81ad6265SDimitry Andric 
292*81ad6265SDimitry Andric   /// Remove duplicate branches instructions in a block.
293*81ad6265SDimitry Andric   /// For instance
294*81ad6265SDimitry Andric   /// B0:
295*81ad6265SDimitry Andric   ///    cond_br X B1 B2
296*81ad6265SDimitry Andric   ///    cond_br X B1 B2
297*81ad6265SDimitry Andric   /// is transformed to
298*81ad6265SDimitry Andric   /// B0:
299*81ad6265SDimitry Andric   ///    cond_br X B1 B2
300*81ad6265SDimitry Andric   void removeRedundantConditionalBranch(MachineBasicBlock *MBB);
301*81ad6265SDimitry Andric 
302*81ad6265SDimitry Andric   void addDummyExitBlock(SmallVectorImpl<MachineBasicBlock *> &RetMBB);
303*81ad6265SDimitry Andric   void removeSuccessor(MachineBasicBlock *MBB);
304*81ad6265SDimitry Andric   MachineBasicBlock *cloneBlockForPredecessor(MachineBasicBlock *MBB,
305*81ad6265SDimitry Andric       MachineBasicBlock *PredMBB);
306*81ad6265SDimitry Andric   void migrateInstruction(MachineBasicBlock *SrcMBB,
307*81ad6265SDimitry Andric       MachineBasicBlock *DstMBB, MachineBasicBlock::iterator I);
308*81ad6265SDimitry Andric   void recordSccnum(MachineBasicBlock *MBB, int SCCNum);
309*81ad6265SDimitry Andric   void retireBlock(MachineBasicBlock *MBB);
310*81ad6265SDimitry Andric 
311*81ad6265SDimitry Andric private:
312*81ad6265SDimitry Andric   MBBInfoMap BlockInfoMap;
313*81ad6265SDimitry Andric   LoopLandInfoMap LLInfoMap;
314*81ad6265SDimitry Andric   std::map<MachineLoop *, bool> Visited;
315*81ad6265SDimitry Andric   MachineFunction *FuncRep;
316*81ad6265SDimitry Andric   SmallVector<MachineBasicBlock *, DEFAULT_VEC_SLOTS> OrderedBlks;
317*81ad6265SDimitry Andric };
318*81ad6265SDimitry Andric 
319*81ad6265SDimitry Andric } // end anonymous namespace
320*81ad6265SDimitry Andric 
321*81ad6265SDimitry Andric char R600MachineCFGStructurizer::ID = 0;
322*81ad6265SDimitry Andric 
323*81ad6265SDimitry Andric int R600MachineCFGStructurizer::getSCCNum(MachineBasicBlock *MBB) const {
324*81ad6265SDimitry Andric   MBBInfoMap::const_iterator It = BlockInfoMap.find(MBB);
325*81ad6265SDimitry Andric   if (It == BlockInfoMap.end())
326*81ad6265SDimitry Andric     return INVALIDSCCNUM;
327*81ad6265SDimitry Andric   return (*It).second->SccNum;
328*81ad6265SDimitry Andric }
329*81ad6265SDimitry Andric 
330*81ad6265SDimitry Andric MachineBasicBlock *R600MachineCFGStructurizer::getLoopLandInfo(MachineLoop *LoopRep)
331*81ad6265SDimitry Andric     const {
332*81ad6265SDimitry Andric   LoopLandInfoMap::const_iterator It = LLInfoMap.find(LoopRep);
333*81ad6265SDimitry Andric   if (It == LLInfoMap.end())
334*81ad6265SDimitry Andric     return nullptr;
335*81ad6265SDimitry Andric   return (*It).second;
336*81ad6265SDimitry Andric }
337*81ad6265SDimitry Andric 
338*81ad6265SDimitry Andric bool R600MachineCFGStructurizer::hasBackEdge(MachineBasicBlock *MBB) const {
339*81ad6265SDimitry Andric   MachineLoop *LoopRep = MLI->getLoopFor(MBB);
340*81ad6265SDimitry Andric   if (!LoopRep)
341*81ad6265SDimitry Andric     return false;
342*81ad6265SDimitry Andric   MachineBasicBlock *LoopHeader = LoopRep->getHeader();
343*81ad6265SDimitry Andric   return MBB->isSuccessor(LoopHeader);
344*81ad6265SDimitry Andric }
345*81ad6265SDimitry Andric 
346*81ad6265SDimitry Andric bool R600MachineCFGStructurizer::isRetiredBlock(MachineBasicBlock *MBB) const {
347*81ad6265SDimitry Andric   MBBInfoMap::const_iterator It = BlockInfoMap.find(MBB);
348*81ad6265SDimitry Andric   if (It == BlockInfoMap.end())
349*81ad6265SDimitry Andric     return false;
350*81ad6265SDimitry Andric   return (*It).second->IsRetired;
351*81ad6265SDimitry Andric }
352*81ad6265SDimitry Andric 
353*81ad6265SDimitry Andric bool R600MachineCFGStructurizer::isActiveLoophead(MachineBasicBlock *MBB) const {
354*81ad6265SDimitry Andric   MachineLoop *LoopRep = MLI->getLoopFor(MBB);
355*81ad6265SDimitry Andric   while (LoopRep && LoopRep->getHeader() == MBB) {
356*81ad6265SDimitry Andric     MachineBasicBlock *LoopLand = getLoopLandInfo(LoopRep);
357*81ad6265SDimitry Andric     if(!LoopLand)
358*81ad6265SDimitry Andric       return true;
359*81ad6265SDimitry Andric     if (!isRetiredBlock(LoopLand))
360*81ad6265SDimitry Andric       return true;
361*81ad6265SDimitry Andric     LoopRep = LoopRep->getParentLoop();
362*81ad6265SDimitry Andric   }
363*81ad6265SDimitry Andric   return false;
364*81ad6265SDimitry Andric }
365*81ad6265SDimitry Andric 
366*81ad6265SDimitry Andric R600MachineCFGStructurizer::PathToKind R600MachineCFGStructurizer::singlePathTo(
367*81ad6265SDimitry Andric     MachineBasicBlock *SrcMBB, MachineBasicBlock *DstMBB,
368*81ad6265SDimitry Andric     bool AllowSideEntry) const {
369*81ad6265SDimitry Andric   assert(DstMBB);
370*81ad6265SDimitry Andric   if (SrcMBB == DstMBB)
371*81ad6265SDimitry Andric     return SinglePath_InPath;
372*81ad6265SDimitry Andric   while (SrcMBB && SrcMBB->succ_size() == 1) {
373*81ad6265SDimitry Andric     SrcMBB = *SrcMBB->succ_begin();
374*81ad6265SDimitry Andric     if (SrcMBB == DstMBB)
375*81ad6265SDimitry Andric       return SinglePath_InPath;
376*81ad6265SDimitry Andric     if (!AllowSideEntry && SrcMBB->pred_size() > 1)
377*81ad6265SDimitry Andric       return Not_SinglePath;
378*81ad6265SDimitry Andric   }
379*81ad6265SDimitry Andric   if (SrcMBB && SrcMBB->succ_size()==0)
380*81ad6265SDimitry Andric     return SinglePath_NotInPath;
381*81ad6265SDimitry Andric   return Not_SinglePath;
382*81ad6265SDimitry Andric }
383*81ad6265SDimitry Andric 
384*81ad6265SDimitry Andric int R600MachineCFGStructurizer::countActiveBlock(MBBVector::const_iterator It,
385*81ad6265SDimitry Andric     MBBVector::const_iterator E) const {
386*81ad6265SDimitry Andric   int Count = 0;
387*81ad6265SDimitry Andric   while (It != E) {
388*81ad6265SDimitry Andric     if (!isRetiredBlock(*It))
389*81ad6265SDimitry Andric       ++Count;
390*81ad6265SDimitry Andric     ++It;
391*81ad6265SDimitry Andric   }
392*81ad6265SDimitry Andric   return Count;
393*81ad6265SDimitry Andric }
394*81ad6265SDimitry Andric 
395*81ad6265SDimitry Andric bool R600MachineCFGStructurizer::needMigrateBlock(MachineBasicBlock *MBB) const {
396*81ad6265SDimitry Andric   unsigned BlockSizeThreshold = 30;
397*81ad6265SDimitry Andric   unsigned CloneInstrThreshold = 100;
398*81ad6265SDimitry Andric   bool MultiplePreds = MBB && (MBB->pred_size() > 1);
399*81ad6265SDimitry Andric 
400*81ad6265SDimitry Andric   if(!MultiplePreds)
401*81ad6265SDimitry Andric     return false;
402*81ad6265SDimitry Andric   unsigned BlkSize = MBB->size();
403*81ad6265SDimitry Andric   return ((BlkSize > BlockSizeThreshold) &&
404*81ad6265SDimitry Andric       (BlkSize * (MBB->pred_size() - 1) > CloneInstrThreshold));
405*81ad6265SDimitry Andric }
406*81ad6265SDimitry Andric 
407*81ad6265SDimitry Andric void R600MachineCFGStructurizer::reversePredicateSetter(
408*81ad6265SDimitry Andric     MachineBasicBlock::iterator I, MachineBasicBlock &MBB) {
409*81ad6265SDimitry Andric   assert(I.isValid() && "Expected valid iterator");
410*81ad6265SDimitry Andric   for (;; --I) {
411*81ad6265SDimitry Andric     if (I == MBB.end())
412*81ad6265SDimitry Andric       continue;
413*81ad6265SDimitry Andric     if (I->getOpcode() == R600::PRED_X) {
414*81ad6265SDimitry Andric       switch (I->getOperand(2).getImm()) {
415*81ad6265SDimitry Andric       case R600::PRED_SETE_INT:
416*81ad6265SDimitry Andric         I->getOperand(2).setImm(R600::PRED_SETNE_INT);
417*81ad6265SDimitry Andric         return;
418*81ad6265SDimitry Andric       case R600::PRED_SETNE_INT:
419*81ad6265SDimitry Andric         I->getOperand(2).setImm(R600::PRED_SETE_INT);
420*81ad6265SDimitry Andric         return;
421*81ad6265SDimitry Andric       case R600::PRED_SETE:
422*81ad6265SDimitry Andric         I->getOperand(2).setImm(R600::PRED_SETNE);
423*81ad6265SDimitry Andric         return;
424*81ad6265SDimitry Andric       case R600::PRED_SETNE:
425*81ad6265SDimitry Andric         I->getOperand(2).setImm(R600::PRED_SETE);
426*81ad6265SDimitry Andric         return;
427*81ad6265SDimitry Andric       default:
428*81ad6265SDimitry Andric         llvm_unreachable("PRED_X Opcode invalid!");
429*81ad6265SDimitry Andric       }
430*81ad6265SDimitry Andric     }
431*81ad6265SDimitry Andric   }
432*81ad6265SDimitry Andric }
433*81ad6265SDimitry Andric 
434*81ad6265SDimitry Andric void R600MachineCFGStructurizer::insertInstrEnd(MachineBasicBlock *MBB,
435*81ad6265SDimitry Andric                                            int NewOpcode, const DebugLoc &DL) {
436*81ad6265SDimitry Andric   MachineInstr *MI =
437*81ad6265SDimitry Andric       MBB->getParent()->CreateMachineInstr(TII->get(NewOpcode), DL);
438*81ad6265SDimitry Andric   MBB->push_back(MI);
439*81ad6265SDimitry Andric   //assume the instruction doesn't take any reg operand ...
440*81ad6265SDimitry Andric   SHOWNEWINSTR(MI);
441*81ad6265SDimitry Andric }
442*81ad6265SDimitry Andric 
443*81ad6265SDimitry Andric MachineInstr *R600MachineCFGStructurizer::insertInstrBefore(MachineBasicBlock *MBB,
444*81ad6265SDimitry Andric                                                        int NewOpcode,
445*81ad6265SDimitry Andric                                                        const DebugLoc &DL) {
446*81ad6265SDimitry Andric   MachineInstr *MI =
447*81ad6265SDimitry Andric       MBB->getParent()->CreateMachineInstr(TII->get(NewOpcode), DL);
448*81ad6265SDimitry Andric   if (!MBB->empty())
449*81ad6265SDimitry Andric     MBB->insert(MBB->begin(), MI);
450*81ad6265SDimitry Andric   else
451*81ad6265SDimitry Andric     MBB->push_back(MI);
452*81ad6265SDimitry Andric   SHOWNEWINSTR(MI);
453*81ad6265SDimitry Andric   return MI;
454*81ad6265SDimitry Andric }
455*81ad6265SDimitry Andric 
456*81ad6265SDimitry Andric MachineInstr *R600MachineCFGStructurizer::insertInstrBefore(
457*81ad6265SDimitry Andric     MachineBasicBlock::iterator I, int NewOpcode) {
458*81ad6265SDimitry Andric   MachineInstr *OldMI = &(*I);
459*81ad6265SDimitry Andric   MachineBasicBlock *MBB = OldMI->getParent();
460*81ad6265SDimitry Andric   MachineInstr *NewMBB =
461*81ad6265SDimitry Andric       MBB->getParent()->CreateMachineInstr(TII->get(NewOpcode), DebugLoc());
462*81ad6265SDimitry Andric   MBB->insert(I, NewMBB);
463*81ad6265SDimitry Andric   //assume the instruction doesn't take any reg operand ...
464*81ad6265SDimitry Andric   SHOWNEWINSTR(NewMBB);
465*81ad6265SDimitry Andric   return NewMBB;
466*81ad6265SDimitry Andric }
467*81ad6265SDimitry Andric 
468*81ad6265SDimitry Andric void R600MachineCFGStructurizer::insertCondBranchBefore(
469*81ad6265SDimitry Andric     MachineBasicBlock::iterator I, int NewOpcode, const DebugLoc &DL) {
470*81ad6265SDimitry Andric   MachineInstr *OldMI = &(*I);
471*81ad6265SDimitry Andric   MachineBasicBlock *MBB = OldMI->getParent();
472*81ad6265SDimitry Andric   MachineFunction *MF = MBB->getParent();
473*81ad6265SDimitry Andric   MachineInstr *NewMI = MF->CreateMachineInstr(TII->get(NewOpcode), DL);
474*81ad6265SDimitry Andric   MBB->insert(I, NewMI);
475*81ad6265SDimitry Andric   MachineInstrBuilder MIB(*MF, NewMI);
476*81ad6265SDimitry Andric   MIB.addReg(OldMI->getOperand(1).getReg(), false);
477*81ad6265SDimitry Andric   SHOWNEWINSTR(NewMI);
478*81ad6265SDimitry Andric   //erase later oldInstr->eraseFromParent();
479*81ad6265SDimitry Andric }
480*81ad6265SDimitry Andric 
481*81ad6265SDimitry Andric void R600MachineCFGStructurizer::insertCondBranchBefore(
482*81ad6265SDimitry Andric     MachineBasicBlock *blk, MachineBasicBlock::iterator I, int NewOpcode,
483*81ad6265SDimitry Andric     int RegNum, const DebugLoc &DL) {
484*81ad6265SDimitry Andric   MachineFunction *MF = blk->getParent();
485*81ad6265SDimitry Andric   MachineInstr *NewInstr = MF->CreateMachineInstr(TII->get(NewOpcode), DL);
486*81ad6265SDimitry Andric   //insert before
487*81ad6265SDimitry Andric   blk->insert(I, NewInstr);
488*81ad6265SDimitry Andric   MachineInstrBuilder(*MF, NewInstr).addReg(RegNum, false);
489*81ad6265SDimitry Andric   SHOWNEWINSTR(NewInstr);
490*81ad6265SDimitry Andric }
491*81ad6265SDimitry Andric 
492*81ad6265SDimitry Andric int R600MachineCFGStructurizer::getBranchNzeroOpcode(int OldOpcode) {
493*81ad6265SDimitry Andric   switch(OldOpcode) {
494*81ad6265SDimitry Andric   case R600::JUMP_COND:
495*81ad6265SDimitry Andric   case R600::JUMP: return R600::IF_PREDICATE_SET;
496*81ad6265SDimitry Andric   case R600::BRANCH_COND_i32:
497*81ad6265SDimitry Andric   case R600::BRANCH_COND_f32: return R600::IF_LOGICALNZ_f32;
498*81ad6265SDimitry Andric   default: llvm_unreachable("internal error");
499*81ad6265SDimitry Andric   }
500*81ad6265SDimitry Andric   return -1;
501*81ad6265SDimitry Andric }
502*81ad6265SDimitry Andric 
503*81ad6265SDimitry Andric int R600MachineCFGStructurizer::getBranchZeroOpcode(int OldOpcode) {
504*81ad6265SDimitry Andric   switch(OldOpcode) {
505*81ad6265SDimitry Andric   case R600::JUMP_COND:
506*81ad6265SDimitry Andric   case R600::JUMP: return R600::IF_PREDICATE_SET;
507*81ad6265SDimitry Andric   case R600::BRANCH_COND_i32:
508*81ad6265SDimitry Andric   case R600::BRANCH_COND_f32: return R600::IF_LOGICALZ_f32;
509*81ad6265SDimitry Andric   default: llvm_unreachable("internal error");
510*81ad6265SDimitry Andric   }
511*81ad6265SDimitry Andric   return -1;
512*81ad6265SDimitry Andric }
513*81ad6265SDimitry Andric 
514*81ad6265SDimitry Andric int R600MachineCFGStructurizer::getContinueNzeroOpcode(int OldOpcode) {
515*81ad6265SDimitry Andric   switch(OldOpcode) {
516*81ad6265SDimitry Andric   case R600::JUMP_COND:
517*81ad6265SDimitry Andric   case R600::JUMP: return R600::CONTINUE_LOGICALNZ_i32;
518*81ad6265SDimitry Andric   default: llvm_unreachable("internal error");
519*81ad6265SDimitry Andric   }
520*81ad6265SDimitry Andric   return -1;
521*81ad6265SDimitry Andric }
522*81ad6265SDimitry Andric 
523*81ad6265SDimitry Andric int R600MachineCFGStructurizer::getContinueZeroOpcode(int OldOpcode) {
524*81ad6265SDimitry Andric   switch(OldOpcode) {
525*81ad6265SDimitry Andric   case R600::JUMP_COND:
526*81ad6265SDimitry Andric   case R600::JUMP: return R600::CONTINUE_LOGICALZ_i32;
527*81ad6265SDimitry Andric   default: llvm_unreachable("internal error");
528*81ad6265SDimitry Andric   }
529*81ad6265SDimitry Andric   return -1;
530*81ad6265SDimitry Andric }
531*81ad6265SDimitry Andric 
532*81ad6265SDimitry Andric MachineBasicBlock *R600MachineCFGStructurizer::getTrueBranch(MachineInstr *MI) {
533*81ad6265SDimitry Andric   return MI->getOperand(0).getMBB();
534*81ad6265SDimitry Andric }
535*81ad6265SDimitry Andric 
536*81ad6265SDimitry Andric void R600MachineCFGStructurizer::setTrueBranch(MachineInstr *MI,
537*81ad6265SDimitry Andric     MachineBasicBlock *MBB) {
538*81ad6265SDimitry Andric   MI->getOperand(0).setMBB(MBB);
539*81ad6265SDimitry Andric }
540*81ad6265SDimitry Andric 
541*81ad6265SDimitry Andric MachineBasicBlock *
542*81ad6265SDimitry Andric R600MachineCFGStructurizer::getFalseBranch(MachineBasicBlock *MBB,
543*81ad6265SDimitry Andric     MachineInstr *MI) {
544*81ad6265SDimitry Andric   assert(MBB->succ_size() == 2);
545*81ad6265SDimitry Andric   MachineBasicBlock *TrueBranch = getTrueBranch(MI);
546*81ad6265SDimitry Andric   MachineBasicBlock::succ_iterator It = MBB->succ_begin();
547*81ad6265SDimitry Andric   MachineBasicBlock::succ_iterator Next = It;
548*81ad6265SDimitry Andric   ++Next;
549*81ad6265SDimitry Andric   return (*It == TrueBranch) ? *Next : *It;
550*81ad6265SDimitry Andric }
551*81ad6265SDimitry Andric 
552*81ad6265SDimitry Andric bool R600MachineCFGStructurizer::isCondBranch(MachineInstr *MI) {
553*81ad6265SDimitry Andric   switch (MI->getOpcode()) {
554*81ad6265SDimitry Andric     case R600::JUMP_COND:
555*81ad6265SDimitry Andric     case R600::BRANCH_COND_i32:
556*81ad6265SDimitry Andric     case R600::BRANCH_COND_f32: return true;
557*81ad6265SDimitry Andric   default:
558*81ad6265SDimitry Andric     return false;
559*81ad6265SDimitry Andric   }
560*81ad6265SDimitry Andric   return false;
561*81ad6265SDimitry Andric }
562*81ad6265SDimitry Andric 
563*81ad6265SDimitry Andric bool R600MachineCFGStructurizer::isUncondBranch(MachineInstr *MI) {
564*81ad6265SDimitry Andric   switch (MI->getOpcode()) {
565*81ad6265SDimitry Andric   case R600::JUMP:
566*81ad6265SDimitry Andric   case R600::BRANCH:
567*81ad6265SDimitry Andric     return true;
568*81ad6265SDimitry Andric   default:
569*81ad6265SDimitry Andric     return false;
570*81ad6265SDimitry Andric   }
571*81ad6265SDimitry Andric   return false;
572*81ad6265SDimitry Andric }
573*81ad6265SDimitry Andric 
574*81ad6265SDimitry Andric DebugLoc R600MachineCFGStructurizer::getLastDebugLocInBB(MachineBasicBlock *MBB) {
575*81ad6265SDimitry Andric   //get DebugLoc from the first MachineBasicBlock instruction with debug info
576*81ad6265SDimitry Andric   DebugLoc DL;
577*81ad6265SDimitry Andric   for (MachineInstr &MI : *MBB)
578*81ad6265SDimitry Andric     if (MI.getDebugLoc())
579*81ad6265SDimitry Andric       DL = MI.getDebugLoc();
580*81ad6265SDimitry Andric   return DL;
581*81ad6265SDimitry Andric }
582*81ad6265SDimitry Andric 
583*81ad6265SDimitry Andric MachineInstr *R600MachineCFGStructurizer::getNormalBlockBranchInstr(
584*81ad6265SDimitry Andric     MachineBasicBlock *MBB) {
585*81ad6265SDimitry Andric   MachineBasicBlock::reverse_iterator It = MBB->rbegin();
586*81ad6265SDimitry Andric   MachineInstr *MI = &*It;
587*81ad6265SDimitry Andric   if (MI && (isCondBranch(MI) || isUncondBranch(MI)))
588*81ad6265SDimitry Andric     return MI;
589*81ad6265SDimitry Andric   return nullptr;
590*81ad6265SDimitry Andric }
591*81ad6265SDimitry Andric 
592*81ad6265SDimitry Andric MachineInstr *R600MachineCFGStructurizer::getLoopendBlockBranchInstr(
593*81ad6265SDimitry Andric     MachineBasicBlock *MBB) {
594*81ad6265SDimitry Andric   for (MachineBasicBlock::reverse_iterator It = MBB->rbegin(), E = MBB->rend();
595*81ad6265SDimitry Andric       It != E; ++It) {
596*81ad6265SDimitry Andric     // FIXME: Simplify
597*81ad6265SDimitry Andric     MachineInstr *MI = &*It;
598*81ad6265SDimitry Andric     if (MI) {
599*81ad6265SDimitry Andric       if (isCondBranch(MI) || isUncondBranch(MI))
600*81ad6265SDimitry Andric         return MI;
601*81ad6265SDimitry Andric       else if (!TII->isMov(MI->getOpcode()))
602*81ad6265SDimitry Andric         break;
603*81ad6265SDimitry Andric     }
604*81ad6265SDimitry Andric   }
605*81ad6265SDimitry Andric   return nullptr;
606*81ad6265SDimitry Andric }
607*81ad6265SDimitry Andric 
608*81ad6265SDimitry Andric MachineInstr *R600MachineCFGStructurizer::getReturnInstr(MachineBasicBlock *MBB) {
609*81ad6265SDimitry Andric   MachineBasicBlock::reverse_iterator It = MBB->rbegin();
610*81ad6265SDimitry Andric   if (It != MBB->rend()) {
611*81ad6265SDimitry Andric     MachineInstr *instr = &(*It);
612*81ad6265SDimitry Andric     if (instr->getOpcode() == R600::RETURN)
613*81ad6265SDimitry Andric       return instr;
614*81ad6265SDimitry Andric   }
615*81ad6265SDimitry Andric   return nullptr;
616*81ad6265SDimitry Andric }
617*81ad6265SDimitry Andric 
618*81ad6265SDimitry Andric bool R600MachineCFGStructurizer::isReturnBlock(MachineBasicBlock *MBB) {
619*81ad6265SDimitry Andric   MachineInstr *MI = getReturnInstr(MBB);
620*81ad6265SDimitry Andric   bool IsReturn = MBB->succ_empty();
621*81ad6265SDimitry Andric   if (MI)
622*81ad6265SDimitry Andric     assert(IsReturn);
623*81ad6265SDimitry Andric   else if (IsReturn)
624*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << "BB" << MBB->getNumber()
625*81ad6265SDimitry Andric                       << " is return block without RETURN instr\n";);
626*81ad6265SDimitry Andric   return  IsReturn;
627*81ad6265SDimitry Andric }
628*81ad6265SDimitry Andric 
629*81ad6265SDimitry Andric void R600MachineCFGStructurizer::cloneSuccessorList(MachineBasicBlock *DstMBB,
630*81ad6265SDimitry Andric     MachineBasicBlock *SrcMBB) {
631*81ad6265SDimitry Andric   for (MachineBasicBlock *Succ : SrcMBB->successors())
632*81ad6265SDimitry Andric     DstMBB->addSuccessor(Succ);  // *iter's predecessor is also taken care of
633*81ad6265SDimitry Andric }
634*81ad6265SDimitry Andric 
635*81ad6265SDimitry Andric MachineBasicBlock *R600MachineCFGStructurizer::clone(MachineBasicBlock *MBB) {
636*81ad6265SDimitry Andric   MachineFunction *Func = MBB->getParent();
637*81ad6265SDimitry Andric   MachineBasicBlock *NewMBB = Func->CreateMachineBasicBlock();
638*81ad6265SDimitry Andric   Func->push_back(NewMBB);  //insert to function
639*81ad6265SDimitry Andric   for (const MachineInstr &It : *MBB)
640*81ad6265SDimitry Andric     NewMBB->push_back(Func->CloneMachineInstr(&It));
641*81ad6265SDimitry Andric   return NewMBB;
642*81ad6265SDimitry Andric }
643*81ad6265SDimitry Andric 
644*81ad6265SDimitry Andric void R600MachineCFGStructurizer::replaceInstrUseOfBlockWith(
645*81ad6265SDimitry Andric     MachineBasicBlock *SrcMBB, MachineBasicBlock *OldMBB,
646*81ad6265SDimitry Andric     MachineBasicBlock *NewBlk) {
647*81ad6265SDimitry Andric   MachineInstr *BranchMI = getLoopendBlockBranchInstr(SrcMBB);
648*81ad6265SDimitry Andric   if (BranchMI && isCondBranch(BranchMI) &&
649*81ad6265SDimitry Andric       getTrueBranch(BranchMI) == OldMBB)
650*81ad6265SDimitry Andric     setTrueBranch(BranchMI, NewBlk);
651*81ad6265SDimitry Andric }
652*81ad6265SDimitry Andric 
653*81ad6265SDimitry Andric void R600MachineCFGStructurizer::wrapup(MachineBasicBlock *MBB) {
654*81ad6265SDimitry Andric   assert((!MBB->getParent()->getJumpTableInfo()
655*81ad6265SDimitry Andric           || MBB->getParent()->getJumpTableInfo()->isEmpty())
656*81ad6265SDimitry Andric          && "found a jump table");
657*81ad6265SDimitry Andric 
658*81ad6265SDimitry Andric    //collect continue right before endloop
659*81ad6265SDimitry Andric    SmallVector<MachineInstr *, DEFAULT_VEC_SLOTS> ContInstr;
660*81ad6265SDimitry Andric    MachineBasicBlock::iterator Pre = MBB->begin();
661*81ad6265SDimitry Andric    MachineBasicBlock::iterator E = MBB->end();
662*81ad6265SDimitry Andric    MachineBasicBlock::iterator It = Pre;
663*81ad6265SDimitry Andric    while (It != E) {
664*81ad6265SDimitry Andric      if (Pre->getOpcode() == R600::CONTINUE
665*81ad6265SDimitry Andric          && It->getOpcode() == R600::ENDLOOP)
666*81ad6265SDimitry Andric        ContInstr.push_back(&*Pre);
667*81ad6265SDimitry Andric      Pre = It;
668*81ad6265SDimitry Andric      ++It;
669*81ad6265SDimitry Andric    }
670*81ad6265SDimitry Andric 
671*81ad6265SDimitry Andric    //delete continue right before endloop
672*81ad6265SDimitry Andric    for (unsigned i = 0; i < ContInstr.size(); ++i)
673*81ad6265SDimitry Andric       ContInstr[i]->eraseFromParent();
674*81ad6265SDimitry Andric 
675*81ad6265SDimitry Andric    // TODO to fix up jump table so later phase won't be confused.  if
676*81ad6265SDimitry Andric    // (jumpTableInfo->isEmpty() == false) { need to clean the jump table, but
677*81ad6265SDimitry Andric    // there isn't such an interface yet.  alternatively, replace all the other
678*81ad6265SDimitry Andric    // blocks in the jump table with the entryBlk //}
679*81ad6265SDimitry Andric }
680*81ad6265SDimitry Andric 
681*81ad6265SDimitry Andric bool R600MachineCFGStructurizer::prepare() {
682*81ad6265SDimitry Andric   bool Changed = false;
683*81ad6265SDimitry Andric 
684*81ad6265SDimitry Andric   //FIXME: if not reducible flow graph, make it so ???
685*81ad6265SDimitry Andric 
686*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "R600MachineCFGStructurizer::prepare\n";);
687*81ad6265SDimitry Andric 
688*81ad6265SDimitry Andric   orderBlocks(FuncRep);
689*81ad6265SDimitry Andric 
690*81ad6265SDimitry Andric   SmallVector<MachineBasicBlock *, DEFAULT_VEC_SLOTS> RetBlks;
691*81ad6265SDimitry Andric 
692*81ad6265SDimitry Andric   // Add an ExitBlk to loop that don't have one
693*81ad6265SDimitry Andric   for (MachineLoop *LoopRep : *MLI) {
694*81ad6265SDimitry Andric     MBBVector ExitingMBBs;
695*81ad6265SDimitry Andric     LoopRep->getExitingBlocks(ExitingMBBs);
696*81ad6265SDimitry Andric 
697*81ad6265SDimitry Andric     if (ExitingMBBs.size() == 0) {
698*81ad6265SDimitry Andric       MachineBasicBlock* DummyExitBlk = normalizeInfiniteLoopExit(LoopRep);
699*81ad6265SDimitry Andric       if (DummyExitBlk)
700*81ad6265SDimitry Andric         RetBlks.push_back(DummyExitBlk);
701*81ad6265SDimitry Andric     }
702*81ad6265SDimitry Andric   }
703*81ad6265SDimitry Andric 
704*81ad6265SDimitry Andric   // Remove unconditional branch instr.
705*81ad6265SDimitry Andric   // Add dummy exit block iff there are multiple returns.
706*81ad6265SDimitry Andric   for (MachineBasicBlock *MBB : OrderedBlks) {
707*81ad6265SDimitry Andric     removeUnconditionalBranch(MBB);
708*81ad6265SDimitry Andric     removeRedundantConditionalBranch(MBB);
709*81ad6265SDimitry Andric     if (isReturnBlock(MBB)) {
710*81ad6265SDimitry Andric       RetBlks.push_back(MBB);
711*81ad6265SDimitry Andric     }
712*81ad6265SDimitry Andric     assert(MBB->succ_size() <= 2);
713*81ad6265SDimitry Andric   }
714*81ad6265SDimitry Andric 
715*81ad6265SDimitry Andric   if (RetBlks.size() >= 2) {
716*81ad6265SDimitry Andric     addDummyExitBlock(RetBlks);
717*81ad6265SDimitry Andric     Changed = true;
718*81ad6265SDimitry Andric   }
719*81ad6265SDimitry Andric 
720*81ad6265SDimitry Andric   return Changed;
721*81ad6265SDimitry Andric }
722*81ad6265SDimitry Andric 
723*81ad6265SDimitry Andric bool R600MachineCFGStructurizer::run() {
724*81ad6265SDimitry Andric   //Assume reducible CFG...
725*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "R600MachineCFGStructurizer::run\n");
726*81ad6265SDimitry Andric 
727*81ad6265SDimitry Andric #ifdef STRESSTEST
728*81ad6265SDimitry Andric   //Use the worse block ordering to test the algorithm.
729*81ad6265SDimitry Andric   ReverseVector(orderedBlks);
730*81ad6265SDimitry Andric #endif
731*81ad6265SDimitry Andric 
732*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "Ordered blocks:\n"; printOrderedBlocks(););
733*81ad6265SDimitry Andric   int NumIter = 0;
734*81ad6265SDimitry Andric   bool Finish = false;
735*81ad6265SDimitry Andric   MachineBasicBlock *MBB;
736*81ad6265SDimitry Andric   bool MakeProgress = false;
737*81ad6265SDimitry Andric   int NumRemainedBlk = countActiveBlock(OrderedBlks.begin(),
738*81ad6265SDimitry Andric                                         OrderedBlks.end());
739*81ad6265SDimitry Andric 
740*81ad6265SDimitry Andric   do {
741*81ad6265SDimitry Andric     ++NumIter;
742*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << "numIter = " << NumIter
743*81ad6265SDimitry Andric                       << ", numRemaintedBlk = " << NumRemainedBlk << "\n";);
744*81ad6265SDimitry Andric     (void)NumIter;
745*81ad6265SDimitry Andric 
746*81ad6265SDimitry Andric     SmallVectorImpl<MachineBasicBlock *>::const_iterator It =
747*81ad6265SDimitry Andric         OrderedBlks.begin();
748*81ad6265SDimitry Andric     SmallVectorImpl<MachineBasicBlock *>::const_iterator E =
749*81ad6265SDimitry Andric         OrderedBlks.end();
750*81ad6265SDimitry Andric 
751*81ad6265SDimitry Andric     SmallVectorImpl<MachineBasicBlock *>::const_iterator SccBeginIter =
752*81ad6265SDimitry Andric         It;
753*81ad6265SDimitry Andric     MachineBasicBlock *SccBeginMBB = nullptr;
754*81ad6265SDimitry Andric     int SccNumBlk = 0;  // The number of active blocks, init to a
755*81ad6265SDimitry Andric                         // maximum possible number.
756*81ad6265SDimitry Andric     int SccNumIter;     // Number of iteration in this SCC.
757*81ad6265SDimitry Andric 
758*81ad6265SDimitry Andric     while (It != E) {
759*81ad6265SDimitry Andric       MBB = *It;
760*81ad6265SDimitry Andric 
761*81ad6265SDimitry Andric       if (!SccBeginMBB) {
762*81ad6265SDimitry Andric         SccBeginIter = It;
763*81ad6265SDimitry Andric         SccBeginMBB = MBB;
764*81ad6265SDimitry Andric         SccNumIter = 0;
765*81ad6265SDimitry Andric         SccNumBlk = NumRemainedBlk; // Init to maximum possible number.
766*81ad6265SDimitry Andric         LLVM_DEBUG(dbgs() << "start processing SCC" << getSCCNum(SccBeginMBB);
767*81ad6265SDimitry Andric                    dbgs() << "\n";);
768*81ad6265SDimitry Andric       }
769*81ad6265SDimitry Andric 
770*81ad6265SDimitry Andric       if (!isRetiredBlock(MBB))
771*81ad6265SDimitry Andric         patternMatch(MBB);
772*81ad6265SDimitry Andric 
773*81ad6265SDimitry Andric       ++It;
774*81ad6265SDimitry Andric 
775*81ad6265SDimitry Andric       bool ContNextScc = true;
776*81ad6265SDimitry Andric       if (It == E
777*81ad6265SDimitry Andric           || getSCCNum(SccBeginMBB) != getSCCNum(*It)) {
778*81ad6265SDimitry Andric         // Just finish one scc.
779*81ad6265SDimitry Andric         ++SccNumIter;
780*81ad6265SDimitry Andric         int sccRemainedNumBlk = countActiveBlock(SccBeginIter, It);
781*81ad6265SDimitry Andric         if (sccRemainedNumBlk != 1 && sccRemainedNumBlk >= SccNumBlk) {
782*81ad6265SDimitry Andric           LLVM_DEBUG(dbgs() << "Can't reduce SCC " << getSCCNum(MBB)
783*81ad6265SDimitry Andric                             << ", sccNumIter = " << SccNumIter;
784*81ad6265SDimitry Andric                      dbgs() << "doesn't make any progress\n";);
785*81ad6265SDimitry Andric           (void)SccNumIter;
786*81ad6265SDimitry Andric           ContNextScc = true;
787*81ad6265SDimitry Andric         } else if (sccRemainedNumBlk != 1 && sccRemainedNumBlk < SccNumBlk) {
788*81ad6265SDimitry Andric           SccNumBlk = sccRemainedNumBlk;
789*81ad6265SDimitry Andric           It = SccBeginIter;
790*81ad6265SDimitry Andric           ContNextScc = false;
791*81ad6265SDimitry Andric           LLVM_DEBUG(dbgs() << "repeat processing SCC" << getSCCNum(MBB)
792*81ad6265SDimitry Andric                             << "sccNumIter = " << SccNumIter << '\n';);
793*81ad6265SDimitry Andric         } else {
794*81ad6265SDimitry Andric           // Finish the current scc.
795*81ad6265SDimitry Andric           ContNextScc = true;
796*81ad6265SDimitry Andric         }
797*81ad6265SDimitry Andric       } else {
798*81ad6265SDimitry Andric         // Continue on next component in the current scc.
799*81ad6265SDimitry Andric         ContNextScc = false;
800*81ad6265SDimitry Andric       }
801*81ad6265SDimitry Andric 
802*81ad6265SDimitry Andric       if (ContNextScc)
803*81ad6265SDimitry Andric         SccBeginMBB = nullptr;
804*81ad6265SDimitry Andric     } //while, "one iteration" over the function.
805*81ad6265SDimitry Andric 
806*81ad6265SDimitry Andric     MachineBasicBlock *EntryMBB =
807*81ad6265SDimitry Andric         *GraphTraits<MachineFunction *>::nodes_begin(FuncRep);
808*81ad6265SDimitry Andric     if (EntryMBB->succ_empty()) {
809*81ad6265SDimitry Andric       Finish = true;
810*81ad6265SDimitry Andric       LLVM_DEBUG(dbgs() << "Reduce to one block\n";);
811*81ad6265SDimitry Andric     } else {
812*81ad6265SDimitry Andric       int NewnumRemainedBlk
813*81ad6265SDimitry Andric         = countActiveBlock(OrderedBlks.begin(), OrderedBlks.end());
814*81ad6265SDimitry Andric       // consider cloned blocks ??
815*81ad6265SDimitry Andric       if (NewnumRemainedBlk == 1 || NewnumRemainedBlk < NumRemainedBlk) {
816*81ad6265SDimitry Andric         MakeProgress = true;
817*81ad6265SDimitry Andric         NumRemainedBlk = NewnumRemainedBlk;
818*81ad6265SDimitry Andric       } else {
819*81ad6265SDimitry Andric         MakeProgress = false;
820*81ad6265SDimitry Andric         LLVM_DEBUG(dbgs() << "No progress\n";);
821*81ad6265SDimitry Andric       }
822*81ad6265SDimitry Andric     }
823*81ad6265SDimitry Andric   } while (!Finish && MakeProgress);
824*81ad6265SDimitry Andric 
825*81ad6265SDimitry Andric   // Misc wrap up to maintain the consistency of the Function representation.
826*81ad6265SDimitry Andric   wrapup(*GraphTraits<MachineFunction *>::nodes_begin(FuncRep));
827*81ad6265SDimitry Andric 
828*81ad6265SDimitry Andric   // Detach retired Block, release memory.
829*81ad6265SDimitry Andric   for (auto &It : BlockInfoMap) {
830*81ad6265SDimitry Andric     if (It.second && It.second->IsRetired) {
831*81ad6265SDimitry Andric       assert((It.first)->getNumber() != -1);
832*81ad6265SDimitry Andric       LLVM_DEBUG(dbgs() << "Erase BB" << (It.first)->getNumber() << "\n";);
833*81ad6265SDimitry Andric       It.first->eraseFromParent(); // Remove from the parent Function.
834*81ad6265SDimitry Andric     }
835*81ad6265SDimitry Andric     delete It.second;
836*81ad6265SDimitry Andric   }
837*81ad6265SDimitry Andric   BlockInfoMap.clear();
838*81ad6265SDimitry Andric   LLInfoMap.clear();
839*81ad6265SDimitry Andric 
840*81ad6265SDimitry Andric   if (!Finish) {
841*81ad6265SDimitry Andric     LLVM_DEBUG(FuncRep->viewCFG());
842*81ad6265SDimitry Andric     report_fatal_error("IRREDUCIBLE_CFG");
843*81ad6265SDimitry Andric   }
844*81ad6265SDimitry Andric 
845*81ad6265SDimitry Andric   return true;
846*81ad6265SDimitry Andric }
847*81ad6265SDimitry Andric 
848*81ad6265SDimitry Andric void R600MachineCFGStructurizer::orderBlocks(MachineFunction *MF) {
849*81ad6265SDimitry Andric   int SccNum = 0;
850*81ad6265SDimitry Andric   for (scc_iterator<MachineFunction *> It = scc_begin(MF); !It.isAtEnd();
851*81ad6265SDimitry Andric        ++It, ++SccNum) {
852*81ad6265SDimitry Andric     const std::vector<MachineBasicBlock *> &SccNext = *It;
853*81ad6265SDimitry Andric     for (MachineBasicBlock *MBB : SccNext) {
854*81ad6265SDimitry Andric       OrderedBlks.push_back(MBB);
855*81ad6265SDimitry Andric       recordSccnum(MBB, SccNum);
856*81ad6265SDimitry Andric     }
857*81ad6265SDimitry Andric   }
858*81ad6265SDimitry Andric 
859*81ad6265SDimitry Andric   // walk through all the block in func to check for unreachable
860*81ad6265SDimitry Andric   for (auto *MBB : nodes(MF)) {
861*81ad6265SDimitry Andric     SccNum = getSCCNum(MBB);
862*81ad6265SDimitry Andric     if (SccNum == INVALIDSCCNUM)
863*81ad6265SDimitry Andric       dbgs() << "unreachable block BB" << MBB->getNumber() << "\n";
864*81ad6265SDimitry Andric   }
865*81ad6265SDimitry Andric }
866*81ad6265SDimitry Andric 
867*81ad6265SDimitry Andric int R600MachineCFGStructurizer::patternMatch(MachineBasicBlock *MBB) {
868*81ad6265SDimitry Andric   int NumMatch = 0;
869*81ad6265SDimitry Andric   int CurMatch;
870*81ad6265SDimitry Andric 
871*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "Begin patternMatch BB" << MBB->getNumber() << "\n";);
872*81ad6265SDimitry Andric 
873*81ad6265SDimitry Andric   while ((CurMatch = patternMatchGroup(MBB)) > 0)
874*81ad6265SDimitry Andric     NumMatch += CurMatch;
875*81ad6265SDimitry Andric 
876*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "End patternMatch BB" << MBB->getNumber()
877*81ad6265SDimitry Andric                     << ", numMatch = " << NumMatch << "\n";);
878*81ad6265SDimitry Andric 
879*81ad6265SDimitry Andric   return NumMatch;
880*81ad6265SDimitry Andric }
881*81ad6265SDimitry Andric 
882*81ad6265SDimitry Andric int R600MachineCFGStructurizer::patternMatchGroup(MachineBasicBlock *MBB) {
883*81ad6265SDimitry Andric   int NumMatch = 0;
884*81ad6265SDimitry Andric   NumMatch += loopendPatternMatch();
885*81ad6265SDimitry Andric   NumMatch += serialPatternMatch(MBB);
886*81ad6265SDimitry Andric   NumMatch += ifPatternMatch(MBB);
887*81ad6265SDimitry Andric   return NumMatch;
888*81ad6265SDimitry Andric }
889*81ad6265SDimitry Andric 
890*81ad6265SDimitry Andric int R600MachineCFGStructurizer::serialPatternMatch(MachineBasicBlock *MBB) {
891*81ad6265SDimitry Andric   if (MBB->succ_size() != 1)
892*81ad6265SDimitry Andric     return 0;
893*81ad6265SDimitry Andric 
894*81ad6265SDimitry Andric   MachineBasicBlock *childBlk = *MBB->succ_begin();
895*81ad6265SDimitry Andric   if (childBlk->pred_size() != 1 || isActiveLoophead(childBlk))
896*81ad6265SDimitry Andric     return 0;
897*81ad6265SDimitry Andric 
898*81ad6265SDimitry Andric   mergeSerialBlock(MBB, childBlk);
899*81ad6265SDimitry Andric   ++numSerialPatternMatch;
900*81ad6265SDimitry Andric   return 1;
901*81ad6265SDimitry Andric }
902*81ad6265SDimitry Andric 
903*81ad6265SDimitry Andric int R600MachineCFGStructurizer::ifPatternMatch(MachineBasicBlock *MBB) {
904*81ad6265SDimitry Andric   //two edges
905*81ad6265SDimitry Andric   if (MBB->succ_size() != 2)
906*81ad6265SDimitry Andric     return 0;
907*81ad6265SDimitry Andric   if (hasBackEdge(MBB))
908*81ad6265SDimitry Andric     return 0;
909*81ad6265SDimitry Andric   MachineInstr *BranchMI = getNormalBlockBranchInstr(MBB);
910*81ad6265SDimitry Andric   if (!BranchMI)
911*81ad6265SDimitry Andric     return 0;
912*81ad6265SDimitry Andric 
913*81ad6265SDimitry Andric   assert(isCondBranch(BranchMI));
914*81ad6265SDimitry Andric   int NumMatch = 0;
915*81ad6265SDimitry Andric 
916*81ad6265SDimitry Andric   MachineBasicBlock *TrueMBB = getTrueBranch(BranchMI);
917*81ad6265SDimitry Andric   NumMatch += serialPatternMatch(TrueMBB);
918*81ad6265SDimitry Andric   NumMatch += ifPatternMatch(TrueMBB);
919*81ad6265SDimitry Andric   MachineBasicBlock *FalseMBB = getFalseBranch(MBB, BranchMI);
920*81ad6265SDimitry Andric   NumMatch += serialPatternMatch(FalseMBB);
921*81ad6265SDimitry Andric   NumMatch += ifPatternMatch(FalseMBB);
922*81ad6265SDimitry Andric   MachineBasicBlock *LandBlk;
923*81ad6265SDimitry Andric   int Cloned = 0;
924*81ad6265SDimitry Andric 
925*81ad6265SDimitry Andric   assert (!TrueMBB->succ_empty() || !FalseMBB->succ_empty());
926*81ad6265SDimitry Andric   // TODO: Simplify
927*81ad6265SDimitry Andric   if (TrueMBB->succ_size() == 1 && FalseMBB->succ_size() == 1
928*81ad6265SDimitry Andric     && *TrueMBB->succ_begin() == *FalseMBB->succ_begin()) {
929*81ad6265SDimitry Andric     // Diamond pattern
930*81ad6265SDimitry Andric     LandBlk = *TrueMBB->succ_begin();
931*81ad6265SDimitry Andric   } else if (TrueMBB->succ_size() == 1 && *TrueMBB->succ_begin() == FalseMBB) {
932*81ad6265SDimitry Andric     // Triangle pattern, false is empty
933*81ad6265SDimitry Andric     LandBlk = FalseMBB;
934*81ad6265SDimitry Andric     FalseMBB = nullptr;
935*81ad6265SDimitry Andric   } else if (FalseMBB->succ_size() == 1
936*81ad6265SDimitry Andric              && *FalseMBB->succ_begin() == TrueMBB) {
937*81ad6265SDimitry Andric     // Triangle pattern, true is empty
938*81ad6265SDimitry Andric     // We reverse the predicate to make a triangle, empty false pattern;
939*81ad6265SDimitry Andric     std::swap(TrueMBB, FalseMBB);
940*81ad6265SDimitry Andric     reversePredicateSetter(MBB->end(), *MBB);
941*81ad6265SDimitry Andric     LandBlk = FalseMBB;
942*81ad6265SDimitry Andric     FalseMBB = nullptr;
943*81ad6265SDimitry Andric   } else if (FalseMBB->succ_size() == 1
944*81ad6265SDimitry Andric              && isSameloopDetachedContbreak(TrueMBB, FalseMBB)) {
945*81ad6265SDimitry Andric     LandBlk = *FalseMBB->succ_begin();
946*81ad6265SDimitry Andric   } else if (TrueMBB->succ_size() == 1
947*81ad6265SDimitry Andric     && isSameloopDetachedContbreak(FalseMBB, TrueMBB)) {
948*81ad6265SDimitry Andric     LandBlk = *TrueMBB->succ_begin();
949*81ad6265SDimitry Andric   } else {
950*81ad6265SDimitry Andric     return NumMatch + handleJumpintoIf(MBB, TrueMBB, FalseMBB);
951*81ad6265SDimitry Andric   }
952*81ad6265SDimitry Andric 
953*81ad6265SDimitry Andric   // improveSimpleJumpinfoIf can handle the case where landBlk == NULL but the
954*81ad6265SDimitry Andric   // new BB created for landBlk==NULL may introduce new challenge to the
955*81ad6265SDimitry Andric   // reduction process.
956*81ad6265SDimitry Andric   if (LandBlk &&
957*81ad6265SDimitry Andric       ((TrueMBB && TrueMBB->pred_size() > 1)
958*81ad6265SDimitry Andric       || (FalseMBB && FalseMBB->pred_size() > 1))) {
959*81ad6265SDimitry Andric      Cloned += improveSimpleJumpintoIf(MBB, TrueMBB, FalseMBB, &LandBlk);
960*81ad6265SDimitry Andric   }
961*81ad6265SDimitry Andric 
962*81ad6265SDimitry Andric   if (TrueMBB && TrueMBB->pred_size() > 1) {
963*81ad6265SDimitry Andric     TrueMBB = cloneBlockForPredecessor(TrueMBB, MBB);
964*81ad6265SDimitry Andric     ++Cloned;
965*81ad6265SDimitry Andric   }
966*81ad6265SDimitry Andric 
967*81ad6265SDimitry Andric   if (FalseMBB && FalseMBB->pred_size() > 1) {
968*81ad6265SDimitry Andric     FalseMBB = cloneBlockForPredecessor(FalseMBB, MBB);
969*81ad6265SDimitry Andric     ++Cloned;
970*81ad6265SDimitry Andric   }
971*81ad6265SDimitry Andric 
972*81ad6265SDimitry Andric   mergeIfthenelseBlock(BranchMI, MBB, TrueMBB, FalseMBB, LandBlk);
973*81ad6265SDimitry Andric 
974*81ad6265SDimitry Andric   ++numIfPatternMatch;
975*81ad6265SDimitry Andric 
976*81ad6265SDimitry Andric   numClonedBlock += Cloned;
977*81ad6265SDimitry Andric 
978*81ad6265SDimitry Andric   return 1 + Cloned + NumMatch;
979*81ad6265SDimitry Andric }
980*81ad6265SDimitry Andric 
981*81ad6265SDimitry Andric int R600MachineCFGStructurizer::loopendPatternMatch() {
982*81ad6265SDimitry Andric   std::deque<MachineLoop *> NestedLoops;
983*81ad6265SDimitry Andric   for (auto &It: *MLI)
984*81ad6265SDimitry Andric     for (MachineLoop *ML : depth_first(It))
985*81ad6265SDimitry Andric       NestedLoops.push_front(ML);
986*81ad6265SDimitry Andric 
987*81ad6265SDimitry Andric   if (NestedLoops.empty())
988*81ad6265SDimitry Andric     return 0;
989*81ad6265SDimitry Andric 
990*81ad6265SDimitry Andric   // Process nested loop outside->inside (we did push_front),
991*81ad6265SDimitry Andric   // so "continue" to a outside loop won't be mistaken as "break"
992*81ad6265SDimitry Andric   // of the current loop.
993*81ad6265SDimitry Andric   int Num = 0;
994*81ad6265SDimitry Andric   for (MachineLoop *ExaminedLoop : NestedLoops) {
995*81ad6265SDimitry Andric     if (ExaminedLoop->getNumBlocks() == 0 || Visited[ExaminedLoop])
996*81ad6265SDimitry Andric       continue;
997*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << "Processing:\n"; ExaminedLoop->dump(););
998*81ad6265SDimitry Andric     int NumBreak = mergeLoop(ExaminedLoop);
999*81ad6265SDimitry Andric     if (NumBreak == -1)
1000*81ad6265SDimitry Andric       break;
1001*81ad6265SDimitry Andric     Num += NumBreak;
1002*81ad6265SDimitry Andric   }
1003*81ad6265SDimitry Andric   return Num;
1004*81ad6265SDimitry Andric }
1005*81ad6265SDimitry Andric 
1006*81ad6265SDimitry Andric int R600MachineCFGStructurizer::mergeLoop(MachineLoop *LoopRep) {
1007*81ad6265SDimitry Andric   MachineBasicBlock *LoopHeader = LoopRep->getHeader();
1008*81ad6265SDimitry Andric   MBBVector ExitingMBBs;
1009*81ad6265SDimitry Andric   LoopRep->getExitingBlocks(ExitingMBBs);
1010*81ad6265SDimitry Andric   assert(!ExitingMBBs.empty() && "Infinite Loop not supported");
1011*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "Loop has " << ExitingMBBs.size()
1012*81ad6265SDimitry Andric                     << " exiting blocks\n";);
1013*81ad6265SDimitry Andric   // We assume a single ExitBlk
1014*81ad6265SDimitry Andric   MBBVector ExitBlks;
1015*81ad6265SDimitry Andric   LoopRep->getExitBlocks(ExitBlks);
1016*81ad6265SDimitry Andric   SmallPtrSet<MachineBasicBlock *, 2> ExitBlkSet;
1017*81ad6265SDimitry Andric   for (unsigned i = 0, e = ExitBlks.size(); i < e; ++i)
1018*81ad6265SDimitry Andric     ExitBlkSet.insert(ExitBlks[i]);
1019*81ad6265SDimitry Andric   assert(ExitBlkSet.size() == 1);
1020*81ad6265SDimitry Andric   MachineBasicBlock *ExitBlk = *ExitBlks.begin();
1021*81ad6265SDimitry Andric   assert(ExitBlk && "Loop has several exit block");
1022*81ad6265SDimitry Andric   MBBVector LatchBlks;
1023*81ad6265SDimitry Andric   for (auto *LB : inverse_children<MachineBasicBlock*>(LoopHeader))
1024*81ad6265SDimitry Andric     if (LoopRep->contains(LB))
1025*81ad6265SDimitry Andric       LatchBlks.push_back(LB);
1026*81ad6265SDimitry Andric 
1027*81ad6265SDimitry Andric   for (unsigned i = 0, e = ExitingMBBs.size(); i < e; ++i)
1028*81ad6265SDimitry Andric     mergeLoopbreakBlock(ExitingMBBs[i], ExitBlk);
1029*81ad6265SDimitry Andric   for (unsigned i = 0, e = LatchBlks.size(); i < e; ++i)
1030*81ad6265SDimitry Andric     settleLoopcontBlock(LatchBlks[i], LoopHeader);
1031*81ad6265SDimitry Andric   int Match = 0;
1032*81ad6265SDimitry Andric   do {
1033*81ad6265SDimitry Andric     Match = 0;
1034*81ad6265SDimitry Andric     Match += serialPatternMatch(LoopHeader);
1035*81ad6265SDimitry Andric     Match += ifPatternMatch(LoopHeader);
1036*81ad6265SDimitry Andric   } while (Match > 0);
1037*81ad6265SDimitry Andric   mergeLooplandBlock(LoopHeader, ExitBlk);
1038*81ad6265SDimitry Andric   MachineLoop *ParentLoop = LoopRep->getParentLoop();
1039*81ad6265SDimitry Andric   if (ParentLoop)
1040*81ad6265SDimitry Andric     MLI->changeLoopFor(LoopHeader, ParentLoop);
1041*81ad6265SDimitry Andric   else
1042*81ad6265SDimitry Andric     MLI->removeBlock(LoopHeader);
1043*81ad6265SDimitry Andric   Visited[LoopRep] = true;
1044*81ad6265SDimitry Andric   return 1;
1045*81ad6265SDimitry Andric }
1046*81ad6265SDimitry Andric 
1047*81ad6265SDimitry Andric bool R600MachineCFGStructurizer::isSameloopDetachedContbreak(
1048*81ad6265SDimitry Andric     MachineBasicBlock *Src1MBB, MachineBasicBlock *Src2MBB) {
1049*81ad6265SDimitry Andric   if (Src1MBB->succ_empty()) {
1050*81ad6265SDimitry Andric     MachineLoop *LoopRep = MLI->getLoopFor(Src1MBB);
1051*81ad6265SDimitry Andric     if (LoopRep&& LoopRep == MLI->getLoopFor(Src2MBB)) {
1052*81ad6265SDimitry Andric       MachineBasicBlock *&TheEntry = LLInfoMap[LoopRep];
1053*81ad6265SDimitry Andric       if (TheEntry) {
1054*81ad6265SDimitry Andric         LLVM_DEBUG(dbgs() << "isLoopContBreakBlock yes src1 = BB"
1055*81ad6265SDimitry Andric                           << Src1MBB->getNumber() << " src2 = BB"
1056*81ad6265SDimitry Andric                           << Src2MBB->getNumber() << "\n";);
1057*81ad6265SDimitry Andric         return true;
1058*81ad6265SDimitry Andric       }
1059*81ad6265SDimitry Andric     }
1060*81ad6265SDimitry Andric   }
1061*81ad6265SDimitry Andric   return false;
1062*81ad6265SDimitry Andric }
1063*81ad6265SDimitry Andric 
1064*81ad6265SDimitry Andric int R600MachineCFGStructurizer::handleJumpintoIf(MachineBasicBlock *HeadMBB,
1065*81ad6265SDimitry Andric     MachineBasicBlock *TrueMBB, MachineBasicBlock *FalseMBB) {
1066*81ad6265SDimitry Andric   int Num = handleJumpintoIfImp(HeadMBB, TrueMBB, FalseMBB);
1067*81ad6265SDimitry Andric   if (Num == 0) {
1068*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << "handleJumpintoIf swap trueBlk and FalseBlk"
1069*81ad6265SDimitry Andric                       << "\n";);
1070*81ad6265SDimitry Andric     Num = handleJumpintoIfImp(HeadMBB, FalseMBB, TrueMBB);
1071*81ad6265SDimitry Andric   }
1072*81ad6265SDimitry Andric   return Num;
1073*81ad6265SDimitry Andric }
1074*81ad6265SDimitry Andric 
1075*81ad6265SDimitry Andric int R600MachineCFGStructurizer::handleJumpintoIfImp(MachineBasicBlock *HeadMBB,
1076*81ad6265SDimitry Andric     MachineBasicBlock *TrueMBB, MachineBasicBlock *FalseMBB) {
1077*81ad6265SDimitry Andric   int Num = 0;
1078*81ad6265SDimitry Andric   MachineBasicBlock *DownBlk;
1079*81ad6265SDimitry Andric 
1080*81ad6265SDimitry Andric   //trueBlk could be the common post dominator
1081*81ad6265SDimitry Andric   DownBlk = TrueMBB;
1082*81ad6265SDimitry Andric 
1083*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "handleJumpintoIfImp head = BB" << HeadMBB->getNumber()
1084*81ad6265SDimitry Andric                     << " true = BB" << TrueMBB->getNumber()
1085*81ad6265SDimitry Andric                     << ", numSucc=" << TrueMBB->succ_size() << " false = BB"
1086*81ad6265SDimitry Andric                     << FalseMBB->getNumber() << "\n";);
1087*81ad6265SDimitry Andric 
1088*81ad6265SDimitry Andric   while (DownBlk) {
1089*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << "check down = BB" << DownBlk->getNumber(););
1090*81ad6265SDimitry Andric 
1091*81ad6265SDimitry Andric     if (singlePathTo(FalseMBB, DownBlk) == SinglePath_InPath) {
1092*81ad6265SDimitry Andric       LLVM_DEBUG(dbgs() << " working\n";);
1093*81ad6265SDimitry Andric 
1094*81ad6265SDimitry Andric       Num += cloneOnSideEntryTo(HeadMBB, TrueMBB, DownBlk);
1095*81ad6265SDimitry Andric       Num += cloneOnSideEntryTo(HeadMBB, FalseMBB, DownBlk);
1096*81ad6265SDimitry Andric 
1097*81ad6265SDimitry Andric       numClonedBlock += Num;
1098*81ad6265SDimitry Andric       Num += serialPatternMatch(*HeadMBB->succ_begin());
1099*81ad6265SDimitry Andric       Num += serialPatternMatch(*std::next(HeadMBB->succ_begin()));
1100*81ad6265SDimitry Andric       Num += ifPatternMatch(HeadMBB);
1101*81ad6265SDimitry Andric       assert(Num > 0);
1102*81ad6265SDimitry Andric 
1103*81ad6265SDimitry Andric       break;
1104*81ad6265SDimitry Andric     }
1105*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << " not working\n";);
1106*81ad6265SDimitry Andric     DownBlk = (DownBlk->succ_size() == 1) ? (*DownBlk->succ_begin()) : nullptr;
1107*81ad6265SDimitry Andric   } // walk down the postDomTree
1108*81ad6265SDimitry Andric 
1109*81ad6265SDimitry Andric   return Num;
1110*81ad6265SDimitry Andric }
1111*81ad6265SDimitry Andric 
1112*81ad6265SDimitry Andric #ifndef NDEBUG
1113*81ad6265SDimitry Andric void R600MachineCFGStructurizer::showImproveSimpleJumpintoIf(
1114*81ad6265SDimitry Andric     MachineBasicBlock *HeadMBB, MachineBasicBlock *TrueMBB,
1115*81ad6265SDimitry Andric     MachineBasicBlock *FalseMBB, MachineBasicBlock *LandMBB, bool Detail) {
1116*81ad6265SDimitry Andric   dbgs() << "head = BB" << HeadMBB->getNumber()
1117*81ad6265SDimitry Andric          << " size = " << HeadMBB->size();
1118*81ad6265SDimitry Andric   if (Detail) {
1119*81ad6265SDimitry Andric     dbgs() << "\n";
1120*81ad6265SDimitry Andric     HeadMBB->print(dbgs());
1121*81ad6265SDimitry Andric     dbgs() << "\n";
1122*81ad6265SDimitry Andric   }
1123*81ad6265SDimitry Andric 
1124*81ad6265SDimitry Andric   if (TrueMBB) {
1125*81ad6265SDimitry Andric     dbgs() << ", true = BB" << TrueMBB->getNumber() << " size = "
1126*81ad6265SDimitry Andric            << TrueMBB->size() << " numPred = " << TrueMBB->pred_size();
1127*81ad6265SDimitry Andric     if (Detail) {
1128*81ad6265SDimitry Andric       dbgs() << "\n";
1129*81ad6265SDimitry Andric       TrueMBB->print(dbgs());
1130*81ad6265SDimitry Andric       dbgs() << "\n";
1131*81ad6265SDimitry Andric     }
1132*81ad6265SDimitry Andric   }
1133*81ad6265SDimitry Andric   if (FalseMBB) {
1134*81ad6265SDimitry Andric     dbgs() << ", false = BB" << FalseMBB->getNumber() << " size = "
1135*81ad6265SDimitry Andric            << FalseMBB->size() << " numPred = " << FalseMBB->pred_size();
1136*81ad6265SDimitry Andric     if (Detail) {
1137*81ad6265SDimitry Andric       dbgs() << "\n";
1138*81ad6265SDimitry Andric       FalseMBB->print(dbgs());
1139*81ad6265SDimitry Andric       dbgs() << "\n";
1140*81ad6265SDimitry Andric     }
1141*81ad6265SDimitry Andric   }
1142*81ad6265SDimitry Andric   if (LandMBB) {
1143*81ad6265SDimitry Andric     dbgs() << ", land = BB" << LandMBB->getNumber() << " size = "
1144*81ad6265SDimitry Andric            << LandMBB->size() << " numPred = " << LandMBB->pred_size();
1145*81ad6265SDimitry Andric     if (Detail) {
1146*81ad6265SDimitry Andric       dbgs() << "\n";
1147*81ad6265SDimitry Andric       LandMBB->print(dbgs());
1148*81ad6265SDimitry Andric       dbgs() << "\n";
1149*81ad6265SDimitry Andric     }
1150*81ad6265SDimitry Andric   }
1151*81ad6265SDimitry Andric 
1152*81ad6265SDimitry Andric   dbgs() << "\n";
1153*81ad6265SDimitry Andric }
1154*81ad6265SDimitry Andric #endif
1155*81ad6265SDimitry Andric 
1156*81ad6265SDimitry Andric int R600MachineCFGStructurizer::improveSimpleJumpintoIf(MachineBasicBlock *HeadMBB,
1157*81ad6265SDimitry Andric     MachineBasicBlock *TrueMBB, MachineBasicBlock *FalseMBB,
1158*81ad6265SDimitry Andric     MachineBasicBlock **LandMBBPtr) {
1159*81ad6265SDimitry Andric   bool MigrateTrue = false;
1160*81ad6265SDimitry Andric   bool MigrateFalse = false;
1161*81ad6265SDimitry Andric 
1162*81ad6265SDimitry Andric   MachineBasicBlock *LandBlk = *LandMBBPtr;
1163*81ad6265SDimitry Andric 
1164*81ad6265SDimitry Andric   assert((!TrueMBB || TrueMBB->succ_size() <= 1)
1165*81ad6265SDimitry Andric          && (!FalseMBB || FalseMBB->succ_size() <= 1));
1166*81ad6265SDimitry Andric 
1167*81ad6265SDimitry Andric   if (TrueMBB == FalseMBB)
1168*81ad6265SDimitry Andric     return 0;
1169*81ad6265SDimitry Andric 
1170*81ad6265SDimitry Andric   MigrateTrue = needMigrateBlock(TrueMBB);
1171*81ad6265SDimitry Andric   MigrateFalse = needMigrateBlock(FalseMBB);
1172*81ad6265SDimitry Andric 
1173*81ad6265SDimitry Andric   if (!MigrateTrue && !MigrateFalse)
1174*81ad6265SDimitry Andric     return 0;
1175*81ad6265SDimitry Andric 
1176*81ad6265SDimitry Andric   // If we need to migrate either trueBlk and falseBlk, migrate the rest that
1177*81ad6265SDimitry Andric   // have more than one predecessors.  without doing this, its predecessor
1178*81ad6265SDimitry Andric   // rather than headBlk will have undefined value in initReg.
1179*81ad6265SDimitry Andric   if (!MigrateTrue && TrueMBB && TrueMBB->pred_size() > 1)
1180*81ad6265SDimitry Andric     MigrateTrue = true;
1181*81ad6265SDimitry Andric   if (!MigrateFalse && FalseMBB && FalseMBB->pred_size() > 1)
1182*81ad6265SDimitry Andric     MigrateFalse = true;
1183*81ad6265SDimitry Andric 
1184*81ad6265SDimitry Andric   LLVM_DEBUG(
1185*81ad6265SDimitry Andric       dbgs() << "before improveSimpleJumpintoIf: ";
1186*81ad6265SDimitry Andric       showImproveSimpleJumpintoIf(HeadMBB, TrueMBB, FalseMBB, LandBlk, 0););
1187*81ad6265SDimitry Andric 
1188*81ad6265SDimitry Andric   // org: headBlk => if () {trueBlk} else {falseBlk} => landBlk
1189*81ad6265SDimitry Andric   //
1190*81ad6265SDimitry Andric   // new: headBlk => if () {initReg = 1; org trueBlk branch} else
1191*81ad6265SDimitry Andric   //      {initReg = 0; org falseBlk branch }
1192*81ad6265SDimitry Andric   //      => landBlk => if (initReg) {org trueBlk} else {org falseBlk}
1193*81ad6265SDimitry Andric   //      => org landBlk
1194*81ad6265SDimitry Andric   //      if landBlk->pred_size() > 2, put the about if-else inside
1195*81ad6265SDimitry Andric   //      if (initReg !=2) {...}
1196*81ad6265SDimitry Andric   //
1197*81ad6265SDimitry Andric   // add initReg = initVal to headBlk
1198*81ad6265SDimitry Andric 
1199*81ad6265SDimitry Andric   const TargetRegisterClass * I32RC = TRI->getCFGStructurizerRegClass(MVT::i32);
1200*81ad6265SDimitry Andric   if (!MigrateTrue || !MigrateFalse) {
1201*81ad6265SDimitry Andric     // XXX: We have an opportunity here to optimize the "branch into if" case
1202*81ad6265SDimitry Andric     // here.  Branch into if looks like this:
1203*81ad6265SDimitry Andric     //                        entry
1204*81ad6265SDimitry Andric     //                       /     |
1205*81ad6265SDimitry Andric     //           diamond_head       branch_from
1206*81ad6265SDimitry Andric     //             /      \           |
1207*81ad6265SDimitry Andric     // diamond_false        diamond_true
1208*81ad6265SDimitry Andric     //             \      /
1209*81ad6265SDimitry Andric     //               done
1210*81ad6265SDimitry Andric     //
1211*81ad6265SDimitry Andric     // The diamond_head block begins the "if" and the diamond_true block
1212*81ad6265SDimitry Andric     // is the block being "branched into".
1213*81ad6265SDimitry Andric     //
1214*81ad6265SDimitry Andric     // If MigrateTrue is true, then TrueBB is the block being "branched into"
1215*81ad6265SDimitry Andric     // and if MigrateFalse is true, then FalseBB is the block being
1216*81ad6265SDimitry Andric     // "branched into"
1217*81ad6265SDimitry Andric     //
1218*81ad6265SDimitry Andric     // Here is the pseudo code for how I think the optimization should work:
1219*81ad6265SDimitry Andric     // 1. Insert MOV GPR0, 0 before the branch instruction in diamond_head.
1220*81ad6265SDimitry Andric     // 2. Insert MOV GPR0, 1 before the branch instruction in branch_from.
1221*81ad6265SDimitry Andric     // 3. Move the branch instruction from diamond_head into its own basic
1222*81ad6265SDimitry Andric     //    block (new_block).
1223*81ad6265SDimitry Andric     // 4. Add an unconditional branch from diamond_head to new_block
1224*81ad6265SDimitry Andric     // 5. Replace the branch instruction in branch_from with an unconditional
1225*81ad6265SDimitry Andric     //    branch to new_block.  If branch_from has multiple predecessors, then
1226*81ad6265SDimitry Andric     //    we need to replace the True/False block in the branch
1227*81ad6265SDimitry Andric     //    instruction instead of replacing it.
1228*81ad6265SDimitry Andric     // 6. Change the condition of the branch instruction in new_block from
1229*81ad6265SDimitry Andric     //    COND to (COND || GPR0)
1230*81ad6265SDimitry Andric     //
1231*81ad6265SDimitry Andric     // In order insert these MOV instruction, we will need to use the
1232*81ad6265SDimitry Andric     // RegisterScavenger.  Usually liveness stops being tracked during
1233*81ad6265SDimitry Andric     // the late machine optimization passes, however if we implement
1234*81ad6265SDimitry Andric     // bool TargetRegisterInfo::requiresRegisterScavenging(
1235*81ad6265SDimitry Andric     //                                                const MachineFunction &MF)
1236*81ad6265SDimitry Andric     // and have it return true, liveness will be tracked correctly
1237*81ad6265SDimitry Andric     // by generic optimization passes.  We will also need to make sure that
1238*81ad6265SDimitry Andric     // all of our target-specific passes that run after regalloc and before
1239*81ad6265SDimitry Andric     // the CFGStructurizer track liveness and we will need to modify this pass
1240*81ad6265SDimitry Andric     // to correctly track liveness.
1241*81ad6265SDimitry Andric     //
1242*81ad6265SDimitry Andric     // After the above changes, the new CFG should look like this:
1243*81ad6265SDimitry Andric     //                        entry
1244*81ad6265SDimitry Andric     //                       /     |
1245*81ad6265SDimitry Andric     //           diamond_head       branch_from
1246*81ad6265SDimitry Andric     //                       \     /
1247*81ad6265SDimitry Andric     //                      new_block
1248*81ad6265SDimitry Andric     //                      /      |
1249*81ad6265SDimitry Andric     //         diamond_false        diamond_true
1250*81ad6265SDimitry Andric     //                      \      /
1251*81ad6265SDimitry Andric     //                        done
1252*81ad6265SDimitry Andric     //
1253*81ad6265SDimitry Andric     // Without this optimization, we are forced to duplicate the diamond_true
1254*81ad6265SDimitry Andric     // block and we will end up with a CFG like this:
1255*81ad6265SDimitry Andric     //
1256*81ad6265SDimitry Andric     //                        entry
1257*81ad6265SDimitry Andric     //                       /     |
1258*81ad6265SDimitry Andric     //           diamond_head       branch_from
1259*81ad6265SDimitry Andric     //             /      \                   |
1260*81ad6265SDimitry Andric     // diamond_false        diamond_true      diamond_true (duplicate)
1261*81ad6265SDimitry Andric     //             \      /                   |
1262*81ad6265SDimitry Andric     //               done --------------------|
1263*81ad6265SDimitry Andric     //
1264*81ad6265SDimitry Andric     // Duplicating diamond_true can be very costly especially if it has a
1265*81ad6265SDimitry Andric     // lot of instructions.
1266*81ad6265SDimitry Andric     return 0;
1267*81ad6265SDimitry Andric   }
1268*81ad6265SDimitry Andric 
1269*81ad6265SDimitry Andric   int NumNewBlk = 0;
1270*81ad6265SDimitry Andric 
1271*81ad6265SDimitry Andric   bool LandBlkHasOtherPred = (LandBlk->pred_size() > 2);
1272*81ad6265SDimitry Andric 
1273*81ad6265SDimitry Andric   //insert R600::ENDIF to avoid special case "input landBlk == NULL"
1274*81ad6265SDimitry Andric   MachineBasicBlock::iterator I = insertInstrBefore(LandBlk, R600::ENDIF);
1275*81ad6265SDimitry Andric 
1276*81ad6265SDimitry Andric   if (LandBlkHasOtherPred) {
1277*81ad6265SDimitry Andric     report_fatal_error("Extra register needed to handle CFG");
1278*81ad6265SDimitry Andric     Register CmpResReg =
1279*81ad6265SDimitry Andric         HeadMBB->getParent()->getRegInfo().createVirtualRegister(I32RC);
1280*81ad6265SDimitry Andric     report_fatal_error("Extra compare instruction needed to handle CFG");
1281*81ad6265SDimitry Andric     insertCondBranchBefore(LandBlk, I, R600::IF_PREDICATE_SET,
1282*81ad6265SDimitry Andric         CmpResReg, DebugLoc());
1283*81ad6265SDimitry Andric   }
1284*81ad6265SDimitry Andric 
1285*81ad6265SDimitry Andric   // XXX: We are running this after RA, so creating virtual registers will
1286*81ad6265SDimitry Andric   // cause an assertion failure in the PostRA scheduling pass.
1287*81ad6265SDimitry Andric   Register InitReg =
1288*81ad6265SDimitry Andric       HeadMBB->getParent()->getRegInfo().createVirtualRegister(I32RC);
1289*81ad6265SDimitry Andric   insertCondBranchBefore(LandBlk, I, R600::IF_PREDICATE_SET, InitReg,
1290*81ad6265SDimitry Andric       DebugLoc());
1291*81ad6265SDimitry Andric 
1292*81ad6265SDimitry Andric   if (MigrateTrue) {
1293*81ad6265SDimitry Andric     migrateInstruction(TrueMBB, LandBlk, I);
1294*81ad6265SDimitry Andric     // need to uncondionally insert the assignment to ensure a path from its
1295*81ad6265SDimitry Andric     // predecessor rather than headBlk has valid value in initReg if
1296*81ad6265SDimitry Andric     // (initVal != 1).
1297*81ad6265SDimitry Andric     report_fatal_error("Extra register needed to handle CFG");
1298*81ad6265SDimitry Andric   }
1299*81ad6265SDimitry Andric   insertInstrBefore(I, R600::ELSE);
1300*81ad6265SDimitry Andric 
1301*81ad6265SDimitry Andric   if (MigrateFalse) {
1302*81ad6265SDimitry Andric     migrateInstruction(FalseMBB, LandBlk, I);
1303*81ad6265SDimitry Andric     // need to uncondionally insert the assignment to ensure a path from its
1304*81ad6265SDimitry Andric     // predecessor rather than headBlk has valid value in initReg if
1305*81ad6265SDimitry Andric     // (initVal != 0)
1306*81ad6265SDimitry Andric     report_fatal_error("Extra register needed to handle CFG");
1307*81ad6265SDimitry Andric   }
1308*81ad6265SDimitry Andric 
1309*81ad6265SDimitry Andric   if (LandBlkHasOtherPred) {
1310*81ad6265SDimitry Andric     // add endif
1311*81ad6265SDimitry Andric     insertInstrBefore(I, R600::ENDIF);
1312*81ad6265SDimitry Andric 
1313*81ad6265SDimitry Andric     // put initReg = 2 to other predecessors of landBlk
1314*81ad6265SDimitry Andric     for (MachineBasicBlock *MBB : LandBlk->predecessors())
1315*81ad6265SDimitry Andric       if (MBB != TrueMBB && MBB != FalseMBB)
1316*81ad6265SDimitry Andric         report_fatal_error("Extra register needed to handle CFG");
1317*81ad6265SDimitry Andric   }
1318*81ad6265SDimitry Andric   LLVM_DEBUG(
1319*81ad6265SDimitry Andric       dbgs() << "result from improveSimpleJumpintoIf: ";
1320*81ad6265SDimitry Andric       showImproveSimpleJumpintoIf(HeadMBB, TrueMBB, FalseMBB, LandBlk, 0););
1321*81ad6265SDimitry Andric 
1322*81ad6265SDimitry Andric   // update landBlk
1323*81ad6265SDimitry Andric   *LandMBBPtr = LandBlk;
1324*81ad6265SDimitry Andric 
1325*81ad6265SDimitry Andric   return NumNewBlk;
1326*81ad6265SDimitry Andric }
1327*81ad6265SDimitry Andric 
1328*81ad6265SDimitry Andric void R600MachineCFGStructurizer::mergeSerialBlock(MachineBasicBlock *DstMBB,
1329*81ad6265SDimitry Andric     MachineBasicBlock *SrcMBB) {
1330*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "serialPattern BB" << DstMBB->getNumber() << " <= BB"
1331*81ad6265SDimitry Andric                     << SrcMBB->getNumber() << "\n";);
1332*81ad6265SDimitry Andric   DstMBB->splice(DstMBB->end(), SrcMBB, SrcMBB->begin(), SrcMBB->end());
1333*81ad6265SDimitry Andric 
1334*81ad6265SDimitry Andric   DstMBB->removeSuccessor(SrcMBB, true);
1335*81ad6265SDimitry Andric   cloneSuccessorList(DstMBB, SrcMBB);
1336*81ad6265SDimitry Andric 
1337*81ad6265SDimitry Andric   removeSuccessor(SrcMBB);
1338*81ad6265SDimitry Andric   MLI->removeBlock(SrcMBB);
1339*81ad6265SDimitry Andric   retireBlock(SrcMBB);
1340*81ad6265SDimitry Andric }
1341*81ad6265SDimitry Andric 
1342*81ad6265SDimitry Andric void R600MachineCFGStructurizer::mergeIfthenelseBlock(MachineInstr *BranchMI,
1343*81ad6265SDimitry Andric     MachineBasicBlock *MBB, MachineBasicBlock *TrueMBB,
1344*81ad6265SDimitry Andric     MachineBasicBlock *FalseMBB, MachineBasicBlock *LandMBB) {
1345*81ad6265SDimitry Andric   assert (TrueMBB);
1346*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "ifPattern BB" << MBB->getNumber(); dbgs() << "{  ";
1347*81ad6265SDimitry Andric              if (TrueMBB) { dbgs() << "BB" << TrueMBB->getNumber(); } dbgs()
1348*81ad6265SDimitry Andric              << "  } else ";
1349*81ad6265SDimitry Andric              dbgs() << "{  "; if (FalseMBB) {
1350*81ad6265SDimitry Andric                dbgs() << "BB" << FalseMBB->getNumber();
1351*81ad6265SDimitry Andric              } dbgs() << "  }\n ";
1352*81ad6265SDimitry Andric              dbgs() << "landBlock: "; if (!LandMBB) { dbgs() << "NULL"; } else {
1353*81ad6265SDimitry Andric                dbgs() << "BB" << LandMBB->getNumber();
1354*81ad6265SDimitry Andric              } dbgs() << "\n";);
1355*81ad6265SDimitry Andric 
1356*81ad6265SDimitry Andric   int OldOpcode = BranchMI->getOpcode();
1357*81ad6265SDimitry Andric   DebugLoc BranchDL = BranchMI->getDebugLoc();
1358*81ad6265SDimitry Andric 
1359*81ad6265SDimitry Andric //    transform to
1360*81ad6265SDimitry Andric //    if cond
1361*81ad6265SDimitry Andric //       trueBlk
1362*81ad6265SDimitry Andric //    else
1363*81ad6265SDimitry Andric //       falseBlk
1364*81ad6265SDimitry Andric //    endif
1365*81ad6265SDimitry Andric //    landBlk
1366*81ad6265SDimitry Andric 
1367*81ad6265SDimitry Andric   MachineBasicBlock::iterator I = BranchMI;
1368*81ad6265SDimitry Andric   insertCondBranchBefore(I, getBranchNzeroOpcode(OldOpcode),
1369*81ad6265SDimitry Andric       BranchDL);
1370*81ad6265SDimitry Andric 
1371*81ad6265SDimitry Andric   if (TrueMBB) {
1372*81ad6265SDimitry Andric     MBB->splice(I, TrueMBB, TrueMBB->begin(), TrueMBB->end());
1373*81ad6265SDimitry Andric     MBB->removeSuccessor(TrueMBB, true);
1374*81ad6265SDimitry Andric     if (LandMBB && TrueMBB->succ_size()!=0)
1375*81ad6265SDimitry Andric       TrueMBB->removeSuccessor(LandMBB, true);
1376*81ad6265SDimitry Andric     retireBlock(TrueMBB);
1377*81ad6265SDimitry Andric     MLI->removeBlock(TrueMBB);
1378*81ad6265SDimitry Andric   }
1379*81ad6265SDimitry Andric 
1380*81ad6265SDimitry Andric   if (FalseMBB) {
1381*81ad6265SDimitry Andric     insertInstrBefore(I, R600::ELSE);
1382*81ad6265SDimitry Andric     MBB->splice(I, FalseMBB, FalseMBB->begin(),
1383*81ad6265SDimitry Andric                    FalseMBB->end());
1384*81ad6265SDimitry Andric     MBB->removeSuccessor(FalseMBB, true);
1385*81ad6265SDimitry Andric     if (LandMBB && !FalseMBB->succ_empty())
1386*81ad6265SDimitry Andric       FalseMBB->removeSuccessor(LandMBB, true);
1387*81ad6265SDimitry Andric     retireBlock(FalseMBB);
1388*81ad6265SDimitry Andric     MLI->removeBlock(FalseMBB);
1389*81ad6265SDimitry Andric   }
1390*81ad6265SDimitry Andric   insertInstrBefore(I, R600::ENDIF);
1391*81ad6265SDimitry Andric 
1392*81ad6265SDimitry Andric   BranchMI->eraseFromParent();
1393*81ad6265SDimitry Andric 
1394*81ad6265SDimitry Andric   if (LandMBB && TrueMBB && FalseMBB)
1395*81ad6265SDimitry Andric     MBB->addSuccessor(LandMBB);
1396*81ad6265SDimitry Andric }
1397*81ad6265SDimitry Andric 
1398*81ad6265SDimitry Andric void R600MachineCFGStructurizer::mergeLooplandBlock(MachineBasicBlock *DstBlk,
1399*81ad6265SDimitry Andric     MachineBasicBlock *LandMBB) {
1400*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "loopPattern header = BB" << DstBlk->getNumber()
1401*81ad6265SDimitry Andric                     << " land = BB" << LandMBB->getNumber() << "\n";);
1402*81ad6265SDimitry Andric 
1403*81ad6265SDimitry Andric   insertInstrBefore(DstBlk, R600::WHILELOOP, DebugLoc());
1404*81ad6265SDimitry Andric   insertInstrEnd(DstBlk, R600::ENDLOOP, DebugLoc());
1405*81ad6265SDimitry Andric   DstBlk->replaceSuccessor(DstBlk, LandMBB);
1406*81ad6265SDimitry Andric }
1407*81ad6265SDimitry Andric 
1408*81ad6265SDimitry Andric void R600MachineCFGStructurizer::mergeLoopbreakBlock(MachineBasicBlock *ExitingMBB,
1409*81ad6265SDimitry Andric     MachineBasicBlock *LandMBB) {
1410*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "loopbreakPattern exiting = BB"
1411*81ad6265SDimitry Andric                     << ExitingMBB->getNumber() << " land = BB"
1412*81ad6265SDimitry Andric                     << LandMBB->getNumber() << "\n";);
1413*81ad6265SDimitry Andric   MachineInstr *BranchMI = getLoopendBlockBranchInstr(ExitingMBB);
1414*81ad6265SDimitry Andric   assert(BranchMI && isCondBranch(BranchMI));
1415*81ad6265SDimitry Andric   DebugLoc DL = BranchMI->getDebugLoc();
1416*81ad6265SDimitry Andric   MachineBasicBlock *TrueBranch = getTrueBranch(BranchMI);
1417*81ad6265SDimitry Andric   MachineBasicBlock::iterator I = BranchMI;
1418*81ad6265SDimitry Andric   if (TrueBranch != LandMBB)
1419*81ad6265SDimitry Andric     reversePredicateSetter(I, *I->getParent());
1420*81ad6265SDimitry Andric   insertCondBranchBefore(ExitingMBB, I, R600::IF_PREDICATE_SET, R600::PREDICATE_BIT, DL);
1421*81ad6265SDimitry Andric   insertInstrBefore(I, R600::BREAK);
1422*81ad6265SDimitry Andric   insertInstrBefore(I, R600::ENDIF);
1423*81ad6265SDimitry Andric   //now branchInst can be erase safely
1424*81ad6265SDimitry Andric   BranchMI->eraseFromParent();
1425*81ad6265SDimitry Andric   //now take care of successors, retire blocks
1426*81ad6265SDimitry Andric   ExitingMBB->removeSuccessor(LandMBB, true);
1427*81ad6265SDimitry Andric }
1428*81ad6265SDimitry Andric 
1429*81ad6265SDimitry Andric void R600MachineCFGStructurizer::settleLoopcontBlock(MachineBasicBlock *ContingMBB,
1430*81ad6265SDimitry Andric     MachineBasicBlock *ContMBB) {
1431*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "settleLoopcontBlock conting = BB"
1432*81ad6265SDimitry Andric                     << ContingMBB->getNumber() << ", cont = BB"
1433*81ad6265SDimitry Andric                     << ContMBB->getNumber() << "\n";);
1434*81ad6265SDimitry Andric 
1435*81ad6265SDimitry Andric   MachineInstr *MI = getLoopendBlockBranchInstr(ContingMBB);
1436*81ad6265SDimitry Andric   if (MI) {
1437*81ad6265SDimitry Andric     assert(isCondBranch(MI));
1438*81ad6265SDimitry Andric     MachineBasicBlock::iterator I = MI;
1439*81ad6265SDimitry Andric     MachineBasicBlock *TrueBranch = getTrueBranch(MI);
1440*81ad6265SDimitry Andric     int OldOpcode = MI->getOpcode();
1441*81ad6265SDimitry Andric     DebugLoc DL = MI->getDebugLoc();
1442*81ad6265SDimitry Andric 
1443*81ad6265SDimitry Andric     bool UseContinueLogical = ((&*ContingMBB->rbegin()) == MI);
1444*81ad6265SDimitry Andric 
1445*81ad6265SDimitry Andric     if (!UseContinueLogical) {
1446*81ad6265SDimitry Andric       int BranchOpcode =
1447*81ad6265SDimitry Andric           TrueBranch == ContMBB ? getBranchNzeroOpcode(OldOpcode) :
1448*81ad6265SDimitry Andric           getBranchZeroOpcode(OldOpcode);
1449*81ad6265SDimitry Andric       insertCondBranchBefore(I, BranchOpcode, DL);
1450*81ad6265SDimitry Andric       // insertEnd to ensure phi-moves, if exist, go before the continue-instr.
1451*81ad6265SDimitry Andric       insertInstrEnd(ContingMBB, R600::CONTINUE, DL);
1452*81ad6265SDimitry Andric       insertInstrEnd(ContingMBB, R600::ENDIF, DL);
1453*81ad6265SDimitry Andric     } else {
1454*81ad6265SDimitry Andric       int BranchOpcode =
1455*81ad6265SDimitry Andric           TrueBranch == ContMBB ? getContinueNzeroOpcode(OldOpcode) :
1456*81ad6265SDimitry Andric           getContinueZeroOpcode(OldOpcode);
1457*81ad6265SDimitry Andric       insertCondBranchBefore(I, BranchOpcode, DL);
1458*81ad6265SDimitry Andric     }
1459*81ad6265SDimitry Andric 
1460*81ad6265SDimitry Andric     MI->eraseFromParent();
1461*81ad6265SDimitry Andric   } else {
1462*81ad6265SDimitry Andric     // if we've arrived here then we've already erased the branch instruction
1463*81ad6265SDimitry Andric     // travel back up the basic block to see the last reference of our debug
1464*81ad6265SDimitry Andric     // location we've just inserted that reference here so it should be
1465*81ad6265SDimitry Andric     // representative insertEnd to ensure phi-moves, if exist, go before the
1466*81ad6265SDimitry Andric     // continue-instr.
1467*81ad6265SDimitry Andric     insertInstrEnd(ContingMBB, R600::CONTINUE,
1468*81ad6265SDimitry Andric         getLastDebugLocInBB(ContingMBB));
1469*81ad6265SDimitry Andric   }
1470*81ad6265SDimitry Andric }
1471*81ad6265SDimitry Andric 
1472*81ad6265SDimitry Andric int R600MachineCFGStructurizer::cloneOnSideEntryTo(MachineBasicBlock *PreMBB,
1473*81ad6265SDimitry Andric     MachineBasicBlock *SrcMBB, MachineBasicBlock *DstMBB) {
1474*81ad6265SDimitry Andric   int Cloned = 0;
1475*81ad6265SDimitry Andric   assert(PreMBB->isSuccessor(SrcMBB));
1476*81ad6265SDimitry Andric   while (SrcMBB && SrcMBB != DstMBB) {
1477*81ad6265SDimitry Andric     assert(SrcMBB->succ_size() == 1);
1478*81ad6265SDimitry Andric     if (SrcMBB->pred_size() > 1) {
1479*81ad6265SDimitry Andric       SrcMBB = cloneBlockForPredecessor(SrcMBB, PreMBB);
1480*81ad6265SDimitry Andric       ++Cloned;
1481*81ad6265SDimitry Andric     }
1482*81ad6265SDimitry Andric 
1483*81ad6265SDimitry Andric     PreMBB = SrcMBB;
1484*81ad6265SDimitry Andric     SrcMBB = *SrcMBB->succ_begin();
1485*81ad6265SDimitry Andric   }
1486*81ad6265SDimitry Andric 
1487*81ad6265SDimitry Andric   return Cloned;
1488*81ad6265SDimitry Andric }
1489*81ad6265SDimitry Andric 
1490*81ad6265SDimitry Andric MachineBasicBlock *
1491*81ad6265SDimitry Andric R600MachineCFGStructurizer::cloneBlockForPredecessor(MachineBasicBlock *MBB,
1492*81ad6265SDimitry Andric     MachineBasicBlock *PredMBB) {
1493*81ad6265SDimitry Andric   assert(PredMBB->isSuccessor(MBB) && "succBlk is not a predecessor of curBlk");
1494*81ad6265SDimitry Andric 
1495*81ad6265SDimitry Andric   MachineBasicBlock *CloneMBB = clone(MBB);  //clone instructions
1496*81ad6265SDimitry Andric   replaceInstrUseOfBlockWith(PredMBB, MBB, CloneMBB);
1497*81ad6265SDimitry Andric   //srcBlk, oldBlk, newBlk
1498*81ad6265SDimitry Andric 
1499*81ad6265SDimitry Andric   PredMBB->replaceSuccessor(MBB, CloneMBB);
1500*81ad6265SDimitry Andric 
1501*81ad6265SDimitry Andric   // add all successor to cloneBlk
1502*81ad6265SDimitry Andric   cloneSuccessorList(CloneMBB, MBB);
1503*81ad6265SDimitry Andric 
1504*81ad6265SDimitry Andric   numClonedInstr += MBB->size();
1505*81ad6265SDimitry Andric 
1506*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "Cloned block: "
1507*81ad6265SDimitry Andric                     << "BB" << MBB->getNumber() << "size " << MBB->size()
1508*81ad6265SDimitry Andric                     << "\n";);
1509*81ad6265SDimitry Andric 
1510*81ad6265SDimitry Andric   SHOWNEWBLK(CloneMBB, "result of Cloned block: ");
1511*81ad6265SDimitry Andric 
1512*81ad6265SDimitry Andric   return CloneMBB;
1513*81ad6265SDimitry Andric }
1514*81ad6265SDimitry Andric 
1515*81ad6265SDimitry Andric void R600MachineCFGStructurizer::migrateInstruction(MachineBasicBlock *SrcMBB,
1516*81ad6265SDimitry Andric     MachineBasicBlock *DstMBB, MachineBasicBlock::iterator I) {
1517*81ad6265SDimitry Andric   MachineBasicBlock::iterator SpliceEnd;
1518*81ad6265SDimitry Andric   //look for the input branchinstr, not the AMDGPU branchinstr
1519*81ad6265SDimitry Andric   MachineInstr *BranchMI = getNormalBlockBranchInstr(SrcMBB);
1520*81ad6265SDimitry Andric   if (!BranchMI) {
1521*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << "migrateInstruction don't see branch instr\n";);
1522*81ad6265SDimitry Andric     SpliceEnd = SrcMBB->end();
1523*81ad6265SDimitry Andric   } else {
1524*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << "migrateInstruction see branch instr: " << *BranchMI);
1525*81ad6265SDimitry Andric     SpliceEnd = BranchMI;
1526*81ad6265SDimitry Andric   }
1527*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "migrateInstruction before splice dstSize = "
1528*81ad6265SDimitry Andric                     << DstMBB->size() << "srcSize = " << SrcMBB->size()
1529*81ad6265SDimitry Andric                     << "\n";);
1530*81ad6265SDimitry Andric 
1531*81ad6265SDimitry Andric   //splice insert before insertPos
1532*81ad6265SDimitry Andric   DstMBB->splice(I, SrcMBB, SrcMBB->begin(), SpliceEnd);
1533*81ad6265SDimitry Andric 
1534*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "migrateInstruction after splice dstSize = "
1535*81ad6265SDimitry Andric                     << DstMBB->size() << "srcSize = " << SrcMBB->size()
1536*81ad6265SDimitry Andric                     << '\n';);
1537*81ad6265SDimitry Andric }
1538*81ad6265SDimitry Andric 
1539*81ad6265SDimitry Andric MachineBasicBlock *
1540*81ad6265SDimitry Andric R600MachineCFGStructurizer::normalizeInfiniteLoopExit(MachineLoop* LoopRep) {
1541*81ad6265SDimitry Andric   MachineBasicBlock *LoopHeader = LoopRep->getHeader();
1542*81ad6265SDimitry Andric   MachineBasicBlock *LoopLatch = LoopRep->getLoopLatch();
1543*81ad6265SDimitry Andric 
1544*81ad6265SDimitry Andric   if (!LoopHeader || !LoopLatch)
1545*81ad6265SDimitry Andric     return nullptr;
1546*81ad6265SDimitry Andric   MachineInstr *BranchMI = getLoopendBlockBranchInstr(LoopLatch);
1547*81ad6265SDimitry Andric   // Is LoopRep an infinite loop ?
1548*81ad6265SDimitry Andric   if (!BranchMI || !isUncondBranch(BranchMI))
1549*81ad6265SDimitry Andric     return nullptr;
1550*81ad6265SDimitry Andric 
1551*81ad6265SDimitry Andric   MachineBasicBlock *DummyExitBlk = FuncRep->CreateMachineBasicBlock();
1552*81ad6265SDimitry Andric   FuncRep->push_back(DummyExitBlk);  //insert to function
1553*81ad6265SDimitry Andric   SHOWNEWBLK(DummyExitBlk, "DummyExitBlock to normalize infiniteLoop: ");
1554*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "Old branch instr: " << *BranchMI << "\n";);
1555*81ad6265SDimitry Andric   LLVMContext &Ctx = LoopHeader->getParent()->getFunction().getContext();
1556*81ad6265SDimitry Andric   Ctx.emitError("Extra register needed to handle CFG");
1557*81ad6265SDimitry Andric   return nullptr;
1558*81ad6265SDimitry Andric }
1559*81ad6265SDimitry Andric 
1560*81ad6265SDimitry Andric void R600MachineCFGStructurizer::removeUnconditionalBranch(MachineBasicBlock *MBB) {
1561*81ad6265SDimitry Andric   MachineInstr *BranchMI;
1562*81ad6265SDimitry Andric 
1563*81ad6265SDimitry Andric   // I saw two unconditional branch in one basic block in example
1564*81ad6265SDimitry Andric   // test_fc_do_while_or.c need to fix the upstream on this to remove the loop.
1565*81ad6265SDimitry Andric   while ((BranchMI = getLoopendBlockBranchInstr(MBB))
1566*81ad6265SDimitry Andric           && isUncondBranch(BranchMI)) {
1567*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << "Removing uncond branch instr: " << *BranchMI);
1568*81ad6265SDimitry Andric     BranchMI->eraseFromParent();
1569*81ad6265SDimitry Andric   }
1570*81ad6265SDimitry Andric }
1571*81ad6265SDimitry Andric 
1572*81ad6265SDimitry Andric void R600MachineCFGStructurizer::removeRedundantConditionalBranch(
1573*81ad6265SDimitry Andric     MachineBasicBlock *MBB) {
1574*81ad6265SDimitry Andric   if (MBB->succ_size() != 2)
1575*81ad6265SDimitry Andric     return;
1576*81ad6265SDimitry Andric   MachineBasicBlock *MBB1 = *MBB->succ_begin();
1577*81ad6265SDimitry Andric   MachineBasicBlock *MBB2 = *std::next(MBB->succ_begin());
1578*81ad6265SDimitry Andric   if (MBB1 != MBB2)
1579*81ad6265SDimitry Andric     return;
1580*81ad6265SDimitry Andric 
1581*81ad6265SDimitry Andric   MachineInstr *BranchMI = getNormalBlockBranchInstr(MBB);
1582*81ad6265SDimitry Andric   assert(BranchMI && isCondBranch(BranchMI));
1583*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "Removing unneeded cond branch instr: " << *BranchMI);
1584*81ad6265SDimitry Andric   BranchMI->eraseFromParent();
1585*81ad6265SDimitry Andric   SHOWNEWBLK(MBB1, "Removing redundant successor");
1586*81ad6265SDimitry Andric   MBB->removeSuccessor(MBB1, true);
1587*81ad6265SDimitry Andric }
1588*81ad6265SDimitry Andric 
1589*81ad6265SDimitry Andric void R600MachineCFGStructurizer::addDummyExitBlock(
1590*81ad6265SDimitry Andric     SmallVectorImpl<MachineBasicBlock*> &RetMBB) {
1591*81ad6265SDimitry Andric   MachineBasicBlock *DummyExitBlk = FuncRep->CreateMachineBasicBlock();
1592*81ad6265SDimitry Andric   FuncRep->push_back(DummyExitBlk);  //insert to function
1593*81ad6265SDimitry Andric   insertInstrEnd(DummyExitBlk, R600::RETURN);
1594*81ad6265SDimitry Andric 
1595*81ad6265SDimitry Andric   for (MachineBasicBlock *MBB : RetMBB) {
1596*81ad6265SDimitry Andric     if (MachineInstr *MI = getReturnInstr(MBB))
1597*81ad6265SDimitry Andric       MI->eraseFromParent();
1598*81ad6265SDimitry Andric     MBB->addSuccessor(DummyExitBlk);
1599*81ad6265SDimitry Andric     LLVM_DEBUG(dbgs() << "Add dummyExitBlock to BB" << MBB->getNumber()
1600*81ad6265SDimitry Andric                       << " successors\n";);
1601*81ad6265SDimitry Andric   }
1602*81ad6265SDimitry Andric   SHOWNEWBLK(DummyExitBlk, "DummyExitBlock: ");
1603*81ad6265SDimitry Andric }
1604*81ad6265SDimitry Andric 
1605*81ad6265SDimitry Andric void R600MachineCFGStructurizer::removeSuccessor(MachineBasicBlock *MBB) {
1606*81ad6265SDimitry Andric   while (MBB->succ_size())
1607*81ad6265SDimitry Andric     MBB->removeSuccessor(*MBB->succ_begin());
1608*81ad6265SDimitry Andric }
1609*81ad6265SDimitry Andric 
1610*81ad6265SDimitry Andric void R600MachineCFGStructurizer::recordSccnum(MachineBasicBlock *MBB,
1611*81ad6265SDimitry Andric     int SccNum) {
1612*81ad6265SDimitry Andric   BlockInformation *&srcBlkInfo = BlockInfoMap[MBB];
1613*81ad6265SDimitry Andric   if (!srcBlkInfo)
1614*81ad6265SDimitry Andric     srcBlkInfo = new BlockInformation();
1615*81ad6265SDimitry Andric   srcBlkInfo->SccNum = SccNum;
1616*81ad6265SDimitry Andric }
1617*81ad6265SDimitry Andric 
1618*81ad6265SDimitry Andric void R600MachineCFGStructurizer::retireBlock(MachineBasicBlock *MBB) {
1619*81ad6265SDimitry Andric   LLVM_DEBUG(dbgs() << "Retiring BB" << MBB->getNumber() << "\n";);
1620*81ad6265SDimitry Andric 
1621*81ad6265SDimitry Andric   BlockInformation *&SrcBlkInfo = BlockInfoMap[MBB];
1622*81ad6265SDimitry Andric 
1623*81ad6265SDimitry Andric   if (!SrcBlkInfo)
1624*81ad6265SDimitry Andric     SrcBlkInfo = new BlockInformation();
1625*81ad6265SDimitry Andric 
1626*81ad6265SDimitry Andric   SrcBlkInfo->IsRetired = true;
1627*81ad6265SDimitry Andric   assert(MBB->succ_empty() && MBB->pred_empty() && "can't retire block yet");
1628*81ad6265SDimitry Andric }
1629*81ad6265SDimitry Andric 
1630*81ad6265SDimitry Andric INITIALIZE_PASS_BEGIN(R600MachineCFGStructurizer, "amdgpustructurizer",
1631*81ad6265SDimitry Andric                       "AMDGPU CFG Structurizer", false, false)
1632*81ad6265SDimitry Andric INITIALIZE_PASS_DEPENDENCY(MachineDominatorTree)
1633*81ad6265SDimitry Andric INITIALIZE_PASS_DEPENDENCY(MachinePostDominatorTree)
1634*81ad6265SDimitry Andric INITIALIZE_PASS_DEPENDENCY(MachineLoopInfo)
1635*81ad6265SDimitry Andric INITIALIZE_PASS_END(R600MachineCFGStructurizer, "amdgpustructurizer",
1636*81ad6265SDimitry Andric                       "AMDGPU CFG Structurizer", false, false)
1637*81ad6265SDimitry Andric 
1638*81ad6265SDimitry Andric FunctionPass *llvm::createR600MachineCFGStructurizerPass() {
1639*81ad6265SDimitry Andric   return new R600MachineCFGStructurizer();
1640*81ad6265SDimitry Andric }
1641