xref: /llvm-project/llvm/lib/Transforms/Scalar/GVNHoist.cpp (revision 9cf05464aa4487ed420940a45973ea20b3c9611b)
1 //===- GVNHoist.cpp - Hoist scalar and load expressions -------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This pass hoists expressions from branches to a common dominator. It uses
11 // GVN (global value numbering) to discover expressions computing the same
12 // values. The primary goal is to reduce the code size, and in some
13 // cases reduce critical path (by exposing more ILP).
14 // Hoisting may affect the performance in some cases. To mitigate that, hoisting
15 // is disabled in the following cases.
16 // 1. Scalars across calls.
17 // 2. geps when corresponding load/store cannot be hoisted.
18 //===----------------------------------------------------------------------===//
19 
20 #include "llvm/ADT/DenseMap.h"
21 #include "llvm/ADT/SmallPtrSet.h"
22 #include "llvm/ADT/Statistic.h"
23 #include "llvm/Analysis/ValueTracking.h"
24 #include "llvm/Transforms/Scalar.h"
25 #include "llvm/Transforms/Scalar/GVN.h"
26 #include "llvm/Transforms/Utils/Local.h"
27 #include "llvm/Transforms/Utils/MemorySSA.h"
28 
29 using namespace llvm;
30 
31 #define DEBUG_TYPE "gvn-hoist"
32 
33 STATISTIC(NumHoisted, "Number of instructions hoisted");
34 STATISTIC(NumRemoved, "Number of instructions removed");
35 STATISTIC(NumLoadsHoisted, "Number of loads hoisted");
36 STATISTIC(NumLoadsRemoved, "Number of loads removed");
37 STATISTIC(NumStoresHoisted, "Number of stores hoisted");
38 STATISTIC(NumStoresRemoved, "Number of stores removed");
39 STATISTIC(NumCallsHoisted, "Number of calls hoisted");
40 STATISTIC(NumCallsRemoved, "Number of calls removed");
41 
42 static cl::opt<int>
43     MaxHoistedThreshold("gvn-max-hoisted", cl::Hidden, cl::init(-1),
44                         cl::desc("Max number of instructions to hoist "
45                                  "(default unlimited = -1)"));
46 static cl::opt<int> MaxNumberOfBBSInPath(
47     "gvn-hoist-max-bbs", cl::Hidden, cl::init(4),
48     cl::desc("Max number of basic blocks on the path between "
49              "hoisting locations (default = 4, unlimited = -1)"));
50 
51 static cl::opt<int> MaxDepthInBB(
52     "gvn-hoist-max-depth", cl::Hidden, cl::init(100),
53     cl::desc("Hoist instructions from the beginning of the BB up to the "
54              "maximum specified depth (default = 100, unlimited = -1)"));
55 
56 namespace {
57 
58 // Provides a sorting function based on the execution order of two instructions.
59 struct SortByDFSIn {
60 private:
61   DenseMap<const Value *, unsigned> &DFSNumber;
62 
63 public:
64   SortByDFSIn(DenseMap<const Value *, unsigned> &D) : DFSNumber(D) {}
65 
66   // Returns true when A executes before B.
67   bool operator()(const Instruction *A, const Instruction *B) const {
68     // FIXME: libc++ has a std::sort() algorithm that will call the compare
69     // function on the same element.  Once PR20837 is fixed and some more years
70     // pass by and all the buildbots have moved to a corrected std::sort(),
71     // enable the following assert:
72     //
73     // assert(A != B);
74 
75     unsigned ADFS = DFSNumber.lookup(A);
76     unsigned BDFS = DFSNumber.lookup(B);
77     assert (ADFS && BDFS);
78     return ADFS < BDFS;
79   }
80 };
81 
82 // A map from a pair of VNs to all the instructions with those VNs.
83 typedef DenseMap<std::pair<unsigned, unsigned>, SmallVector<Instruction *, 4>>
84     VNtoInsns;
85 // An invalid value number Used when inserting a single value number into
86 // VNtoInsns.
87 enum : unsigned { InvalidVN = ~2U };
88 
89 // Records all scalar instructions candidate for code hoisting.
90 class InsnInfo {
91   VNtoInsns VNtoScalars;
92 
93 public:
94   // Inserts I and its value number in VNtoScalars.
95   void insert(Instruction *I, GVN::ValueTable &VN) {
96     // Scalar instruction.
97     unsigned V = VN.lookupOrAdd(I);
98     VNtoScalars[{V, InvalidVN}].push_back(I);
99   }
100 
101   const VNtoInsns &getVNTable() const { return VNtoScalars; }
102 };
103 
104 // Records all load instructions candidate for code hoisting.
105 class LoadInfo {
106   VNtoInsns VNtoLoads;
107 
108 public:
109   // Insert Load and the value number of its memory address in VNtoLoads.
110   void insert(LoadInst *Load, GVN::ValueTable &VN) {
111     if (Load->isSimple()) {
112       unsigned V = VN.lookupOrAdd(Load->getPointerOperand());
113       VNtoLoads[{V, InvalidVN}].push_back(Load);
114     }
115   }
116 
117   const VNtoInsns &getVNTable() const { return VNtoLoads; }
118 };
119 
120 // Records all store instructions candidate for code hoisting.
121 class StoreInfo {
122   VNtoInsns VNtoStores;
123 
124 public:
125   // Insert the Store and a hash number of the store address and the stored
126   // value in VNtoStores.
127   void insert(StoreInst *Store, GVN::ValueTable &VN) {
128     if (!Store->isSimple())
129       return;
130     // Hash the store address and the stored value.
131     Value *Ptr = Store->getPointerOperand();
132     Value *Val = Store->getValueOperand();
133     VNtoStores[{VN.lookupOrAdd(Ptr), VN.lookupOrAdd(Val)}].push_back(Store);
134   }
135 
136   const VNtoInsns &getVNTable() const { return VNtoStores; }
137 };
138 
139 // Records all call instructions candidate for code hoisting.
140 class CallInfo {
141   VNtoInsns VNtoCallsScalars;
142   VNtoInsns VNtoCallsLoads;
143   VNtoInsns VNtoCallsStores;
144 
145 public:
146   // Insert Call and its value numbering in one of the VNtoCalls* containers.
147   void insert(CallInst *Call, GVN::ValueTable &VN) {
148     // A call that doesNotAccessMemory is handled as a Scalar,
149     // onlyReadsMemory will be handled as a Load instruction,
150     // all other calls will be handled as stores.
151     unsigned V = VN.lookupOrAdd(Call);
152     auto Entry = std::make_pair(V, InvalidVN);
153 
154     if (Call->doesNotAccessMemory())
155       VNtoCallsScalars[Entry].push_back(Call);
156     else if (Call->onlyReadsMemory())
157       VNtoCallsLoads[Entry].push_back(Call);
158     else
159       VNtoCallsStores[Entry].push_back(Call);
160   }
161 
162   const VNtoInsns &getScalarVNTable() const { return VNtoCallsScalars; }
163 
164   const VNtoInsns &getLoadVNTable() const { return VNtoCallsLoads; }
165 
166   const VNtoInsns &getStoreVNTable() const { return VNtoCallsStores; }
167 };
168 
169 typedef DenseMap<const BasicBlock *, bool> BBSideEffectsSet;
170 typedef SmallVector<Instruction *, 4> SmallVecInsn;
171 typedef SmallVectorImpl<Instruction *> SmallVecImplInsn;
172 
173 static void combineKnownMetadata(Instruction *ReplInst, Instruction *I) {
174   static const unsigned KnownIDs[] = {
175       LLVMContext::MD_tbaa,           LLVMContext::MD_alias_scope,
176       LLVMContext::MD_noalias,        LLVMContext::MD_range,
177       LLVMContext::MD_fpmath,         LLVMContext::MD_invariant_load,
178       LLVMContext::MD_invariant_group};
179   combineMetadata(ReplInst, I, KnownIDs);
180 }
181 
182 // This pass hoists common computations across branches sharing common
183 // dominator. The primary goal is to reduce the code size, and in some
184 // cases reduce critical path (by exposing more ILP).
185 class GVNHoist {
186 public:
187   GVNHoist(DominatorTree *Dt, AliasAnalysis *Aa, MemoryDependenceResults *Md,
188            bool OptForMinSize)
189       : DT(Dt), AA(Aa), MD(Md), OptForMinSize(OptForMinSize),
190         HoistingGeps(OptForMinSize), HoistedCtr(0) {}
191   bool run(Function &F) {
192     VN.setDomTree(DT);
193     VN.setAliasAnalysis(AA);
194     VN.setMemDep(MD);
195     bool Res = false;
196 
197     // FIXME: use lazy evaluation of VN to avoid the fix-point computation.
198     while (1) {
199       // FIXME: only compute MemorySSA once. We need to update the analysis in
200       // the same time as transforming the code.
201       MemorySSA M(F, AA, DT);
202       MSSA = &M;
203 
204       // Perform DFS Numbering of instructions.
205       unsigned I = 0;
206       for (const BasicBlock *BB : depth_first(&F.getEntryBlock()))
207         for (auto &Inst: *BB)
208           DFSNumber.insert({&Inst, ++I});
209 
210       auto HoistStat = hoistExpressions(F);
211       if (HoistStat.first + HoistStat.second == 0) {
212         return Res;
213       }
214       if (HoistStat.second > 0) {
215         // To address a limitation of the current GVN, we need to rerun the
216         // hoisting after we hoisted loads in order to be able to hoist all
217         // scalars dependent on the hoisted loads. Same for stores.
218         VN.clear();
219       }
220       Res = true;
221 
222       // DFS numbers change when instructions are hoisted: clear and recompute.
223       DFSNumber.clear();
224     }
225 
226     return Res;
227   }
228 private:
229   GVN::ValueTable VN;
230   DominatorTree *DT;
231   AliasAnalysis *AA;
232   MemoryDependenceResults *MD;
233   const bool OptForMinSize;
234   const bool HoistingGeps;
235   DenseMap<const Value *, unsigned> DFSNumber;
236   BBSideEffectsSet BBSideEffects;
237   MemorySSA *MSSA;
238   int HoistedCtr;
239 
240   enum InsKind { Unknown, Scalar, Load, Store };
241 
242   // Return true when there are exception handling in BB.
243   bool hasEH(const BasicBlock *BB) {
244     auto It = BBSideEffects.find(BB);
245     if (It != BBSideEffects.end())
246       return It->second;
247 
248     if (BB->isEHPad() || BB->hasAddressTaken()) {
249       BBSideEffects[BB] = true;
250       return true;
251     }
252 
253     if (BB->getTerminator()->mayThrow()) {
254       BBSideEffects[BB] = true;
255       return true;
256     }
257 
258     BBSideEffects[BB] = false;
259     return false;
260   }
261 
262   // Return true when all paths from A to the end of the function pass through
263   // either B or C.
264   bool hoistingFromAllPaths(const BasicBlock *A, const BasicBlock *B,
265                             const BasicBlock *C) {
266     // We fully copy the WL in order to be able to remove items from it.
267     SmallPtrSet<const BasicBlock *, 2> WL;
268     WL.insert(B);
269     WL.insert(C);
270 
271     for (auto It = df_begin(A), E = df_end(A); It != E;) {
272       // There exists a path from A to the exit of the function if we are still
273       // iterating in DF traversal and we removed all instructions from the work
274       // list.
275       if (WL.empty())
276         return false;
277 
278       const BasicBlock *BB = *It;
279       if (WL.erase(BB)) {
280         // Stop DFS traversal when BB is in the work list.
281         It.skipChildren();
282         continue;
283       }
284 
285       // Check for end of function, calls that do not return, etc.
286       if (!isGuaranteedToTransferExecutionToSuccessor(BB->getTerminator()))
287         return false;
288 
289       // Increment DFS traversal when not skipping children.
290       ++It;
291     }
292 
293     return true;
294   }
295 
296   /* Return true when I1 appears before I2 in the instructions of BB.  */
297   bool firstInBB(const Instruction *I1, const Instruction *I2) {
298     assert (I1->getParent() == I2->getParent());
299     unsigned I1DFS = DFSNumber.lookup(I1);
300     unsigned I2DFS = DFSNumber.lookup(I2);
301     assert (I1DFS && I2DFS);
302     return I1DFS < I2DFS;
303   }
304 
305   // Return true when there are users of Def in BB.
306   bool hasMemoryUseOnPath(MemoryAccess *Def, const BasicBlock *BB,
307                           const Instruction *OldPt) {
308     const BasicBlock *DefBB = Def->getBlock();
309     const BasicBlock *OldBB = OldPt->getParent();
310 
311     for (User *U : Def->users())
312       if (auto *MU = dyn_cast<MemoryUse>(U)) {
313         BasicBlock *UBB = MU->getBlock();
314         // Only analyze uses in BB.
315         if (BB != UBB)
316           continue;
317 
318         // A use in the same block as the Def is on the path.
319         if (UBB == DefBB) {
320           assert(MSSA->locallyDominates(Def, MU) && "def not dominating use");
321           return true;
322         }
323 
324         if (UBB != OldBB)
325           return true;
326 
327         // It is only harmful to hoist when the use is before OldPt.
328         if (firstInBB(MU->getMemoryInst(), OldPt))
329           return true;
330       }
331 
332     return false;
333   }
334 
335   // Return true when there are exception handling or loads of memory Def
336   // between OldPt and NewPt.
337 
338   // Decrement by 1 NBBsOnAllPaths for each block between HoistPt and BB, and
339   // return true when the counter NBBsOnAllPaths reaces 0, except when it is
340   // initialized to -1 which is unlimited.
341   bool hasEHOrLoadsOnPath(const Instruction *NewPt, const Instruction *OldPt,
342                           MemoryAccess *Def, int &NBBsOnAllPaths) {
343     const BasicBlock *NewBB = NewPt->getParent();
344     const BasicBlock *OldBB = OldPt->getParent();
345     assert(DT->dominates(NewBB, OldBB) && "invalid path");
346     assert(DT->dominates(Def->getBlock(), NewBB) &&
347            "def does not dominate new hoisting point");
348 
349     // Walk all basic blocks reachable in depth-first iteration on the inverse
350     // CFG from OldBB to NewBB. These blocks are all the blocks that may be
351     // executed between the execution of NewBB and OldBB. Hoisting an expression
352     // from OldBB into NewBB has to be safe on all execution paths.
353     for (auto I = idf_begin(OldBB), E = idf_end(OldBB); I != E;) {
354       if (*I == NewBB) {
355         // Stop traversal when reaching HoistPt.
356         I.skipChildren();
357         continue;
358       }
359 
360       // Impossible to hoist with exceptions on the path.
361       if (hasEH(*I))
362         return true;
363 
364       // Check that we do not move a store past loads.
365       if (hasMemoryUseOnPath(Def, *I, OldPt))
366         return true;
367 
368       // Stop walk once the limit is reached.
369       if (NBBsOnAllPaths == 0)
370         return true;
371 
372       // -1 is unlimited number of blocks on all paths.
373       if (NBBsOnAllPaths != -1)
374         --NBBsOnAllPaths;
375 
376       ++I;
377     }
378 
379     return false;
380   }
381 
382   // Return true when there are exception handling between HoistPt and BB.
383   // Decrement by 1 NBBsOnAllPaths for each block between HoistPt and BB, and
384   // return true when the counter NBBsOnAllPaths reaches 0, except when it is
385   // initialized to -1 which is unlimited.
386   bool hasEHOnPath(const BasicBlock *HoistPt, const BasicBlock *BB,
387                    int &NBBsOnAllPaths) {
388     assert(DT->dominates(HoistPt, BB) && "Invalid path");
389 
390     // Walk all basic blocks reachable in depth-first iteration on
391     // the inverse CFG from BBInsn to NewHoistPt. These blocks are all the
392     // blocks that may be executed between the execution of NewHoistPt and
393     // BBInsn. Hoisting an expression from BBInsn into NewHoistPt has to be safe
394     // on all execution paths.
395     for (auto I = idf_begin(BB), E = idf_end(BB); I != E;) {
396       if (*I == HoistPt) {
397         // Stop traversal when reaching NewHoistPt.
398         I.skipChildren();
399         continue;
400       }
401 
402       // Impossible to hoist with exceptions on the path.
403       if (hasEH(*I))
404         return true;
405 
406       // Stop walk once the limit is reached.
407       if (NBBsOnAllPaths == 0)
408         return true;
409 
410       // -1 is unlimited number of blocks on all paths.
411       if (NBBsOnAllPaths != -1)
412         --NBBsOnAllPaths;
413 
414       ++I;
415     }
416 
417     return false;
418   }
419 
420   // Return true when it is safe to hoist a memory load or store U from OldPt
421   // to NewPt.
422   bool safeToHoistLdSt(const Instruction *NewPt, const Instruction *OldPt,
423                        MemoryUseOrDef *U, InsKind K, int &NBBsOnAllPaths) {
424 
425     // In place hoisting is safe.
426     if (NewPt == OldPt)
427       return true;
428 
429     const BasicBlock *NewBB = NewPt->getParent();
430     const BasicBlock *OldBB = OldPt->getParent();
431     const BasicBlock *UBB = U->getBlock();
432 
433     // Check for dependences on the Memory SSA.
434     MemoryAccess *D = U->getDefiningAccess();
435     BasicBlock *DBB = D->getBlock();
436     if (DT->properlyDominates(NewBB, DBB))
437       // Cannot move the load or store to NewBB above its definition in DBB.
438       return false;
439 
440     if (NewBB == DBB && !MSSA->isLiveOnEntryDef(D))
441       if (auto *UD = dyn_cast<MemoryUseOrDef>(D))
442         if (firstInBB(NewPt, UD->getMemoryInst()))
443           // Cannot move the load or store to NewPt above its definition in D.
444           return false;
445 
446     // Check for unsafe hoistings due to side effects.
447     if (K == InsKind::Store) {
448       if (hasEHOrLoadsOnPath(NewPt, OldPt, D, NBBsOnAllPaths))
449         return false;
450     } else if (hasEHOnPath(NewBB, OldBB, NBBsOnAllPaths))
451       return false;
452 
453     if (UBB == NewBB) {
454       if (DT->properlyDominates(DBB, NewBB))
455         return true;
456       assert(UBB == DBB);
457       assert(MSSA->locallyDominates(D, U));
458     }
459 
460     // No side effects: it is safe to hoist.
461     return true;
462   }
463 
464   // Return true when it is safe to hoist scalar instructions from BB1 and BB2
465   // to HoistBB.
466   bool safeToHoistScalar(const BasicBlock *HoistBB, const BasicBlock *BB1,
467                          const BasicBlock *BB2, int &NBBsOnAllPaths) {
468     // Check that the hoisted expression is needed on all paths.  When HoistBB
469     // already contains an instruction to be hoisted, the expression is needed
470     // on all paths.  Enable scalar hoisting at -Oz as it is safe to hoist
471     // scalars to a place where they are partially needed.
472     if (!OptForMinSize && BB1 != HoistBB &&
473         !hoistingFromAllPaths(HoistBB, BB1, BB2))
474       return false;
475 
476     if (hasEHOnPath(HoistBB, BB1, NBBsOnAllPaths) ||
477         hasEHOnPath(HoistBB, BB2, NBBsOnAllPaths))
478       return false;
479 
480     // Safe to hoist scalars from BB1 and BB2 to HoistBB.
481     return true;
482   }
483 
484   // Each element of a hoisting list contains the basic block where to hoist and
485   // a list of instructions to be hoisted.
486   typedef std::pair<BasicBlock *, SmallVecInsn> HoistingPointInfo;
487   typedef SmallVector<HoistingPointInfo, 4> HoistingPointList;
488 
489   // Partition InstructionsToHoist into a set of candidates which can share a
490   // common hoisting point. The partitions are collected in HPL. IsScalar is
491   // true when the instructions in InstructionsToHoist are scalars. IsLoad is
492   // true when the InstructionsToHoist are loads, false when they are stores.
493   void partitionCandidates(SmallVecImplInsn &InstructionsToHoist,
494                            HoistingPointList &HPL, InsKind K) {
495     // No need to sort for two instructions.
496     if (InstructionsToHoist.size() > 2) {
497       SortByDFSIn Pred(DFSNumber);
498       std::sort(InstructionsToHoist.begin(), InstructionsToHoist.end(), Pred);
499     }
500 
501     int NBBsOnAllPaths = MaxNumberOfBBSInPath;
502 
503     SmallVecImplInsn::iterator II = InstructionsToHoist.begin();
504     SmallVecImplInsn::iterator Start = II;
505     Instruction *HoistPt = *II;
506     BasicBlock *HoistBB = HoistPt->getParent();
507     MemoryUseOrDef *UD;
508     if (K != InsKind::Scalar)
509       UD = cast<MemoryUseOrDef>(MSSA->getMemoryAccess(HoistPt));
510 
511     for (++II; II != InstructionsToHoist.end(); ++II) {
512       Instruction *Insn = *II;
513       BasicBlock *BB = Insn->getParent();
514       BasicBlock *NewHoistBB;
515       Instruction *NewHoistPt;
516 
517       if (BB == HoistBB) {
518         NewHoistBB = HoistBB;
519         NewHoistPt = firstInBB(Insn, HoistPt) ? Insn : HoistPt;
520       } else {
521         NewHoistBB = DT->findNearestCommonDominator(HoistBB, BB);
522         if (NewHoistBB == BB)
523           NewHoistPt = Insn;
524         else if (NewHoistBB == HoistBB)
525           NewHoistPt = HoistPt;
526         else
527           NewHoistPt = NewHoistBB->getTerminator();
528       }
529 
530       if (K == InsKind::Scalar) {
531         if (safeToHoistScalar(NewHoistBB, HoistBB, BB, NBBsOnAllPaths)) {
532           // Extend HoistPt to NewHoistPt.
533           HoistPt = NewHoistPt;
534           HoistBB = NewHoistBB;
535           continue;
536         }
537       } else {
538         // When NewBB already contains an instruction to be hoisted, the
539         // expression is needed on all paths.
540         // Check that the hoisted expression is needed on all paths: it is
541         // unsafe to hoist loads to a place where there may be a path not
542         // loading from the same address: for instance there may be a branch on
543         // which the address of the load may not be initialized.
544         if ((HoistBB == NewHoistBB || BB == NewHoistBB ||
545              hoistingFromAllPaths(NewHoistBB, HoistBB, BB)) &&
546             // Also check that it is safe to move the load or store from HoistPt
547             // to NewHoistPt, and from Insn to NewHoistPt.
548             safeToHoistLdSt(NewHoistPt, HoistPt, UD, K, NBBsOnAllPaths) &&
549             safeToHoistLdSt(NewHoistPt, Insn,
550                             cast<MemoryUseOrDef>(MSSA->getMemoryAccess(Insn)),
551                             K, NBBsOnAllPaths)) {
552           // Extend HoistPt to NewHoistPt.
553           HoistPt = NewHoistPt;
554           HoistBB = NewHoistBB;
555           continue;
556         }
557       }
558 
559       // At this point it is not safe to extend the current hoisting to
560       // NewHoistPt: save the hoisting list so far.
561       if (std::distance(Start, II) > 1)
562         HPL.push_back({HoistBB, SmallVecInsn(Start, II)});
563 
564       // Start over from BB.
565       Start = II;
566       if (K != InsKind::Scalar)
567         UD = cast<MemoryUseOrDef>(MSSA->getMemoryAccess(*Start));
568       HoistPt = Insn;
569       HoistBB = BB;
570       NBBsOnAllPaths = MaxNumberOfBBSInPath;
571     }
572 
573     // Save the last partition.
574     if (std::distance(Start, II) > 1)
575       HPL.push_back({HoistBB, SmallVecInsn(Start, II)});
576   }
577 
578   // Initialize HPL from Map.
579   void computeInsertionPoints(const VNtoInsns &Map, HoistingPointList &HPL,
580                               InsKind K) {
581     for (const auto &Entry : Map) {
582       if (MaxHoistedThreshold != -1 && ++HoistedCtr > MaxHoistedThreshold)
583         return;
584 
585       const SmallVecInsn &V = Entry.second;
586       if (V.size() < 2)
587         continue;
588 
589       // Compute the insertion point and the list of expressions to be hoisted.
590       SmallVecInsn InstructionsToHoist;
591       for (auto I : V)
592         if (!hasEH(I->getParent()))
593           InstructionsToHoist.push_back(I);
594 
595       if (!InstructionsToHoist.empty())
596         partitionCandidates(InstructionsToHoist, HPL, K);
597     }
598   }
599 
600   // Return true when all operands of Instr are available at insertion point
601   // HoistPt. When limiting the number of hoisted expressions, one could hoist
602   // a load without hoisting its access function. So before hoisting any
603   // expression, make sure that all its operands are available at insert point.
604   bool allOperandsAvailable(const Instruction *I,
605                             const BasicBlock *HoistPt) const {
606     for (const Use &Op : I->operands())
607       if (const auto *Inst = dyn_cast<Instruction>(&Op))
608         if (!DT->dominates(Inst->getParent(), HoistPt))
609           return false;
610 
611     return true;
612   }
613 
614   // Same as allOperandsAvailable with recursive check for GEP operands.
615   bool allGepOperandsAvailable(const Instruction *I,
616                                const BasicBlock *HoistPt) const {
617     for (const Use &Op : I->operands())
618       if (const auto *Inst = dyn_cast<Instruction>(&Op))
619         if (!DT->dominates(Inst->getParent(), HoistPt)) {
620           if (const GetElementPtrInst *GepOp = dyn_cast<GetElementPtrInst>(Inst)) {
621             if (!allGepOperandsAvailable(GepOp, HoistPt))
622               return false;
623             // Gep is available if all operands of GepOp are available.
624           } else {
625             // Gep is not available if it has operands other than GEPs that are
626             // defined in blocks not dominating HoistPt.
627             return false;
628           }
629         }
630     return true;
631   }
632 
633   // Make all operands of the GEP available.
634   void makeGepsAvailable(Instruction *Repl, BasicBlock *HoistPt,
635                          const SmallVecInsn &InstructionsToHoist,
636                          Instruction *Gep) const {
637     assert(allGepOperandsAvailable(Gep, HoistPt) && "GEP operands not available");
638 
639     Instruction *ClonedGep = Gep->clone();
640     for (unsigned i = 0, e = Gep->getNumOperands(); i != e; ++i)
641       if (Instruction *Op = dyn_cast<Instruction>(Gep->getOperand(i))) {
642 
643         // Check whether the operand is already available.
644         if (DT->dominates(Op->getParent(), HoistPt))
645           continue;
646 
647         // As a GEP can refer to other GEPs, recursively make all the operands
648         // of this GEP available at HoistPt.
649         if (GetElementPtrInst *GepOp = dyn_cast<GetElementPtrInst>(Op))
650           makeGepsAvailable(ClonedGep, HoistPt, InstructionsToHoist, GepOp);
651       }
652 
653     // Copy Gep and replace its uses in Repl with ClonedGep.
654     ClonedGep->insertBefore(HoistPt->getTerminator());
655 
656     // Conservatively discard any optimization hints, they may differ on the
657     // other paths.
658     ClonedGep->dropUnknownNonDebugMetadata();
659 
660     // If we have optimization hints which agree with each other along different
661     // paths, preserve them.
662     for (const Instruction *OtherInst : InstructionsToHoist) {
663       const GetElementPtrInst *OtherGep;
664       if (auto *OtherLd = dyn_cast<LoadInst>(OtherInst))
665         OtherGep = cast<GetElementPtrInst>(OtherLd->getPointerOperand());
666       else
667         OtherGep = cast<GetElementPtrInst>(
668             cast<StoreInst>(OtherInst)->getPointerOperand());
669       ClonedGep->intersectOptionalDataWith(OtherGep);
670     }
671 
672     // Replace uses of Gep with ClonedGep in Repl.
673     Repl->replaceUsesOfWith(Gep, ClonedGep);
674   }
675 
676   // In the case Repl is a load or a store, we make all their GEPs
677   // available: GEPs are not hoisted by default to avoid the address
678   // computations to be hoisted without the associated load or store.
679   bool makeGepOperandsAvailable(Instruction *Repl, BasicBlock *HoistPt,
680                                 const SmallVecInsn &InstructionsToHoist) const {
681     // Check whether the GEP of a ld/st can be synthesized at HoistPt.
682     GetElementPtrInst *Gep = nullptr;
683     Instruction *Val = nullptr;
684     if (auto *Ld = dyn_cast<LoadInst>(Repl)) {
685       Gep = dyn_cast<GetElementPtrInst>(Ld->getPointerOperand());
686     } else if (auto *St = dyn_cast<StoreInst>(Repl)) {
687       Gep = dyn_cast<GetElementPtrInst>(St->getPointerOperand());
688       Val = dyn_cast<Instruction>(St->getValueOperand());
689       // Check that the stored value is available.
690       if (Val) {
691         if (isa<GetElementPtrInst>(Val)) {
692           // Check whether we can compute the GEP at HoistPt.
693           if (!allGepOperandsAvailable(Val, HoistPt))
694             return false;
695         } else if (!DT->dominates(Val->getParent(), HoistPt))
696           return false;
697       }
698     }
699 
700     // Check whether we can compute the Gep at HoistPt.
701     if (!Gep || !allGepOperandsAvailable(Gep, HoistPt))
702       return false;
703 
704     makeGepsAvailable(Repl, HoistPt, InstructionsToHoist, Gep);
705 
706     if (Val && isa<GetElementPtrInst>(Val))
707       makeGepsAvailable(Repl, HoistPt, InstructionsToHoist, Val);
708 
709     return true;
710   }
711 
712   std::pair<unsigned, unsigned> hoist(HoistingPointList &HPL) {
713     unsigned NI = 0, NL = 0, NS = 0, NC = 0, NR = 0;
714     for (const HoistingPointInfo &HP : HPL) {
715       // Find out whether we already have one of the instructions in HoistPt,
716       // in which case we do not have to move it.
717       BasicBlock *HoistPt = HP.first;
718       const SmallVecInsn &InstructionsToHoist = HP.second;
719       Instruction *Repl = nullptr;
720       for (Instruction *I : InstructionsToHoist)
721         if (I->getParent() == HoistPt)
722           // If there are two instructions in HoistPt to be hoisted in place:
723           // update Repl to be the first one, such that we can rename the uses
724           // of the second based on the first.
725           if (!Repl || firstInBB(I, Repl))
726             Repl = I;
727 
728       if (Repl) {
729         // Repl is already in HoistPt: it remains in place.
730         assert(allOperandsAvailable(Repl, HoistPt) &&
731                "instruction depends on operands that are not available");
732       } else {
733         // When we do not find Repl in HoistPt, select the first in the list
734         // and move it to HoistPt.
735         Repl = InstructionsToHoist.front();
736 
737         // We can move Repl in HoistPt only when all operands are available.
738         // When not HoistingGeps we need to copy the GEPs now.
739         // The order in which hoistings are done may influence the availability
740         // of operands.
741         if (!allOperandsAvailable(Repl, HoistPt) && !HoistingGeps &&
742             !makeGepOperandsAvailable(Repl, HoistPt, InstructionsToHoist))
743           continue;
744 
745         Repl->moveBefore(HoistPt->getTerminator());
746       }
747 
748       if (isa<LoadInst>(Repl))
749         ++NL;
750       else if (isa<StoreInst>(Repl))
751         ++NS;
752       else if (isa<CallInst>(Repl))
753         ++NC;
754       else // Scalar
755         ++NI;
756 
757       // Remove and rename all other instructions.
758       for (Instruction *I : InstructionsToHoist)
759         if (I != Repl) {
760           ++NR;
761           if (auto *ReplacementLoad = dyn_cast<LoadInst>(Repl)) {
762             ReplacementLoad->setAlignment(
763                 std::min(ReplacementLoad->getAlignment(),
764                          cast<LoadInst>(I)->getAlignment()));
765             ++NumLoadsRemoved;
766           } else if (auto *ReplacementStore = dyn_cast<StoreInst>(Repl)) {
767             ReplacementStore->setAlignment(
768                 std::min(ReplacementStore->getAlignment(),
769                          cast<StoreInst>(I)->getAlignment()));
770             ++NumStoresRemoved;
771           } else if (auto *ReplacementAlloca = dyn_cast<AllocaInst>(Repl)) {
772             ReplacementAlloca->setAlignment(
773                 std::max(ReplacementAlloca->getAlignment(),
774                          cast<AllocaInst>(I)->getAlignment()));
775           } else if (isa<CallInst>(Repl)) {
776             ++NumCallsRemoved;
777           }
778           Repl->intersectOptionalDataWith(I);
779           combineKnownMetadata(Repl, I);
780           I->replaceAllUsesWith(Repl);
781           I->eraseFromParent();
782         }
783     }
784 
785     NumHoisted += NL + NS + NC + NI;
786     NumRemoved += NR;
787     NumLoadsHoisted += NL;
788     NumStoresHoisted += NS;
789     NumCallsHoisted += NC;
790     return {NI, NL + NC + NS};
791   }
792 
793   // Hoist all expressions. Returns Number of scalars hoisted
794   // and number of non-scalars hoisted.
795   std::pair<unsigned, unsigned> hoistExpressions(Function &F) {
796     InsnInfo II;
797     LoadInfo LI;
798     StoreInfo SI;
799     CallInfo CI;
800     for (BasicBlock *BB : depth_first(&F.getEntryBlock())) {
801       int InstructionNb = 0;
802       for (Instruction &I1 : *BB) {
803         // Only hoist the first instructions in BB up to MaxDepthInBB. Hoisting
804         // deeper may increase the register pressure and compilation time.
805         if (MaxDepthInBB != -1 && InstructionNb++ >= MaxDepthInBB)
806           break;
807 
808         if (auto *Load = dyn_cast<LoadInst>(&I1))
809           LI.insert(Load, VN);
810         else if (auto *Store = dyn_cast<StoreInst>(&I1))
811           SI.insert(Store, VN);
812         else if (auto *Call = dyn_cast<CallInst>(&I1)) {
813           if (auto *Intr = dyn_cast<IntrinsicInst>(Call)) {
814             if (isa<DbgInfoIntrinsic>(Intr) ||
815                 Intr->getIntrinsicID() == Intrinsic::assume)
816               continue;
817           }
818           if (Call->mayHaveSideEffects()) {
819             if (!OptForMinSize)
820               break;
821             // We may continue hoisting across calls which write to memory.
822             if (Call->mayThrow())
823               break;
824           }
825           CI.insert(Call, VN);
826         } else if (HoistingGeps || !isa<GetElementPtrInst>(&I1))
827           // Do not hoist scalars past calls that may write to memory because
828           // that could result in spills later. geps are handled separately.
829           // TODO: We can relax this for targets like AArch64 as they have more
830           // registers than X86.
831           II.insert(&I1, VN);
832       }
833     }
834 
835     HoistingPointList HPL;
836     computeInsertionPoints(II.getVNTable(), HPL, InsKind::Scalar);
837     computeInsertionPoints(LI.getVNTable(), HPL, InsKind::Load);
838     computeInsertionPoints(SI.getVNTable(), HPL, InsKind::Store);
839     computeInsertionPoints(CI.getScalarVNTable(), HPL, InsKind::Scalar);
840     computeInsertionPoints(CI.getLoadVNTable(), HPL, InsKind::Load);
841     computeInsertionPoints(CI.getStoreVNTable(), HPL, InsKind::Store);
842     return hoist(HPL);
843   }
844 };
845 
846 class GVNHoistLegacyPass : public FunctionPass {
847 public:
848   static char ID;
849 
850   GVNHoistLegacyPass() : FunctionPass(ID) {
851     initializeGVNHoistLegacyPassPass(*PassRegistry::getPassRegistry());
852   }
853 
854   bool runOnFunction(Function &F) override {
855     if (skipFunction(F))
856       return false;
857     auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();
858     auto &AA = getAnalysis<AAResultsWrapperPass>().getAAResults();
859     auto &MD = getAnalysis<MemoryDependenceWrapperPass>().getMemDep();
860 
861     GVNHoist G(&DT, &AA, &MD, F.optForMinSize());
862     return G.run(F);
863   }
864 
865   void getAnalysisUsage(AnalysisUsage &AU) const override {
866     AU.addRequired<DominatorTreeWrapperPass>();
867     AU.addRequired<AAResultsWrapperPass>();
868     AU.addRequired<MemoryDependenceWrapperPass>();
869     AU.addPreserved<DominatorTreeWrapperPass>();
870   }
871 };
872 } // namespace
873 
874 PreservedAnalyses GVNHoistPass::run(Function &F,
875                                     AnalysisManager<Function> &AM) {
876   DominatorTree &DT = AM.getResult<DominatorTreeAnalysis>(F);
877   AliasAnalysis &AA = AM.getResult<AAManager>(F);
878   MemoryDependenceResults &MD = AM.getResult<MemoryDependenceAnalysis>(F);
879 
880   GVNHoist G(&DT, &AA, &MD, F.optForMinSize());
881   if (!G.run(F))
882     return PreservedAnalyses::all();
883 
884   PreservedAnalyses PA;
885   PA.preserve<DominatorTreeAnalysis>();
886   return PA;
887 }
888 
889 char GVNHoistLegacyPass::ID = 0;
890 INITIALIZE_PASS_BEGIN(GVNHoistLegacyPass, "gvn-hoist",
891                       "Early GVN Hoisting of Expressions", false, false)
892 INITIALIZE_PASS_DEPENDENCY(MemoryDependenceWrapperPass)
893 INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
894 INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass)
895 INITIALIZE_PASS_END(GVNHoistLegacyPass, "gvn-hoist",
896                     "Early GVN Hoisting of Expressions", false, false)
897 
898 FunctionPass *llvm::createGVNHoistPass() { return new GVNHoistLegacyPass(); }
899