xref: /llvm-project/llvm/lib/CodeGen/StackSlotColoring.cpp (revision f6d431f208c0fa48827eac40e7acf788346a9967)
1 //===- StackSlotColoring.cpp - Stack slot coloring pass. ------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements the stack slot coloring pass.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "llvm/ADT/BitVector.h"
14 #include "llvm/ADT/SmallVector.h"
15 #include "llvm/ADT/Statistic.h"
16 #include "llvm/CodeGen/LiveInterval.h"
17 #include "llvm/CodeGen/LiveIntervalUnion.h"
18 #include "llvm/CodeGen/LiveIntervals.h"
19 #include "llvm/CodeGen/LiveStacks.h"
20 #include "llvm/CodeGen/MachineBasicBlock.h"
21 #include "llvm/CodeGen/MachineBlockFrequencyInfo.h"
22 #include "llvm/CodeGen/MachineFrameInfo.h"
23 #include "llvm/CodeGen/MachineFunction.h"
24 #include "llvm/CodeGen/MachineFunctionPass.h"
25 #include "llvm/CodeGen/MachineInstr.h"
26 #include "llvm/CodeGen/MachineMemOperand.h"
27 #include "llvm/CodeGen/MachineOperand.h"
28 #include "llvm/CodeGen/Passes.h"
29 #include "llvm/CodeGen/PseudoSourceValue.h"
30 #include "llvm/CodeGen/PseudoSourceValueManager.h"
31 #include "llvm/CodeGen/SlotIndexes.h"
32 #include "llvm/CodeGen/TargetInstrInfo.h"
33 #include "llvm/CodeGen/TargetSubtargetInfo.h"
34 #include "llvm/InitializePasses.h"
35 #include "llvm/Pass.h"
36 #include "llvm/Support/Casting.h"
37 #include "llvm/Support/CommandLine.h"
38 #include "llvm/Support/Debug.h"
39 #include "llvm/Support/raw_ostream.h"
40 #include <algorithm>
41 #include <cassert>
42 #include <cstdint>
43 #include <iterator>
44 #include <vector>
45 
46 using namespace llvm;
47 
48 #define DEBUG_TYPE "stack-slot-coloring"
49 
50 static cl::opt<bool>
51 DisableSharing("no-stack-slot-sharing",
52              cl::init(false), cl::Hidden,
53              cl::desc("Suppress slot sharing during stack coloring"));
54 
55 static cl::opt<int> DCELimit("ssc-dce-limit", cl::init(-1), cl::Hidden);
56 
57 STATISTIC(NumEliminated, "Number of stack slots eliminated due to coloring");
58 STATISTIC(NumDead,       "Number of trivially dead stack accesses eliminated");
59 
60 namespace {
61 
62   class StackSlotColoring : public MachineFunctionPass {
63     LiveStacks *LS = nullptr;
64     MachineFrameInfo *MFI = nullptr;
65     const TargetInstrInfo *TII = nullptr;
66     const MachineBlockFrequencyInfo *MBFI = nullptr;
67 
68     // SSIntervals - Spill slot intervals.
69     std::vector<LiveInterval*> SSIntervals;
70 
71     // SSRefs - Keep a list of MachineMemOperands for each spill slot.
72     // MachineMemOperands can be shared between instructions, so we need
73     // to be careful that renames like [FI0, FI1] -> [FI1, FI2] do not
74     // become FI0 -> FI1 -> FI2.
75     SmallVector<SmallVector<MachineMemOperand *, 8>, 16> SSRefs;
76 
77     // OrigAlignments - Alignments of stack objects before coloring.
78     SmallVector<Align, 16> OrigAlignments;
79 
80     // OrigSizes - Sizes of stack objects before coloring.
81     SmallVector<unsigned, 16> OrigSizes;
82 
83     // AllColors - If index is set, it's a spill slot, i.e. color.
84     // FIXME: This assumes PEI locate spill slot with smaller indices
85     // closest to stack pointer / frame pointer. Therefore, smaller
86     // index == better color. This is per stack ID.
87     SmallVector<BitVector, 2> AllColors;
88 
89     // NextColor - Next "color" that's not yet used. This is per stack ID.
90     SmallVector<int, 2> NextColors = { -1 };
91 
92     // UsedColors - "Colors" that have been assigned. This is per stack ID
93     SmallVector<BitVector, 2> UsedColors;
94 
95     // Join all intervals sharing one color into a single LiveIntervalUnion to
96     // speedup range overlap test.
97     class ColorAssignmentInfo {
98       // Single liverange (used to avoid creation of LiveIntervalUnion).
99       LiveInterval *SingleLI = nullptr;
100       // LiveIntervalUnion to perform overlap test.
101       LiveIntervalUnion *LIU = nullptr;
102       // LiveIntervalUnion has a parameter in its constructor so doing this
103       // dirty magic.
104       uint8_t LIUPad[sizeof(LiveIntervalUnion)];
105 
106     public:
107       ~ColorAssignmentInfo() {
108         if (LIU)
109           LIU->~LiveIntervalUnion(); // Dirty magic again.
110       }
111 
112       // Return true if LiveInterval overlaps with any
113       // intervals that have already been assigned to this color.
114       bool overlaps(LiveInterval *LI) const {
115         if (LIU)
116           return LiveIntervalUnion::Query(*LI, *LIU).checkInterference();
117         return SingleLI ? SingleLI->overlaps(*LI) : false;
118       }
119 
120       // Add new LiveInterval to this color.
121       void add(LiveInterval *LI, LiveIntervalUnion::Allocator &Alloc) {
122         assert(!overlaps(LI));
123         if (LIU) {
124           LIU->unify(*LI, *LI);
125         } else if (SingleLI) {
126           LIU = new (LIUPad) LiveIntervalUnion(Alloc);
127           LIU->unify(*SingleLI, *SingleLI);
128           LIU->unify(*LI, *LI);
129           SingleLI = nullptr;
130         } else
131           SingleLI = LI;
132       }
133     };
134 
135     LiveIntervalUnion::Allocator LIUAlloc;
136 
137     // Assignments - Color to intervals mapping.
138     SmallVector<ColorAssignmentInfo, 16> Assignments;
139 
140   public:
141     static char ID; // Pass identification
142 
143     StackSlotColoring() : MachineFunctionPass(ID) {
144       initializeStackSlotColoringPass(*PassRegistry::getPassRegistry());
145     }
146 
147     void getAnalysisUsage(AnalysisUsage &AU) const override {
148       AU.setPreservesCFG();
149       AU.addRequired<SlotIndexes>();
150       AU.addPreserved<SlotIndexes>();
151       AU.addRequired<LiveStacks>();
152       AU.addRequired<MachineBlockFrequencyInfo>();
153       AU.addPreserved<MachineBlockFrequencyInfo>();
154       AU.addPreservedID(MachineDominatorsID);
155       MachineFunctionPass::getAnalysisUsage(AU);
156     }
157 
158     bool runOnMachineFunction(MachineFunction &MF) override;
159 
160   private:
161     void InitializeSlots();
162     void ScanForSpillSlotRefs(MachineFunction &MF);
163     int ColorSlot(LiveInterval *li);
164     bool ColorSlots(MachineFunction &MF);
165     void RewriteInstruction(MachineInstr &MI, SmallVectorImpl<int> &SlotMapping,
166                             MachineFunction &MF);
167     bool RemoveDeadStores(MachineBasicBlock* MBB);
168   };
169 
170 } // end anonymous namespace
171 
172 char StackSlotColoring::ID = 0;
173 
174 char &llvm::StackSlotColoringID = StackSlotColoring::ID;
175 
176 INITIALIZE_PASS_BEGIN(StackSlotColoring, DEBUG_TYPE,
177                 "Stack Slot Coloring", false, false)
178 INITIALIZE_PASS_DEPENDENCY(SlotIndexes)
179 INITIALIZE_PASS_DEPENDENCY(LiveStacks)
180 INITIALIZE_PASS_DEPENDENCY(MachineLoopInfo)
181 INITIALIZE_PASS_END(StackSlotColoring, DEBUG_TYPE,
182                 "Stack Slot Coloring", false, false)
183 
184 namespace {
185 
186 // IntervalSorter - Comparison predicate that sort live intervals by
187 // their weight.
188 struct IntervalSorter {
189   bool operator()(LiveInterval* LHS, LiveInterval* RHS) const {
190     return LHS->weight() > RHS->weight();
191   }
192 };
193 
194 } // end anonymous namespace
195 
196 /// ScanForSpillSlotRefs - Scan all the machine instructions for spill slot
197 /// references and update spill slot weights.
198 void StackSlotColoring::ScanForSpillSlotRefs(MachineFunction &MF) {
199   SSRefs.resize(MFI->getObjectIndexEnd());
200 
201   // FIXME: Need the equivalent of MachineRegisterInfo for frameindex operands.
202   for (MachineBasicBlock &MBB : MF) {
203     for (MachineInstr &MI : MBB) {
204       for (const MachineOperand &MO : MI.operands()) {
205         if (!MO.isFI())
206           continue;
207         int FI = MO.getIndex();
208         if (FI < 0)
209           continue;
210         if (!LS->hasInterval(FI))
211           continue;
212         LiveInterval &li = LS->getInterval(FI);
213         if (!MI.isDebugInstr())
214           li.incrementWeight(
215               LiveIntervals::getSpillWeight(false, true, MBFI, MI));
216       }
217       for (MachineInstr::mmo_iterator MMOI = MI.memoperands_begin(),
218                                       EE = MI.memoperands_end();
219            MMOI != EE; ++MMOI) {
220         MachineMemOperand *MMO = *MMOI;
221         if (const FixedStackPseudoSourceValue *FSV =
222             dyn_cast_or_null<FixedStackPseudoSourceValue>(
223                 MMO->getPseudoValue())) {
224           int FI = FSV->getFrameIndex();
225           if (FI >= 0)
226             SSRefs[FI].push_back(MMO);
227         }
228       }
229     }
230   }
231 }
232 
233 /// InitializeSlots - Process all spill stack slot liveintervals and add them
234 /// to a sorted (by weight) list.
235 void StackSlotColoring::InitializeSlots() {
236   int LastFI = MFI->getObjectIndexEnd();
237 
238   // There is always at least one stack ID.
239   AllColors.resize(1);
240   UsedColors.resize(1);
241 
242   OrigAlignments.resize(LastFI);
243   OrigSizes.resize(LastFI);
244   AllColors[0].resize(LastFI);
245   UsedColors[0].resize(LastFI);
246   Assignments.resize(LastFI);
247 
248   using Pair = std::iterator_traits<LiveStacks::iterator>::value_type;
249 
250   SmallVector<Pair *, 16> Intervals;
251 
252   Intervals.reserve(LS->getNumIntervals());
253   for (auto &I : *LS)
254     Intervals.push_back(&I);
255   llvm::sort(Intervals,
256              [](Pair *LHS, Pair *RHS) { return LHS->first < RHS->first; });
257 
258   // Gather all spill slots into a list.
259   LLVM_DEBUG(dbgs() << "Spill slot intervals:\n");
260   for (auto *I : Intervals) {
261     LiveInterval &li = I->second;
262     LLVM_DEBUG(li.dump());
263     int FI = Register::stackSlot2Index(li.reg());
264     if (MFI->isDeadObjectIndex(FI))
265       continue;
266 
267     SSIntervals.push_back(&li);
268     OrigAlignments[FI] = MFI->getObjectAlign(FI);
269     OrigSizes[FI]      = MFI->getObjectSize(FI);
270 
271     auto StackID = MFI->getStackID(FI);
272     if (StackID != 0) {
273       AllColors.resize(StackID + 1);
274       UsedColors.resize(StackID + 1);
275       AllColors[StackID].resize(LastFI);
276       UsedColors[StackID].resize(LastFI);
277     }
278 
279     AllColors[StackID].set(FI);
280   }
281   LLVM_DEBUG(dbgs() << '\n');
282 
283   // Sort them by weight.
284   llvm::stable_sort(SSIntervals, IntervalSorter());
285 
286   NextColors.resize(AllColors.size());
287 
288   // Get first "color".
289   for (unsigned I = 0, E = AllColors.size(); I != E; ++I)
290     NextColors[I] = AllColors[I].find_first();
291 }
292 
293 /// ColorSlot - Assign a "color" (stack slot) to the specified stack slot.
294 int StackSlotColoring::ColorSlot(LiveInterval *li) {
295   int Color = -1;
296   bool Share = false;
297   int FI = Register::stackSlot2Index(li->reg());
298   uint8_t StackID = MFI->getStackID(FI);
299 
300   if (!DisableSharing) {
301 
302     // Check if it's possible to reuse any of the used colors.
303     Color = UsedColors[StackID].find_first();
304     while (Color != -1) {
305       if (!Assignments[Color].overlaps(li)) {
306         Share = true;
307         ++NumEliminated;
308         break;
309       }
310       Color = UsedColors[StackID].find_next(Color);
311     }
312   }
313 
314   if (Color != -1 && MFI->getStackID(Color) != MFI->getStackID(FI)) {
315     LLVM_DEBUG(dbgs() << "cannot share FIs with different stack IDs\n");
316     Share = false;
317   }
318 
319   // Assign it to the first available color (assumed to be the best) if it's
320   // not possible to share a used color with other objects.
321   if (!Share) {
322     assert(NextColors[StackID] != -1 && "No more spill slots?");
323     Color = NextColors[StackID];
324     UsedColors[StackID].set(Color);
325     NextColors[StackID] = AllColors[StackID].find_next(NextColors[StackID]);
326   }
327 
328   assert(MFI->getStackID(Color) == MFI->getStackID(FI));
329 
330   // Record the assignment.
331   Assignments[Color].add(li, LIUAlloc);
332   LLVM_DEBUG(dbgs() << "Assigning fi#" << FI << " to fi#" << Color << "\n");
333 
334   // Change size and alignment of the allocated slot. If there are multiple
335   // objects sharing the same slot, then make sure the size and alignment
336   // are large enough for all.
337   Align Alignment = OrigAlignments[FI];
338   if (!Share || Alignment > MFI->getObjectAlign(Color))
339     MFI->setObjectAlignment(Color, Alignment);
340   int64_t Size = OrigSizes[FI];
341   if (!Share || Size > MFI->getObjectSize(Color))
342     MFI->setObjectSize(Color, Size);
343   return Color;
344 }
345 
346 /// Colorslots - Color all spill stack slots and rewrite all frameindex machine
347 /// operands in the function.
348 bool StackSlotColoring::ColorSlots(MachineFunction &MF) {
349   unsigned NumObjs = MFI->getObjectIndexEnd();
350   SmallVector<int, 16> SlotMapping(NumObjs, -1);
351   SmallVector<float, 16> SlotWeights(NumObjs, 0.0);
352   SmallVector<SmallVector<int, 4>, 16> RevMap(NumObjs);
353   BitVector UsedColors(NumObjs);
354 
355   LLVM_DEBUG(dbgs() << "Color spill slot intervals:\n");
356   bool Changed = false;
357   for (LiveInterval *li : SSIntervals) {
358     int SS = Register::stackSlot2Index(li->reg());
359     int NewSS = ColorSlot(li);
360     assert(NewSS >= 0 && "Stack coloring failed?");
361     SlotMapping[SS] = NewSS;
362     RevMap[NewSS].push_back(SS);
363     SlotWeights[NewSS] += li->weight();
364     UsedColors.set(NewSS);
365     Changed |= (SS != NewSS);
366   }
367 
368   LLVM_DEBUG(dbgs() << "\nSpill slots after coloring:\n");
369   for (LiveInterval *li : SSIntervals) {
370     int SS = Register::stackSlot2Index(li->reg());
371     li->setWeight(SlotWeights[SS]);
372   }
373   // Sort them by new weight.
374   llvm::stable_sort(SSIntervals, IntervalSorter());
375 
376 #ifndef NDEBUG
377   for (LiveInterval *li : SSIntervals)
378     LLVM_DEBUG(li->dump());
379   LLVM_DEBUG(dbgs() << '\n');
380 #endif
381 
382   if (!Changed)
383     return false;
384 
385   // Rewrite all MachineMemOperands.
386   for (unsigned SS = 0, SE = SSRefs.size(); SS != SE; ++SS) {
387     int NewFI = SlotMapping[SS];
388     if (NewFI == -1 || (NewFI == (int)SS))
389       continue;
390 
391     const PseudoSourceValue *NewSV = MF.getPSVManager().getFixedStack(NewFI);
392     SmallVectorImpl<MachineMemOperand *> &RefMMOs = SSRefs[SS];
393     for (unsigned i = 0, e = RefMMOs.size(); i != e; ++i)
394       RefMMOs[i]->setValue(NewSV);
395   }
396 
397   // Rewrite all MO_FrameIndex operands.  Look for dead stores.
398   for (MachineBasicBlock &MBB : MF) {
399     for (MachineInstr &MI : MBB)
400       RewriteInstruction(MI, SlotMapping, MF);
401     RemoveDeadStores(&MBB);
402   }
403 
404   // Delete unused stack slots.
405   for (int StackID = 0, E = AllColors.size(); StackID != E; ++StackID) {
406     int NextColor = NextColors[StackID];
407     while (NextColor != -1) {
408       LLVM_DEBUG(dbgs() << "Removing unused stack object fi#" << NextColor << "\n");
409       MFI->RemoveStackObject(NextColor);
410       NextColor = AllColors[StackID].find_next(NextColor);
411     }
412   }
413 
414   return true;
415 }
416 
417 /// RewriteInstruction - Rewrite specified instruction by replacing references
418 /// to old frame index with new one.
419 void StackSlotColoring::RewriteInstruction(MachineInstr &MI,
420                                            SmallVectorImpl<int> &SlotMapping,
421                                            MachineFunction &MF) {
422   // Update the operands.
423   for (MachineOperand &MO : MI.operands()) {
424     if (!MO.isFI())
425       continue;
426     int OldFI = MO.getIndex();
427     if (OldFI < 0)
428       continue;
429     int NewFI = SlotMapping[OldFI];
430     if (NewFI == -1 || NewFI == OldFI)
431       continue;
432 
433     assert(MFI->getStackID(OldFI) == MFI->getStackID(NewFI));
434     MO.setIndex(NewFI);
435   }
436 
437   // The MachineMemOperands have already been updated.
438 }
439 
440 /// RemoveDeadStores - Scan through a basic block and look for loads followed
441 /// by stores.  If they're both using the same stack slot, then the store is
442 /// definitely dead.  This could obviously be much more aggressive (consider
443 /// pairs with instructions between them), but such extensions might have a
444 /// considerable compile time impact.
445 bool StackSlotColoring::RemoveDeadStores(MachineBasicBlock* MBB) {
446   // FIXME: This could be much more aggressive, but we need to investigate
447   // the compile time impact of doing so.
448   bool changed = false;
449 
450   SmallVector<MachineInstr*, 4> toErase;
451 
452   for (MachineBasicBlock::iterator I = MBB->begin(), E = MBB->end();
453        I != E; ++I) {
454     if (DCELimit != -1 && (int)NumDead >= DCELimit)
455       break;
456     int FirstSS, SecondSS;
457     if (TII->isStackSlotCopy(*I, FirstSS, SecondSS) && FirstSS == SecondSS &&
458         FirstSS != -1) {
459       ++NumDead;
460       changed = true;
461       toErase.push_back(&*I);
462       continue;
463     }
464 
465     MachineBasicBlock::iterator NextMI = std::next(I);
466     MachineBasicBlock::iterator ProbableLoadMI = I;
467 
468     unsigned LoadReg = 0;
469     unsigned StoreReg = 0;
470     unsigned LoadSize = 0;
471     unsigned StoreSize = 0;
472     if (!(LoadReg = TII->isLoadFromStackSlot(*I, FirstSS, LoadSize)))
473       continue;
474     // Skip the ...pseudo debugging... instructions between a load and store.
475     while ((NextMI != E) && NextMI->isDebugInstr()) {
476       ++NextMI;
477       ++I;
478     }
479     if (NextMI == E) continue;
480     if (!(StoreReg = TII->isStoreToStackSlot(*NextMI, SecondSS, StoreSize)))
481       continue;
482     if (FirstSS != SecondSS || LoadReg != StoreReg || FirstSS == -1 ||
483         LoadSize != StoreSize || !MFI->isSpillSlotObjectIndex(FirstSS))
484       continue;
485 
486     ++NumDead;
487     changed = true;
488 
489     if (NextMI->findRegisterUseOperandIdx(LoadReg, /*TRI=*/nullptr, true) !=
490         -1) {
491       ++NumDead;
492       toErase.push_back(&*ProbableLoadMI);
493     }
494 
495     toErase.push_back(&*NextMI);
496     ++I;
497   }
498 
499   for (MachineInstr *MI : toErase)
500     MI->eraseFromParent();
501 
502   return changed;
503 }
504 
505 bool StackSlotColoring::runOnMachineFunction(MachineFunction &MF) {
506   LLVM_DEBUG({
507     dbgs() << "********** Stack Slot Coloring **********\n"
508            << "********** Function: " << MF.getName() << '\n';
509   });
510 
511   if (skipFunction(MF.getFunction()))
512     return false;
513 
514   MFI = &MF.getFrameInfo();
515   TII = MF.getSubtarget().getInstrInfo();
516   LS = &getAnalysis<LiveStacks>();
517   MBFI = &getAnalysis<MachineBlockFrequencyInfo>();
518 
519   bool Changed = false;
520 
521   unsigned NumSlots = LS->getNumIntervals();
522   if (NumSlots == 0)
523     // Nothing to do!
524     return false;
525 
526   // If there are calls to setjmp or sigsetjmp, don't perform stack slot
527   // coloring. The stack could be modified before the longjmp is executed,
528   // resulting in the wrong value being used afterwards.
529   if (MF.exposesReturnsTwice())
530     return false;
531 
532   // Gather spill slot references
533   ScanForSpillSlotRefs(MF);
534   InitializeSlots();
535   Changed = ColorSlots(MF);
536 
537   for (int &Next : NextColors)
538     Next = -1;
539 
540   SSIntervals.clear();
541   for (unsigned i = 0, e = SSRefs.size(); i != e; ++i)
542     SSRefs[i].clear();
543   SSRefs.clear();
544   OrigAlignments.clear();
545   OrigSizes.clear();
546   AllColors.clear();
547   UsedColors.clear();
548   Assignments.clear();
549 
550   return Changed;
551 }
552