xref: /netbsd-src/external/apache2/llvm/dist/llvm/lib/CodeGen/RegUsageInfoCollector.cpp (revision 7330f729ccf0bd976a06f95fad452fe774fc7fd1)
1*7330f729Sjoerg //===-- RegUsageInfoCollector.cpp - Register Usage Information Collector --===//
2*7330f729Sjoerg //
3*7330f729Sjoerg // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*7330f729Sjoerg // See https://llvm.org/LICENSE.txt for license information.
5*7330f729Sjoerg // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*7330f729Sjoerg //
7*7330f729Sjoerg //===----------------------------------------------------------------------===//
8*7330f729Sjoerg ///
9*7330f729Sjoerg /// This pass is required to take advantage of the interprocedural register
10*7330f729Sjoerg /// allocation infrastructure.
11*7330f729Sjoerg ///
12*7330f729Sjoerg /// This pass is simple MachineFunction pass which collects register usage
13*7330f729Sjoerg /// details by iterating through each physical registers and checking
14*7330f729Sjoerg /// MRI::isPhysRegUsed() then creates a RegMask based on this details.
15*7330f729Sjoerg /// The pass then stores this RegMask in PhysicalRegisterUsageInfo.cpp
16*7330f729Sjoerg ///
17*7330f729Sjoerg //===----------------------------------------------------------------------===//
18*7330f729Sjoerg 
19*7330f729Sjoerg #include "llvm/ADT/Statistic.h"
20*7330f729Sjoerg #include "llvm/CodeGen/MachineBasicBlock.h"
21*7330f729Sjoerg #include "llvm/CodeGen/MachineFunctionPass.h"
22*7330f729Sjoerg #include "llvm/CodeGen/MachineInstr.h"
23*7330f729Sjoerg #include "llvm/CodeGen/MachineOperand.h"
24*7330f729Sjoerg #include "llvm/CodeGen/MachineRegisterInfo.h"
25*7330f729Sjoerg #include "llvm/CodeGen/Passes.h"
26*7330f729Sjoerg #include "llvm/CodeGen/RegisterUsageInfo.h"
27*7330f729Sjoerg #include "llvm/Support/Debug.h"
28*7330f729Sjoerg #include "llvm/Support/raw_ostream.h"
29*7330f729Sjoerg #include "llvm/CodeGen/TargetFrameLowering.h"
30*7330f729Sjoerg 
31*7330f729Sjoerg using namespace llvm;
32*7330f729Sjoerg 
33*7330f729Sjoerg #define DEBUG_TYPE "ip-regalloc"
34*7330f729Sjoerg 
35*7330f729Sjoerg STATISTIC(NumCSROpt,
36*7330f729Sjoerg           "Number of functions optimized for callee saved registers");
37*7330f729Sjoerg 
38*7330f729Sjoerg namespace {
39*7330f729Sjoerg 
40*7330f729Sjoerg class RegUsageInfoCollector : public MachineFunctionPass {
41*7330f729Sjoerg public:
RegUsageInfoCollector()42*7330f729Sjoerg   RegUsageInfoCollector() : MachineFunctionPass(ID) {
43*7330f729Sjoerg     PassRegistry &Registry = *PassRegistry::getPassRegistry();
44*7330f729Sjoerg     initializeRegUsageInfoCollectorPass(Registry);
45*7330f729Sjoerg   }
46*7330f729Sjoerg 
getPassName() const47*7330f729Sjoerg   StringRef getPassName() const override {
48*7330f729Sjoerg     return "Register Usage Information Collector Pass";
49*7330f729Sjoerg   }
50*7330f729Sjoerg 
getAnalysisUsage(AnalysisUsage & AU) const51*7330f729Sjoerg   void getAnalysisUsage(AnalysisUsage &AU) const override {
52*7330f729Sjoerg     AU.addRequired<PhysicalRegisterUsageInfo>();
53*7330f729Sjoerg     AU.setPreservesAll();
54*7330f729Sjoerg     MachineFunctionPass::getAnalysisUsage(AU);
55*7330f729Sjoerg   }
56*7330f729Sjoerg 
57*7330f729Sjoerg   bool runOnMachineFunction(MachineFunction &MF) override;
58*7330f729Sjoerg 
59*7330f729Sjoerg   // Call getCalleeSaves and then also set the bits for subregs and
60*7330f729Sjoerg   // fully saved superregs.
61*7330f729Sjoerg   static void computeCalleeSavedRegs(BitVector &SavedRegs, MachineFunction &MF);
62*7330f729Sjoerg 
63*7330f729Sjoerg   static char ID;
64*7330f729Sjoerg };
65*7330f729Sjoerg 
66*7330f729Sjoerg } // end of anonymous namespace
67*7330f729Sjoerg 
68*7330f729Sjoerg char RegUsageInfoCollector::ID = 0;
69*7330f729Sjoerg 
70*7330f729Sjoerg INITIALIZE_PASS_BEGIN(RegUsageInfoCollector, "RegUsageInfoCollector",
71*7330f729Sjoerg                       "Register Usage Information Collector", false, false)
INITIALIZE_PASS_DEPENDENCY(PhysicalRegisterUsageInfo)72*7330f729Sjoerg INITIALIZE_PASS_DEPENDENCY(PhysicalRegisterUsageInfo)
73*7330f729Sjoerg INITIALIZE_PASS_END(RegUsageInfoCollector, "RegUsageInfoCollector",
74*7330f729Sjoerg                     "Register Usage Information Collector", false, false)
75*7330f729Sjoerg 
76*7330f729Sjoerg FunctionPass *llvm::createRegUsageInfoCollector() {
77*7330f729Sjoerg   return new RegUsageInfoCollector();
78*7330f729Sjoerg }
79*7330f729Sjoerg 
80*7330f729Sjoerg // TODO: Move to hook somwehere?
81*7330f729Sjoerg 
82*7330f729Sjoerg // Return true if it is useful to track the used registers for IPRA / no CSR
83*7330f729Sjoerg // optimizations. This is not useful for entry points, and computing the
84*7330f729Sjoerg // register usage information is expensive.
isCallableFunction(const MachineFunction & MF)85*7330f729Sjoerg static bool isCallableFunction(const MachineFunction &MF) {
86*7330f729Sjoerg   switch (MF.getFunction().getCallingConv()) {
87*7330f729Sjoerg   case CallingConv::AMDGPU_VS:
88*7330f729Sjoerg   case CallingConv::AMDGPU_GS:
89*7330f729Sjoerg   case CallingConv::AMDGPU_PS:
90*7330f729Sjoerg   case CallingConv::AMDGPU_CS:
91*7330f729Sjoerg   case CallingConv::AMDGPU_HS:
92*7330f729Sjoerg   case CallingConv::AMDGPU_ES:
93*7330f729Sjoerg   case CallingConv::AMDGPU_LS:
94*7330f729Sjoerg   case CallingConv::AMDGPU_KERNEL:
95*7330f729Sjoerg     return false;
96*7330f729Sjoerg   default:
97*7330f729Sjoerg     return true;
98*7330f729Sjoerg   }
99*7330f729Sjoerg }
100*7330f729Sjoerg 
runOnMachineFunction(MachineFunction & MF)101*7330f729Sjoerg bool RegUsageInfoCollector::runOnMachineFunction(MachineFunction &MF) {
102*7330f729Sjoerg   MachineRegisterInfo *MRI = &MF.getRegInfo();
103*7330f729Sjoerg   const TargetRegisterInfo *TRI = MF.getSubtarget().getRegisterInfo();
104*7330f729Sjoerg   const LLVMTargetMachine &TM = MF.getTarget();
105*7330f729Sjoerg 
106*7330f729Sjoerg   LLVM_DEBUG(dbgs() << " -------------------- " << getPassName()
107*7330f729Sjoerg                     << " -------------------- \nFunction Name : "
108*7330f729Sjoerg                     << MF.getName() << '\n');
109*7330f729Sjoerg 
110*7330f729Sjoerg   // Analyzing the register usage may be expensive on some targets.
111*7330f729Sjoerg   if (!isCallableFunction(MF)) {
112*7330f729Sjoerg     LLVM_DEBUG(dbgs() << "Not analyzing non-callable function\n");
113*7330f729Sjoerg     return false;
114*7330f729Sjoerg   }
115*7330f729Sjoerg 
116*7330f729Sjoerg   // If there are no callers, there's no point in computing more precise
117*7330f729Sjoerg   // register usage here.
118*7330f729Sjoerg   if (MF.getFunction().use_empty()) {
119*7330f729Sjoerg     LLVM_DEBUG(dbgs() << "Not analyzing function with no callers\n");
120*7330f729Sjoerg     return false;
121*7330f729Sjoerg   }
122*7330f729Sjoerg 
123*7330f729Sjoerg   std::vector<uint32_t> RegMask;
124*7330f729Sjoerg 
125*7330f729Sjoerg   // Compute the size of the bit vector to represent all the registers.
126*7330f729Sjoerg   // The bit vector is broken into 32-bit chunks, thus takes the ceil of
127*7330f729Sjoerg   // the number of registers divided by 32 for the size.
128*7330f729Sjoerg   unsigned RegMaskSize = MachineOperand::getRegMaskSize(TRI->getNumRegs());
129*7330f729Sjoerg   RegMask.resize(RegMaskSize, ~((uint32_t)0));
130*7330f729Sjoerg 
131*7330f729Sjoerg   const Function &F = MF.getFunction();
132*7330f729Sjoerg 
133*7330f729Sjoerg   PhysicalRegisterUsageInfo &PRUI = getAnalysis<PhysicalRegisterUsageInfo>();
134*7330f729Sjoerg   PRUI.setTargetMachine(TM);
135*7330f729Sjoerg 
136*7330f729Sjoerg   LLVM_DEBUG(dbgs() << "Clobbered Registers: ");
137*7330f729Sjoerg 
138*7330f729Sjoerg   BitVector SavedRegs;
139*7330f729Sjoerg   computeCalleeSavedRegs(SavedRegs, MF);
140*7330f729Sjoerg 
141*7330f729Sjoerg   const BitVector &UsedPhysRegsMask = MRI->getUsedPhysRegsMask();
142*7330f729Sjoerg   auto SetRegAsDefined = [&RegMask] (unsigned Reg) {
143*7330f729Sjoerg     RegMask[Reg / 32] &= ~(1u << Reg % 32);
144*7330f729Sjoerg   };
145*7330f729Sjoerg 
146*7330f729Sjoerg   // Some targets can clobber registers "inside" a call, typically in
147*7330f729Sjoerg   // linker-generated code.
148*7330f729Sjoerg   for (const MCPhysReg Reg : TRI->getIntraCallClobberedRegs(&MF))
149*7330f729Sjoerg     for (MCRegAliasIterator AI(Reg, TRI, true); AI.isValid(); ++AI)
150*7330f729Sjoerg       SetRegAsDefined(*AI);
151*7330f729Sjoerg 
152*7330f729Sjoerg   // Scan all the physical registers. When a register is defined in the current
153*7330f729Sjoerg   // function set it and all the aliasing registers as defined in the regmask.
154*7330f729Sjoerg   // FIXME: Rewrite to use regunits.
155*7330f729Sjoerg   for (unsigned PReg = 1, PRegE = TRI->getNumRegs(); PReg < PRegE; ++PReg) {
156*7330f729Sjoerg     // Don't count registers that are saved and restored.
157*7330f729Sjoerg     if (SavedRegs.test(PReg))
158*7330f729Sjoerg       continue;
159*7330f729Sjoerg     // If a register is defined by an instruction mark it as defined together
160*7330f729Sjoerg     // with all it's unsaved aliases.
161*7330f729Sjoerg     if (!MRI->def_empty(PReg)) {
162*7330f729Sjoerg       for (MCRegAliasIterator AI(PReg, TRI, true); AI.isValid(); ++AI)
163*7330f729Sjoerg         if (!SavedRegs.test(*AI))
164*7330f729Sjoerg           SetRegAsDefined(*AI);
165*7330f729Sjoerg       continue;
166*7330f729Sjoerg     }
167*7330f729Sjoerg     // If a register is in the UsedPhysRegsMask set then mark it as defined.
168*7330f729Sjoerg     // All clobbered aliases will also be in the set, so we can skip setting
169*7330f729Sjoerg     // as defined all the aliases here.
170*7330f729Sjoerg     if (UsedPhysRegsMask.test(PReg))
171*7330f729Sjoerg       SetRegAsDefined(PReg);
172*7330f729Sjoerg   }
173*7330f729Sjoerg 
174*7330f729Sjoerg   if (TargetFrameLowering::isSafeForNoCSROpt(F) &&
175*7330f729Sjoerg       MF.getSubtarget().getFrameLowering()->isProfitableForNoCSROpt(F)) {
176*7330f729Sjoerg     ++NumCSROpt;
177*7330f729Sjoerg     LLVM_DEBUG(dbgs() << MF.getName()
178*7330f729Sjoerg                       << " function optimized for not having CSR.\n");
179*7330f729Sjoerg   }
180*7330f729Sjoerg 
181*7330f729Sjoerg   LLVM_DEBUG(
182*7330f729Sjoerg     for (unsigned PReg = 1, PRegE = TRI->getNumRegs(); PReg < PRegE; ++PReg) {
183*7330f729Sjoerg       if (MachineOperand::clobbersPhysReg(&(RegMask[0]), PReg))
184*7330f729Sjoerg         dbgs() << printReg(PReg, TRI) << " ";
185*7330f729Sjoerg     }
186*7330f729Sjoerg 
187*7330f729Sjoerg     dbgs() << " \n----------------------------------------\n";
188*7330f729Sjoerg   );
189*7330f729Sjoerg 
190*7330f729Sjoerg   PRUI.storeUpdateRegUsageInfo(F, RegMask);
191*7330f729Sjoerg 
192*7330f729Sjoerg   return false;
193*7330f729Sjoerg }
194*7330f729Sjoerg 
195*7330f729Sjoerg void RegUsageInfoCollector::
computeCalleeSavedRegs(BitVector & SavedRegs,MachineFunction & MF)196*7330f729Sjoerg computeCalleeSavedRegs(BitVector &SavedRegs, MachineFunction &MF) {
197*7330f729Sjoerg   const TargetFrameLowering &TFI = *MF.getSubtarget().getFrameLowering();
198*7330f729Sjoerg   const TargetRegisterInfo &TRI = *MF.getSubtarget().getRegisterInfo();
199*7330f729Sjoerg 
200*7330f729Sjoerg   // Target will return the set of registers that it saves/restores as needed.
201*7330f729Sjoerg   SavedRegs.clear();
202*7330f729Sjoerg   TFI.getCalleeSaves(MF, SavedRegs);
203*7330f729Sjoerg   if (SavedRegs.none())
204*7330f729Sjoerg     return;
205*7330f729Sjoerg 
206*7330f729Sjoerg   // Insert subregs.
207*7330f729Sjoerg   const MCPhysReg *CSRegs = TRI.getCalleeSavedRegs(&MF);
208*7330f729Sjoerg   for (unsigned i = 0; CSRegs[i]; ++i) {
209*7330f729Sjoerg     MCPhysReg Reg = CSRegs[i];
210*7330f729Sjoerg     if (SavedRegs.test(Reg)) {
211*7330f729Sjoerg       // Save subregisters
212*7330f729Sjoerg       for (MCSubRegIterator SR(Reg, &TRI); SR.isValid(); ++SR)
213*7330f729Sjoerg         SavedRegs.set(*SR);
214*7330f729Sjoerg     }
215*7330f729Sjoerg   }
216*7330f729Sjoerg }
217