xref: /freebsd-src/contrib/llvm-project/llvm/lib/Target/LoongArch/LoongArchFrameLowering.cpp (revision 0fca6ea1d4eea4c934cfff25ac9ee8ad6fe95583)
181ad6265SDimitry Andric //===-- LoongArchFrameLowering.cpp - LoongArch Frame Information -*- C++ -*-==//
281ad6265SDimitry Andric //
381ad6265SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
481ad6265SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
581ad6265SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
681ad6265SDimitry Andric //
781ad6265SDimitry Andric //===----------------------------------------------------------------------===//
881ad6265SDimitry Andric //
981ad6265SDimitry Andric // This file contains the LoongArch implementation of TargetFrameLowering class.
1081ad6265SDimitry Andric //
1181ad6265SDimitry Andric //===----------------------------------------------------------------------===//
1281ad6265SDimitry Andric 
1381ad6265SDimitry Andric #include "LoongArchFrameLowering.h"
14753f127fSDimitry Andric #include "LoongArchMachineFunctionInfo.h"
1581ad6265SDimitry Andric #include "LoongArchSubtarget.h"
16753f127fSDimitry Andric #include "MCTargetDesc/LoongArchBaseInfo.h"
17bdd1243dSDimitry Andric #include "MCTargetDesc/LoongArchMCTargetDesc.h"
1881ad6265SDimitry Andric #include "llvm/CodeGen/MachineFrameInfo.h"
1981ad6265SDimitry Andric #include "llvm/CodeGen/MachineFunction.h"
2081ad6265SDimitry Andric #include "llvm/CodeGen/MachineInstrBuilder.h"
2181ad6265SDimitry Andric #include "llvm/CodeGen/MachineRegisterInfo.h"
2281ad6265SDimitry Andric #include "llvm/CodeGen/RegisterScavenging.h"
2381ad6265SDimitry Andric #include "llvm/IR/DiagnosticInfo.h"
2481ad6265SDimitry Andric #include "llvm/MC/MCDwarf.h"
2581ad6265SDimitry Andric 
2681ad6265SDimitry Andric using namespace llvm;
2781ad6265SDimitry Andric 
2881ad6265SDimitry Andric #define DEBUG_TYPE "loongarch-frame-lowering"
2981ad6265SDimitry Andric 
3081ad6265SDimitry Andric // Return true if the specified function should have a dedicated frame
3181ad6265SDimitry Andric // pointer register.  This is true if frame pointer elimination is
3281ad6265SDimitry Andric // disabled, if it needs dynamic stack realignment, if the function has
3381ad6265SDimitry Andric // variable sized allocas, or if the frame address is taken.
3481ad6265SDimitry Andric bool LoongArchFrameLowering::hasFP(const MachineFunction &MF) const {
3581ad6265SDimitry Andric   const TargetRegisterInfo *RegInfo = MF.getSubtarget().getRegisterInfo();
3681ad6265SDimitry Andric 
3781ad6265SDimitry Andric   const MachineFrameInfo &MFI = MF.getFrameInfo();
3881ad6265SDimitry Andric   return MF.getTarget().Options.DisableFramePointerElim(MF) ||
3981ad6265SDimitry Andric          RegInfo->hasStackRealignment(MF) || MFI.hasVarSizedObjects() ||
4081ad6265SDimitry Andric          MFI.isFrameAddressTaken();
4181ad6265SDimitry Andric }
4281ad6265SDimitry Andric 
4381ad6265SDimitry Andric bool LoongArchFrameLowering::hasBP(const MachineFunction &MF) const {
4481ad6265SDimitry Andric   const MachineFrameInfo &MFI = MF.getFrameInfo();
4581ad6265SDimitry Andric   const TargetRegisterInfo *TRI = STI.getRegisterInfo();
4681ad6265SDimitry Andric 
4781ad6265SDimitry Andric   return MFI.hasVarSizedObjects() && TRI->hasStackRealignment(MF);
4881ad6265SDimitry Andric }
4981ad6265SDimitry Andric 
50753f127fSDimitry Andric void LoongArchFrameLowering::adjustReg(MachineBasicBlock &MBB,
51753f127fSDimitry Andric                                        MachineBasicBlock::iterator MBBI,
52753f127fSDimitry Andric                                        const DebugLoc &DL, Register DestReg,
53753f127fSDimitry Andric                                        Register SrcReg, int64_t Val,
54753f127fSDimitry Andric                                        MachineInstr::MIFlag Flag) const {
55753f127fSDimitry Andric   const LoongArchInstrInfo *TII = STI.getInstrInfo();
56753f127fSDimitry Andric   bool IsLA64 = STI.is64Bit();
57bdd1243dSDimitry Andric   unsigned Addi = IsLA64 ? LoongArch::ADDI_D : LoongArch::ADDI_W;
58753f127fSDimitry Andric 
59753f127fSDimitry Andric   if (DestReg == SrcReg && Val == 0)
60753f127fSDimitry Andric     return;
61753f127fSDimitry Andric 
62753f127fSDimitry Andric   if (isInt<12>(Val)) {
63753f127fSDimitry Andric     // addi.w/d $DstReg, $SrcReg, Val
64bdd1243dSDimitry Andric     BuildMI(MBB, MBBI, DL, TII->get(Addi), DestReg)
65753f127fSDimitry Andric         .addReg(SrcReg)
66753f127fSDimitry Andric         .addImm(Val)
67753f127fSDimitry Andric         .setMIFlag(Flag);
68753f127fSDimitry Andric     return;
69753f127fSDimitry Andric   }
70753f127fSDimitry Andric 
71bdd1243dSDimitry Andric   // Try to split the offset across two ADDIs. We need to keep the stack pointer
72bdd1243dSDimitry Andric   // aligned after each ADDI. We need to determine the maximum value we can put
73bdd1243dSDimitry Andric   // in each ADDI. In the negative direction, we can use -2048 which is always
74bdd1243dSDimitry Andric   // sufficiently aligned. In the positive direction, we need to find the
75bdd1243dSDimitry Andric   // largest 12-bit immediate that is aligned. Exclude -4096 since it can be
76bdd1243dSDimitry Andric   // created with LU12I.W.
77bdd1243dSDimitry Andric   assert(getStackAlign().value() < 2048 && "Stack alignment too large");
78bdd1243dSDimitry Andric   int64_t MaxPosAdjStep = 2048 - getStackAlign().value();
79bdd1243dSDimitry Andric   if (Val > -4096 && Val <= (2 * MaxPosAdjStep)) {
80bdd1243dSDimitry Andric     int64_t FirstAdj = Val < 0 ? -2048 : MaxPosAdjStep;
81bdd1243dSDimitry Andric     Val -= FirstAdj;
82bdd1243dSDimitry Andric     BuildMI(MBB, MBBI, DL, TII->get(Addi), DestReg)
83bdd1243dSDimitry Andric         .addReg(SrcReg)
84bdd1243dSDimitry Andric         .addImm(FirstAdj)
85bdd1243dSDimitry Andric         .setMIFlag(Flag);
86bdd1243dSDimitry Andric     BuildMI(MBB, MBBI, DL, TII->get(Addi), DestReg)
87bdd1243dSDimitry Andric         .addReg(DestReg, RegState::Kill)
88bdd1243dSDimitry Andric         .addImm(Val)
89bdd1243dSDimitry Andric         .setMIFlag(Flag);
90bdd1243dSDimitry Andric     return;
91bdd1243dSDimitry Andric   }
92bdd1243dSDimitry Andric 
93bdd1243dSDimitry Andric   unsigned Opc = IsLA64 ? LoongArch::ADD_D : LoongArch::ADD_W;
94bdd1243dSDimitry Andric   if (Val < 0) {
95bdd1243dSDimitry Andric     Val = -Val;
96bdd1243dSDimitry Andric     Opc = IsLA64 ? LoongArch::SUB_D : LoongArch::SUB_W;
97bdd1243dSDimitry Andric   }
98bdd1243dSDimitry Andric 
99bdd1243dSDimitry Andric   MachineRegisterInfo &MRI = MBB.getParent()->getRegInfo();
100bdd1243dSDimitry Andric   Register ScratchReg = MRI.createVirtualRegister(&LoongArch::GPRRegClass);
101bdd1243dSDimitry Andric   TII->movImm(MBB, MBBI, DL, ScratchReg, Val, Flag);
102bdd1243dSDimitry Andric   BuildMI(MBB, MBBI, DL, TII->get(Opc), DestReg)
103bdd1243dSDimitry Andric       .addReg(SrcReg)
104bdd1243dSDimitry Andric       .addReg(ScratchReg, RegState::Kill)
105bdd1243dSDimitry Andric       .setMIFlag(Flag);
106753f127fSDimitry Andric }
107753f127fSDimitry Andric 
108753f127fSDimitry Andric // Determine the size of the frame and maximum call frame size.
109753f127fSDimitry Andric void LoongArchFrameLowering::determineFrameLayout(MachineFunction &MF) const {
110753f127fSDimitry Andric   MachineFrameInfo &MFI = MF.getFrameInfo();
111753f127fSDimitry Andric 
112753f127fSDimitry Andric   // Get the number of bytes to allocate from the FrameInfo.
113753f127fSDimitry Andric   uint64_t FrameSize = MFI.getStackSize();
114753f127fSDimitry Andric 
115753f127fSDimitry Andric   // Make sure the frame is aligned.
116753f127fSDimitry Andric   FrameSize = alignTo(FrameSize, getStackAlign());
117753f127fSDimitry Andric 
118753f127fSDimitry Andric   // Update frame info.
119753f127fSDimitry Andric   MFI.setStackSize(FrameSize);
120753f127fSDimitry Andric }
121753f127fSDimitry Andric 
122bdd1243dSDimitry Andric static uint64_t estimateFunctionSizeInBytes(const LoongArchInstrInfo *TII,
123bdd1243dSDimitry Andric                                             const MachineFunction &MF) {
124bdd1243dSDimitry Andric   uint64_t FuncSize = 0;
125bdd1243dSDimitry Andric   for (auto &MBB : MF)
126bdd1243dSDimitry Andric     for (auto &MI : MBB)
127bdd1243dSDimitry Andric       FuncSize += TII->getInstSizeInBytes(MI);
128bdd1243dSDimitry Andric   return FuncSize;
129bdd1243dSDimitry Andric }
130bdd1243dSDimitry Andric 
131bdd1243dSDimitry Andric static bool needScavSlotForCFR(MachineFunction &MF) {
132bdd1243dSDimitry Andric   if (!MF.getSubtarget<LoongArchSubtarget>().hasBasicF())
133bdd1243dSDimitry Andric     return false;
134bdd1243dSDimitry Andric   for (auto &MBB : MF)
135bdd1243dSDimitry Andric     for (auto &MI : MBB)
136bdd1243dSDimitry Andric       if (MI.getOpcode() == LoongArch::PseudoST_CFR)
137bdd1243dSDimitry Andric         return true;
138bdd1243dSDimitry Andric   return false;
139bdd1243dSDimitry Andric }
140bdd1243dSDimitry Andric 
141bdd1243dSDimitry Andric void LoongArchFrameLowering::processFunctionBeforeFrameFinalized(
142bdd1243dSDimitry Andric     MachineFunction &MF, RegScavenger *RS) const {
143bdd1243dSDimitry Andric   const LoongArchRegisterInfo *RI = STI.getRegisterInfo();
144bdd1243dSDimitry Andric   const TargetRegisterClass &RC = LoongArch::GPRRegClass;
145bdd1243dSDimitry Andric   const LoongArchInstrInfo *TII = STI.getInstrInfo();
146bdd1243dSDimitry Andric   LoongArchMachineFunctionInfo *LAFI =
147bdd1243dSDimitry Andric       MF.getInfo<LoongArchMachineFunctionInfo>();
148bdd1243dSDimitry Andric   MachineFrameInfo &MFI = MF.getFrameInfo();
149bdd1243dSDimitry Andric 
150bdd1243dSDimitry Andric   unsigned ScavSlotsNum = 0;
151bdd1243dSDimitry Andric 
152*0fca6ea1SDimitry Andric   // Far branches beyond 27-bit offset require a spill slot for scratch
153*0fca6ea1SDimitry Andric   // register.
154bdd1243dSDimitry Andric   bool IsLargeFunction = !isInt<27>(estimateFunctionSizeInBytes(TII, MF));
155bdd1243dSDimitry Andric   if (IsLargeFunction)
156bdd1243dSDimitry Andric     ScavSlotsNum = 1;
157bdd1243dSDimitry Andric 
158bdd1243dSDimitry Andric   // estimateStackSize has been observed to under-estimate the final stack
159bdd1243dSDimitry Andric   // size, so give ourselves wiggle-room by checking for stack size
160bdd1243dSDimitry Andric   // representable an 11-bit signed field rather than 12-bits.
161bdd1243dSDimitry Andric   if (!isInt<11>(MFI.estimateStackSize(MF)))
162bdd1243dSDimitry Andric     ScavSlotsNum = std::max(ScavSlotsNum, 1u);
163bdd1243dSDimitry Andric 
164bdd1243dSDimitry Andric   // For CFR spill.
165bdd1243dSDimitry Andric   if (needScavSlotForCFR(MF))
166bdd1243dSDimitry Andric     ++ScavSlotsNum;
167bdd1243dSDimitry Andric 
168bdd1243dSDimitry Andric   // Create emergency spill slots.
169bdd1243dSDimitry Andric   for (unsigned i = 0; i < ScavSlotsNum; ++i) {
170bdd1243dSDimitry Andric     int FI = MFI.CreateStackObject(RI->getSpillSize(RC), RI->getSpillAlign(RC),
171bdd1243dSDimitry Andric                                    false);
172bdd1243dSDimitry Andric     RS->addScavengingFrameIndex(FI);
173bdd1243dSDimitry Andric     if (IsLargeFunction && LAFI->getBranchRelaxationSpillFrameIndex() == -1)
174bdd1243dSDimitry Andric       LAFI->setBranchRelaxationSpillFrameIndex(FI);
175bdd1243dSDimitry Andric     LLVM_DEBUG(dbgs() << "Allocated FI(" << FI
176bdd1243dSDimitry Andric                       << ") as the emergency spill slot.\n");
177bdd1243dSDimitry Andric   }
178bdd1243dSDimitry Andric }
179bdd1243dSDimitry Andric 
18081ad6265SDimitry Andric void LoongArchFrameLowering::emitPrologue(MachineFunction &MF,
18181ad6265SDimitry Andric                                           MachineBasicBlock &MBB) const {
182753f127fSDimitry Andric   MachineFrameInfo &MFI = MF.getFrameInfo();
183bdd1243dSDimitry Andric   auto *LoongArchFI = MF.getInfo<LoongArchMachineFunctionInfo>();
184753f127fSDimitry Andric   const LoongArchRegisterInfo *RI = STI.getRegisterInfo();
185753f127fSDimitry Andric   const LoongArchInstrInfo *TII = STI.getInstrInfo();
186753f127fSDimitry Andric   MachineBasicBlock::iterator MBBI = MBB.begin();
187bdd1243dSDimitry Andric   bool IsLA64 = STI.is64Bit();
188753f127fSDimitry Andric 
189753f127fSDimitry Andric   Register SPReg = LoongArch::R3;
190753f127fSDimitry Andric   Register FPReg = LoongArch::R22;
191753f127fSDimitry Andric 
192753f127fSDimitry Andric   // Debug location must be unknown since the first debug location is used
193753f127fSDimitry Andric   // to determine the end of the prologue.
194753f127fSDimitry Andric   DebugLoc DL;
195bdd1243dSDimitry Andric   // All calls are tail calls in GHC calling conv, and functions have no
196bdd1243dSDimitry Andric   // prologue/epilogue.
197bdd1243dSDimitry Andric   if (MF.getFunction().getCallingConv() == CallingConv::GHC)
198bdd1243dSDimitry Andric     return;
199753f127fSDimitry Andric   // Determine the correct frame layout
200753f127fSDimitry Andric   determineFrameLayout(MF);
201753f127fSDimitry Andric 
202753f127fSDimitry Andric   // First, compute final stack size.
203753f127fSDimitry Andric   uint64_t StackSize = MFI.getStackSize();
204bdd1243dSDimitry Andric   uint64_t RealStackSize = StackSize;
205753f127fSDimitry Andric 
206753f127fSDimitry Andric   // Early exit if there is no need to allocate space in the stack.
207753f127fSDimitry Andric   if (StackSize == 0 && !MFI.adjustsStack())
208753f127fSDimitry Andric     return;
209753f127fSDimitry Andric 
210*0fca6ea1SDimitry Andric   uint64_t FirstSPAdjustAmount = getFirstSPAdjustAmount(MF);
211bdd1243dSDimitry Andric   // Split the SP adjustment to reduce the offsets of callee saved spill.
212bdd1243dSDimitry Andric   if (FirstSPAdjustAmount)
213bdd1243dSDimitry Andric     StackSize = FirstSPAdjustAmount;
214bdd1243dSDimitry Andric 
215753f127fSDimitry Andric   // Adjust stack.
216753f127fSDimitry Andric   adjustReg(MBB, MBBI, DL, SPReg, SPReg, -StackSize, MachineInstr::FrameSetup);
217753f127fSDimitry Andric   // Emit ".cfi_def_cfa_offset StackSize".
218753f127fSDimitry Andric   unsigned CFIIndex =
219753f127fSDimitry Andric       MF.addFrameInst(MCCFIInstruction::cfiDefCfaOffset(nullptr, StackSize));
220753f127fSDimitry Andric   BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
221753f127fSDimitry Andric       .addCFIIndex(CFIIndex)
222753f127fSDimitry Andric       .setMIFlag(MachineInstr::FrameSetup);
223753f127fSDimitry Andric 
224753f127fSDimitry Andric   const auto &CSI = MFI.getCalleeSavedInfo();
225753f127fSDimitry Andric 
226753f127fSDimitry Andric   // The frame pointer is callee-saved, and code has been generated for us to
227753f127fSDimitry Andric   // save it to the stack. We need to skip over the storing of callee-saved
228753f127fSDimitry Andric   // registers as the frame pointer must be modified after it has been saved
229753f127fSDimitry Andric   // to the stack, not before.
230753f127fSDimitry Andric   std::advance(MBBI, CSI.size());
231753f127fSDimitry Andric 
232753f127fSDimitry Andric   // Iterate over list of callee-saved registers and emit .cfi_offset
233753f127fSDimitry Andric   // directives.
234753f127fSDimitry Andric   for (const auto &Entry : CSI) {
235753f127fSDimitry Andric     int64_t Offset = MFI.getObjectOffset(Entry.getFrameIdx());
236753f127fSDimitry Andric     unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::createOffset(
237753f127fSDimitry Andric         nullptr, RI->getDwarfRegNum(Entry.getReg(), true), Offset));
238753f127fSDimitry Andric     BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
239753f127fSDimitry Andric         .addCFIIndex(CFIIndex)
240753f127fSDimitry Andric         .setMIFlag(MachineInstr::FrameSetup);
241753f127fSDimitry Andric   }
242753f127fSDimitry Andric 
243753f127fSDimitry Andric   // Generate new FP.
244753f127fSDimitry Andric   if (hasFP(MF)) {
245bdd1243dSDimitry Andric     adjustReg(MBB, MBBI, DL, FPReg, SPReg,
246bdd1243dSDimitry Andric               StackSize - LoongArchFI->getVarArgsSaveSize(),
247bdd1243dSDimitry Andric               MachineInstr::FrameSetup);
248753f127fSDimitry Andric 
249bdd1243dSDimitry Andric     // Emit ".cfi_def_cfa $fp, LoongArchFI->getVarArgsSaveSize()"
250bdd1243dSDimitry Andric     unsigned CFIIndex = MF.addFrameInst(
251bdd1243dSDimitry Andric         MCCFIInstruction::cfiDefCfa(nullptr, RI->getDwarfRegNum(FPReg, true),
252bdd1243dSDimitry Andric                                     LoongArchFI->getVarArgsSaveSize()));
253753f127fSDimitry Andric     BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
254753f127fSDimitry Andric         .addCFIIndex(CFIIndex)
255753f127fSDimitry Andric         .setMIFlag(MachineInstr::FrameSetup);
256753f127fSDimitry Andric   }
257bdd1243dSDimitry Andric 
258bdd1243dSDimitry Andric   // Emit the second SP adjustment after saving callee saved registers.
259*0fca6ea1SDimitry Andric   if (FirstSPAdjustAmount) {
260*0fca6ea1SDimitry Andric     uint64_t SecondSPAdjustAmount = RealStackSize - FirstSPAdjustAmount;
261bdd1243dSDimitry Andric     assert(SecondSPAdjustAmount > 0 &&
262bdd1243dSDimitry Andric            "SecondSPAdjustAmount should be greater than zero");
263bdd1243dSDimitry Andric     adjustReg(MBB, MBBI, DL, SPReg, SPReg, -SecondSPAdjustAmount,
264bdd1243dSDimitry Andric               MachineInstr::FrameSetup);
265bdd1243dSDimitry Andric 
266*0fca6ea1SDimitry Andric     if (!hasFP(MF)) {
267bdd1243dSDimitry Andric       // If we are using a frame-pointer, and thus emitted ".cfi_def_cfa fp, 0",
268bdd1243dSDimitry Andric       // don't emit an sp-based .cfi_def_cfa_offset
269bdd1243dSDimitry Andric       // Emit ".cfi_def_cfa_offset RealStackSize"
270bdd1243dSDimitry Andric       unsigned CFIIndex = MF.addFrameInst(
271bdd1243dSDimitry Andric           MCCFIInstruction::cfiDefCfaOffset(nullptr, RealStackSize));
272bdd1243dSDimitry Andric       BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
273bdd1243dSDimitry Andric           .addCFIIndex(CFIIndex)
274bdd1243dSDimitry Andric           .setMIFlag(MachineInstr::FrameSetup);
275bdd1243dSDimitry Andric     }
276bdd1243dSDimitry Andric   }
277bdd1243dSDimitry Andric 
278bdd1243dSDimitry Andric   if (hasFP(MF)) {
279bdd1243dSDimitry Andric     // Realign stack.
280bdd1243dSDimitry Andric     if (RI->hasStackRealignment(MF)) {
2815f757f3fSDimitry Andric       unsigned Align = Log2(MFI.getMaxAlign());
2825f757f3fSDimitry Andric       assert(Align > 0 && "The stack realignment size is invalid!");
283bdd1243dSDimitry Andric       BuildMI(MBB, MBBI, DL,
2845f757f3fSDimitry Andric               TII->get(IsLA64 ? LoongArch::BSTRINS_D : LoongArch::BSTRINS_W),
2855f757f3fSDimitry Andric               SPReg)
286bdd1243dSDimitry Andric           .addReg(SPReg)
2875f757f3fSDimitry Andric           .addReg(LoongArch::R0)
2885f757f3fSDimitry Andric           .addImm(Align - 1)
2895f757f3fSDimitry Andric           .addImm(0)
290bdd1243dSDimitry Andric           .setMIFlag(MachineInstr::FrameSetup);
291bdd1243dSDimitry Andric       // FP will be used to restore the frame in the epilogue, so we need
292bdd1243dSDimitry Andric       // another base register BP to record SP after re-alignment. SP will
293bdd1243dSDimitry Andric       // track the current stack after allocating variable sized objects.
294bdd1243dSDimitry Andric       if (hasBP(MF)) {
295bdd1243dSDimitry Andric         // move BP, $sp
296bdd1243dSDimitry Andric         BuildMI(MBB, MBBI, DL, TII->get(LoongArch::OR),
297bdd1243dSDimitry Andric                 LoongArchABI::getBPReg())
298bdd1243dSDimitry Andric             .addReg(SPReg)
299bdd1243dSDimitry Andric             .addReg(LoongArch::R0)
300bdd1243dSDimitry Andric             .setMIFlag(MachineInstr::FrameSetup);
301bdd1243dSDimitry Andric       }
302bdd1243dSDimitry Andric     }
303bdd1243dSDimitry Andric   }
30481ad6265SDimitry Andric }
30581ad6265SDimitry Andric 
30681ad6265SDimitry Andric void LoongArchFrameLowering::emitEpilogue(MachineFunction &MF,
30781ad6265SDimitry Andric                                           MachineBasicBlock &MBB) const {
308753f127fSDimitry Andric   const LoongArchRegisterInfo *RI = STI.getRegisterInfo();
309753f127fSDimitry Andric   MachineFrameInfo &MFI = MF.getFrameInfo();
310bdd1243dSDimitry Andric   auto *LoongArchFI = MF.getInfo<LoongArchMachineFunctionInfo>();
311753f127fSDimitry Andric   Register SPReg = LoongArch::R3;
312bdd1243dSDimitry Andric   // All calls are tail calls in GHC calling conv, and functions have no
313bdd1243dSDimitry Andric   // prologue/epilogue.
314bdd1243dSDimitry Andric   if (MF.getFunction().getCallingConv() == CallingConv::GHC)
315bdd1243dSDimitry Andric     return;
316753f127fSDimitry Andric   MachineBasicBlock::iterator MBBI = MBB.getFirstTerminator();
317753f127fSDimitry Andric   DebugLoc DL = MBBI != MBB.end() ? MBBI->getDebugLoc() : DebugLoc();
318753f127fSDimitry Andric 
319753f127fSDimitry Andric   const auto &CSI = MFI.getCalleeSavedInfo();
320753f127fSDimitry Andric   // Skip to before the restores of callee-saved registers.
321753f127fSDimitry Andric   auto LastFrameDestroy = MBBI;
322753f127fSDimitry Andric   if (!CSI.empty())
323753f127fSDimitry Andric     LastFrameDestroy = std::prev(MBBI, CSI.size());
324753f127fSDimitry Andric 
325753f127fSDimitry Andric   // Get the number of bytes from FrameInfo.
326753f127fSDimitry Andric   uint64_t StackSize = MFI.getStackSize();
327753f127fSDimitry Andric 
328753f127fSDimitry Andric   // Restore the stack pointer.
329753f127fSDimitry Andric   if (RI->hasStackRealignment(MF) || MFI.hasVarSizedObjects()) {
330753f127fSDimitry Andric     assert(hasFP(MF) && "frame pointer should not have been eliminated");
331bdd1243dSDimitry Andric     adjustReg(MBB, LastFrameDestroy, DL, SPReg, LoongArch::R22,
332bdd1243dSDimitry Andric               -StackSize + LoongArchFI->getVarArgsSaveSize(),
333753f127fSDimitry Andric               MachineInstr::FrameDestroy);
334753f127fSDimitry Andric   }
335753f127fSDimitry Andric 
336bdd1243dSDimitry Andric   uint64_t FirstSPAdjustAmount = getFirstSPAdjustAmount(MF);
337bdd1243dSDimitry Andric   if (FirstSPAdjustAmount) {
338bdd1243dSDimitry Andric     uint64_t SecondSPAdjustAmount = StackSize - FirstSPAdjustAmount;
339bdd1243dSDimitry Andric     assert(SecondSPAdjustAmount > 0 &&
340bdd1243dSDimitry Andric            "SecondSPAdjustAmount should be greater than zero");
341bdd1243dSDimitry Andric 
342bdd1243dSDimitry Andric     adjustReg(MBB, LastFrameDestroy, DL, SPReg, SPReg, SecondSPAdjustAmount,
343bdd1243dSDimitry Andric               MachineInstr::FrameDestroy);
344bdd1243dSDimitry Andric     StackSize = FirstSPAdjustAmount;
345bdd1243dSDimitry Andric   }
346bdd1243dSDimitry Andric 
347753f127fSDimitry Andric   // Deallocate stack
348753f127fSDimitry Andric   adjustReg(MBB, MBBI, DL, SPReg, SPReg, StackSize, MachineInstr::FrameDestroy);
349753f127fSDimitry Andric }
350753f127fSDimitry Andric 
351bdd1243dSDimitry Andric // We would like to split the SP adjustment to reduce prologue/epilogue
352bdd1243dSDimitry Andric // as following instructions. In this way, the offset of the callee saved
353bdd1243dSDimitry Andric // register could fit in a single store.
354bdd1243dSDimitry Andric // e.g.
355bdd1243dSDimitry Andric //   addi.d  $sp, $sp, -2032
356bdd1243dSDimitry Andric //   st.d    $ra, $sp,  2024
357bdd1243dSDimitry Andric //   st.d    $fp, $sp,  2016
358bdd1243dSDimitry Andric //   addi.d  $sp, $sp,   -16
359*0fca6ea1SDimitry Andric uint64_t LoongArchFrameLowering::getFirstSPAdjustAmount(
360*0fca6ea1SDimitry Andric     const MachineFunction &MF) const {
361bdd1243dSDimitry Andric   const MachineFrameInfo &MFI = MF.getFrameInfo();
362bdd1243dSDimitry Andric   const std::vector<CalleeSavedInfo> &CSI = MFI.getCalleeSavedInfo();
363bdd1243dSDimitry Andric 
364bdd1243dSDimitry Andric   // Return the FirstSPAdjustAmount if the StackSize can not fit in a signed
365bdd1243dSDimitry Andric   // 12-bit and there exists a callee-saved register needing to be pushed.
366*0fca6ea1SDimitry Andric   if (!isInt<12>(MFI.getStackSize()) && (CSI.size() > 0)) {
367bdd1243dSDimitry Andric     // FirstSPAdjustAmount is chosen as (2048 - StackAlign) because 2048 will
368bdd1243dSDimitry Andric     // cause sp = sp + 2048 in the epilogue to be split into multiple
369bdd1243dSDimitry Andric     // instructions. Offsets smaller than 2048 can fit in a single load/store
370bdd1243dSDimitry Andric     // instruction, and we have to stick with the stack alignment.
371bdd1243dSDimitry Andric     // So (2048 - StackAlign) will satisfy the stack alignment.
372*0fca6ea1SDimitry Andric     return 2048 - getStackAlign().value();
373bdd1243dSDimitry Andric   }
374bdd1243dSDimitry Andric   return 0;
375bdd1243dSDimitry Andric }
376bdd1243dSDimitry Andric 
377753f127fSDimitry Andric void LoongArchFrameLowering::determineCalleeSaves(MachineFunction &MF,
378753f127fSDimitry Andric                                                   BitVector &SavedRegs,
379753f127fSDimitry Andric                                                   RegScavenger *RS) const {
380753f127fSDimitry Andric   TargetFrameLowering::determineCalleeSaves(MF, SavedRegs, RS);
381753f127fSDimitry Andric   // Unconditionally spill RA and FP only if the function uses a frame
382753f127fSDimitry Andric   // pointer.
383753f127fSDimitry Andric   if (hasFP(MF)) {
384753f127fSDimitry Andric     SavedRegs.set(LoongArch::R1);
385753f127fSDimitry Andric     SavedRegs.set(LoongArch::R22);
386753f127fSDimitry Andric   }
387753f127fSDimitry Andric   // Mark BP as used if function has dedicated base pointer.
388753f127fSDimitry Andric   if (hasBP(MF))
389753f127fSDimitry Andric     SavedRegs.set(LoongArchABI::getBPReg());
390753f127fSDimitry Andric }
391753f127fSDimitry Andric 
392bdd1243dSDimitry Andric // Do not preserve stack space within prologue for outgoing variables if the
393bdd1243dSDimitry Andric // function contains variable size objects.
394bdd1243dSDimitry Andric // Let eliminateCallFramePseudoInstr preserve stack space for it.
395bdd1243dSDimitry Andric bool LoongArchFrameLowering::hasReservedCallFrame(
396bdd1243dSDimitry Andric     const MachineFunction &MF) const {
397bdd1243dSDimitry Andric   return !MF.getFrameInfo().hasVarSizedObjects();
398bdd1243dSDimitry Andric }
399bdd1243dSDimitry Andric 
400bdd1243dSDimitry Andric // Eliminate ADJCALLSTACKDOWN, ADJCALLSTACKUP pseudo instructions.
401bdd1243dSDimitry Andric MachineBasicBlock::iterator
402bdd1243dSDimitry Andric LoongArchFrameLowering::eliminateCallFramePseudoInstr(
403bdd1243dSDimitry Andric     MachineFunction &MF, MachineBasicBlock &MBB,
404bdd1243dSDimitry Andric     MachineBasicBlock::iterator MI) const {
405bdd1243dSDimitry Andric   Register SPReg = LoongArch::R3;
406bdd1243dSDimitry Andric   DebugLoc DL = MI->getDebugLoc();
407bdd1243dSDimitry Andric 
408bdd1243dSDimitry Andric   if (!hasReservedCallFrame(MF)) {
409bdd1243dSDimitry Andric     // If space has not been reserved for a call frame, ADJCALLSTACKDOWN and
410bdd1243dSDimitry Andric     // ADJCALLSTACKUP must be converted to instructions manipulating the stack
411bdd1243dSDimitry Andric     // pointer. This is necessary when there is a variable length stack
412bdd1243dSDimitry Andric     // allocation (e.g. alloca), which means it's not possible to allocate
413bdd1243dSDimitry Andric     // space for outgoing arguments from within the function prologue.
414bdd1243dSDimitry Andric     int64_t Amount = MI->getOperand(0).getImm();
415bdd1243dSDimitry Andric 
416bdd1243dSDimitry Andric     if (Amount != 0) {
417bdd1243dSDimitry Andric       // Ensure the stack remains aligned after adjustment.
418bdd1243dSDimitry Andric       Amount = alignSPAdjust(Amount);
419bdd1243dSDimitry Andric 
420bdd1243dSDimitry Andric       if (MI->getOpcode() == LoongArch::ADJCALLSTACKDOWN)
421bdd1243dSDimitry Andric         Amount = -Amount;
422bdd1243dSDimitry Andric 
423bdd1243dSDimitry Andric       adjustReg(MBB, MI, DL, SPReg, SPReg, Amount, MachineInstr::NoFlags);
424bdd1243dSDimitry Andric     }
425bdd1243dSDimitry Andric   }
426bdd1243dSDimitry Andric 
427bdd1243dSDimitry Andric   return MBB.erase(MI);
428bdd1243dSDimitry Andric }
429bdd1243dSDimitry Andric 
430bdd1243dSDimitry Andric bool LoongArchFrameLowering::spillCalleeSavedRegisters(
431bdd1243dSDimitry Andric     MachineBasicBlock &MBB, MachineBasicBlock::iterator MI,
432bdd1243dSDimitry Andric     ArrayRef<CalleeSavedInfo> CSI, const TargetRegisterInfo *TRI) const {
433bdd1243dSDimitry Andric   if (CSI.empty())
434bdd1243dSDimitry Andric     return true;
435bdd1243dSDimitry Andric 
436bdd1243dSDimitry Andric   MachineFunction *MF = MBB.getParent();
437bdd1243dSDimitry Andric   const TargetInstrInfo &TII = *MF->getSubtarget().getInstrInfo();
438bdd1243dSDimitry Andric 
439bdd1243dSDimitry Andric   // Insert the spill to the stack frame.
440bdd1243dSDimitry Andric   for (auto &CS : CSI) {
441bdd1243dSDimitry Andric     Register Reg = CS.getReg();
442bdd1243dSDimitry Andric     // If the register is RA and the return address is taken by method
443bdd1243dSDimitry Andric     // LoongArchTargetLowering::lowerRETURNADDR, don't set kill flag.
444bdd1243dSDimitry Andric     bool IsKill =
445bdd1243dSDimitry Andric         !(Reg == LoongArch::R1 && MF->getFrameInfo().isReturnAddressTaken());
446bdd1243dSDimitry Andric     const TargetRegisterClass *RC = TRI->getMinimalPhysRegClass(Reg);
447bdd1243dSDimitry Andric     TII.storeRegToStackSlot(MBB, MI, Reg, IsKill, CS.getFrameIdx(), RC, TRI,
448bdd1243dSDimitry Andric                             Register());
449bdd1243dSDimitry Andric   }
450bdd1243dSDimitry Andric 
451bdd1243dSDimitry Andric   return true;
452bdd1243dSDimitry Andric }
453bdd1243dSDimitry Andric 
454753f127fSDimitry Andric StackOffset LoongArchFrameLowering::getFrameIndexReference(
455753f127fSDimitry Andric     const MachineFunction &MF, int FI, Register &FrameReg) const {
456753f127fSDimitry Andric   const MachineFrameInfo &MFI = MF.getFrameInfo();
457753f127fSDimitry Andric   const TargetRegisterInfo *RI = MF.getSubtarget().getRegisterInfo();
458bdd1243dSDimitry Andric   auto *LoongArchFI = MF.getInfo<LoongArchMachineFunctionInfo>();
459bdd1243dSDimitry Andric   uint64_t StackSize = MFI.getStackSize();
460bdd1243dSDimitry Andric   uint64_t FirstSPAdjustAmount = getFirstSPAdjustAmount(MF);
461753f127fSDimitry Andric 
462753f127fSDimitry Andric   // Callee-saved registers should be referenced relative to the stack
463753f127fSDimitry Andric   // pointer (positive offset), otherwise use the frame pointer (negative
464753f127fSDimitry Andric   // offset).
465753f127fSDimitry Andric   const auto &CSI = MFI.getCalleeSavedInfo();
466753f127fSDimitry Andric   int MinCSFI = 0;
467753f127fSDimitry Andric   int MaxCSFI = -1;
468753f127fSDimitry Andric   StackOffset Offset =
469753f127fSDimitry Andric       StackOffset::getFixed(MFI.getObjectOffset(FI) - getOffsetOfLocalArea() +
470753f127fSDimitry Andric                             MFI.getOffsetAdjustment());
471753f127fSDimitry Andric 
472753f127fSDimitry Andric   if (CSI.size()) {
473753f127fSDimitry Andric     MinCSFI = CSI[0].getFrameIdx();
474753f127fSDimitry Andric     MaxCSFI = CSI[CSI.size() - 1].getFrameIdx();
475753f127fSDimitry Andric   }
476753f127fSDimitry Andric 
477bdd1243dSDimitry Andric   if (FI >= MinCSFI && FI <= MaxCSFI) {
478753f127fSDimitry Andric     FrameReg = LoongArch::R3;
479bdd1243dSDimitry Andric     if (FirstSPAdjustAmount)
480bdd1243dSDimitry Andric       Offset += StackOffset::getFixed(FirstSPAdjustAmount);
481bdd1243dSDimitry Andric     else
482bdd1243dSDimitry Andric       Offset += StackOffset::getFixed(StackSize);
483bdd1243dSDimitry Andric   } else if (RI->hasStackRealignment(MF) && !MFI.isFixedObjectIndex(FI)) {
484bdd1243dSDimitry Andric     // If the stack was realigned, the frame pointer is set in order to allow
485bdd1243dSDimitry Andric     // SP to be restored, so we need another base register to record the stack
486bdd1243dSDimitry Andric     // after realignment.
487bdd1243dSDimitry Andric     FrameReg = hasBP(MF) ? LoongArchABI::getBPReg() : LoongArch::R3;
488bdd1243dSDimitry Andric     Offset += StackOffset::getFixed(StackSize);
489bdd1243dSDimitry Andric   } else {
490bdd1243dSDimitry Andric     FrameReg = RI->getFrameRegister(MF);
491bdd1243dSDimitry Andric     if (hasFP(MF))
492bdd1243dSDimitry Andric       Offset += StackOffset::getFixed(LoongArchFI->getVarArgsSaveSize());
493bdd1243dSDimitry Andric     else
494bdd1243dSDimitry Andric       Offset += StackOffset::getFixed(StackSize);
495753f127fSDimitry Andric   }
496753f127fSDimitry Andric 
497753f127fSDimitry Andric   return Offset;
49881ad6265SDimitry Andric }
49906c3fb27SDimitry Andric 
50006c3fb27SDimitry Andric bool LoongArchFrameLowering::enableShrinkWrapping(
50106c3fb27SDimitry Andric     const MachineFunction &MF) const {
50206c3fb27SDimitry Andric   // Keep the conventional code flow when not optimizing.
50306c3fb27SDimitry Andric   if (MF.getFunction().hasOptNone())
50406c3fb27SDimitry Andric     return false;
50506c3fb27SDimitry Andric 
50606c3fb27SDimitry Andric   return true;
50706c3fb27SDimitry Andric }
508