xref: /llvm-project/llvm/lib/CodeGen/GlobalISel/CallLowering.cpp (revision 392e0fcfd114374115c11c7f5399c20820fbb10b)
1 //===-- lib/CodeGen/GlobalISel/CallLowering.cpp - Call lowering -----------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 ///
9 /// \file
10 /// This file implements some simple delegations needed for call lowering.
11 ///
12 //===----------------------------------------------------------------------===//
13 
14 #include "llvm/CodeGen/Analysis.h"
15 #include "llvm/CodeGen/GlobalISel/CallLowering.h"
16 #include "llvm/CodeGen/GlobalISel/Utils.h"
17 #include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"
18 #include "llvm/CodeGen/MachineOperand.h"
19 #include "llvm/CodeGen/MachineRegisterInfo.h"
20 #include "llvm/CodeGen/TargetLowering.h"
21 #include "llvm/IR/DataLayout.h"
22 #include "llvm/IR/Instructions.h"
23 #include "llvm/IR/LLVMContext.h"
24 #include "llvm/IR/Module.h"
25 #include "llvm/Target/TargetMachine.h"
26 
27 #define DEBUG_TYPE "call-lowering"
28 
29 using namespace llvm;
30 
31 void CallLowering::anchor() {}
32 
33 /// Helper function which updates \p Flags when \p AttrFn returns true.
34 static void
35 addFlagsUsingAttrFn(ISD::ArgFlagsTy &Flags,
36                     const std::function<bool(Attribute::AttrKind)> &AttrFn) {
37   if (AttrFn(Attribute::SExt))
38     Flags.setSExt();
39   if (AttrFn(Attribute::ZExt))
40     Flags.setZExt();
41   if (AttrFn(Attribute::InReg))
42     Flags.setInReg();
43   if (AttrFn(Attribute::StructRet))
44     Flags.setSRet();
45   if (AttrFn(Attribute::Nest))
46     Flags.setNest();
47   if (AttrFn(Attribute::ByVal))
48     Flags.setByVal();
49   if (AttrFn(Attribute::Preallocated))
50     Flags.setPreallocated();
51   if (AttrFn(Attribute::InAlloca))
52     Flags.setInAlloca();
53   if (AttrFn(Attribute::Returned))
54     Flags.setReturned();
55   if (AttrFn(Attribute::SwiftSelf))
56     Flags.setSwiftSelf();
57   if (AttrFn(Attribute::SwiftError))
58     Flags.setSwiftError();
59 }
60 
61 ISD::ArgFlagsTy CallLowering::getAttributesForArgIdx(const CallBase &Call,
62                                                      unsigned ArgIdx) const {
63   ISD::ArgFlagsTy Flags;
64   addFlagsUsingAttrFn(Flags, [&Call, &ArgIdx](Attribute::AttrKind Attr) {
65     return Call.paramHasAttr(ArgIdx, Attr);
66   });
67   return Flags;
68 }
69 
70 void CallLowering::addArgFlagsFromAttributes(ISD::ArgFlagsTy &Flags,
71                                              const AttributeList &Attrs,
72                                              unsigned OpIdx) const {
73   addFlagsUsingAttrFn(Flags, [&Attrs, &OpIdx](Attribute::AttrKind Attr) {
74     return Attrs.hasAttribute(OpIdx, Attr);
75   });
76 }
77 
78 bool CallLowering::lowerCall(MachineIRBuilder &MIRBuilder, const CallBase &CB,
79                              ArrayRef<Register> ResRegs,
80                              ArrayRef<ArrayRef<Register>> ArgRegs,
81                              Register SwiftErrorVReg,
82                              std::function<unsigned()> GetCalleeReg) const {
83   CallLoweringInfo Info;
84   const DataLayout &DL = MIRBuilder.getDataLayout();
85   MachineFunction &MF = MIRBuilder.getMF();
86   bool CanBeTailCalled = CB.isTailCall() &&
87                          isInTailCallPosition(CB, MF.getTarget()) &&
88                          (MF.getFunction()
89                               .getFnAttribute("disable-tail-calls")
90                               .getValueAsString() != "true");
91 
92   CallingConv::ID CallConv = CB.getCallingConv();
93   Type *RetTy = CB.getType();
94   bool IsVarArg = CB.getFunctionType()->isVarArg();
95 
96   SmallVector<BaseArgInfo, 4> SplitArgs;
97   getReturnInfo(CallConv, RetTy, CB.getAttributes(), SplitArgs, DL);
98   Info.CanLowerReturn = canLowerReturn(MF, CallConv, SplitArgs, IsVarArg);
99 
100   if (!Info.CanLowerReturn) {
101     // Callee requires sret demotion.
102     insertSRetOutgoingArgument(MIRBuilder, CB, Info);
103 
104     // The sret demotion isn't compatible with tail-calls, since the sret
105     // argument points into the caller's stack frame.
106     CanBeTailCalled = false;
107   }
108 
109   // First step is to marshall all the function's parameters into the correct
110   // physregs and memory locations. Gather the sequence of argument types that
111   // we'll pass to the assigner function.
112   unsigned i = 0;
113   unsigned NumFixedArgs = CB.getFunctionType()->getNumParams();
114   for (auto &Arg : CB.args()) {
115     ArgInfo OrigArg{ArgRegs[i], Arg->getType(), getAttributesForArgIdx(CB, i),
116                     i < NumFixedArgs};
117     setArgFlags(OrigArg, i + AttributeList::FirstArgIndex, DL, CB);
118 
119     // If we have an explicit sret argument that is an Instruction, (i.e., it
120     // might point to function-local memory), we can't meaningfully tail-call.
121     if (OrigArg.Flags[0].isSRet() && isa<Instruction>(&Arg))
122       CanBeTailCalled = false;
123 
124     Info.OrigArgs.push_back(OrigArg);
125     ++i;
126   }
127 
128   // Try looking through a bitcast from one function type to another.
129   // Commonly happens with calls to objc_msgSend().
130   const Value *CalleeV = CB.getCalledOperand()->stripPointerCasts();
131   if (const Function *F = dyn_cast<Function>(CalleeV))
132     Info.Callee = MachineOperand::CreateGA(F, 0);
133   else
134     Info.Callee = MachineOperand::CreateReg(GetCalleeReg(), false);
135 
136   Info.OrigRet = ArgInfo{ResRegs, RetTy, ISD::ArgFlagsTy{}};
137   if (!Info.OrigRet.Ty->isVoidTy())
138     setArgFlags(Info.OrigRet, AttributeList::ReturnIndex, DL, CB);
139 
140   Info.KnownCallees = CB.getMetadata(LLVMContext::MD_callees);
141   Info.CallConv = CallConv;
142   Info.SwiftErrorVReg = SwiftErrorVReg;
143   Info.IsMustTailCall = CB.isMustTailCall();
144   Info.IsTailCall = CanBeTailCalled;
145   Info.IsVarArg = IsVarArg;
146   return lowerCall(MIRBuilder, Info);
147 }
148 
149 template <typename FuncInfoTy>
150 void CallLowering::setArgFlags(CallLowering::ArgInfo &Arg, unsigned OpIdx,
151                                const DataLayout &DL,
152                                const FuncInfoTy &FuncInfo) const {
153   auto &Flags = Arg.Flags[0];
154   const AttributeList &Attrs = FuncInfo.getAttributes();
155   addArgFlagsFromAttributes(Flags, Attrs, OpIdx);
156 
157   if (Flags.isByVal() || Flags.isInAlloca() || Flags.isPreallocated()) {
158     Type *ElementTy = cast<PointerType>(Arg.Ty)->getElementType();
159 
160     auto Ty = Attrs.getAttribute(OpIdx, Attribute::ByVal).getValueAsType();
161     Flags.setByValSize(DL.getTypeAllocSize(Ty ? Ty : ElementTy));
162 
163     // For ByVal, alignment should be passed from FE.  BE will guess if
164     // this info is not there but there are cases it cannot get right.
165     Align FrameAlign;
166     if (auto ParamAlign = FuncInfo.getParamAlign(OpIdx - 2))
167       FrameAlign = *ParamAlign;
168     else
169       FrameAlign = Align(getTLI()->getByValTypeAlignment(ElementTy, DL));
170     Flags.setByValAlign(FrameAlign);
171   }
172   Flags.setOrigAlign(DL.getABITypeAlign(Arg.Ty));
173 
174   // Don't try to use the returned attribute if the argument is marked as
175   // swiftself, since it won't be passed in x0.
176   if (Flags.isSwiftSelf())
177     Flags.setReturned(false);
178 }
179 
180 template void
181 CallLowering::setArgFlags<Function>(CallLowering::ArgInfo &Arg, unsigned OpIdx,
182                                     const DataLayout &DL,
183                                     const Function &FuncInfo) const;
184 
185 template void
186 CallLowering::setArgFlags<CallBase>(CallLowering::ArgInfo &Arg, unsigned OpIdx,
187                                     const DataLayout &DL,
188                                     const CallBase &FuncInfo) const;
189 
190 Register CallLowering::packRegs(ArrayRef<Register> SrcRegs, Type *PackedTy,
191                                 MachineIRBuilder &MIRBuilder) const {
192   assert(SrcRegs.size() > 1 && "Nothing to pack");
193 
194   const DataLayout &DL = MIRBuilder.getMF().getDataLayout();
195   MachineRegisterInfo *MRI = MIRBuilder.getMRI();
196 
197   LLT PackedLLT = getLLTForType(*PackedTy, DL);
198 
199   SmallVector<LLT, 8> LLTs;
200   SmallVector<uint64_t, 8> Offsets;
201   computeValueLLTs(DL, *PackedTy, LLTs, &Offsets);
202   assert(LLTs.size() == SrcRegs.size() && "Regs / types mismatch");
203 
204   Register Dst = MRI->createGenericVirtualRegister(PackedLLT);
205   MIRBuilder.buildUndef(Dst);
206   for (unsigned i = 0; i < SrcRegs.size(); ++i) {
207     Register NewDst = MRI->createGenericVirtualRegister(PackedLLT);
208     MIRBuilder.buildInsert(NewDst, Dst, SrcRegs[i], Offsets[i]);
209     Dst = NewDst;
210   }
211 
212   return Dst;
213 }
214 
215 void CallLowering::unpackRegs(ArrayRef<Register> DstRegs, Register SrcReg,
216                               Type *PackedTy,
217                               MachineIRBuilder &MIRBuilder) const {
218   assert(DstRegs.size() > 1 && "Nothing to unpack");
219 
220   const DataLayout &DL = MIRBuilder.getDataLayout();
221 
222   SmallVector<LLT, 8> LLTs;
223   SmallVector<uint64_t, 8> Offsets;
224   computeValueLLTs(DL, *PackedTy, LLTs, &Offsets);
225   assert(LLTs.size() == DstRegs.size() && "Regs / types mismatch");
226 
227   for (unsigned i = 0; i < DstRegs.size(); ++i)
228     MIRBuilder.buildExtract(DstRegs[i], SrcReg, Offsets[i]);
229 }
230 
231 bool CallLowering::handleAssignments(MachineIRBuilder &MIRBuilder,
232                                      SmallVectorImpl<ArgInfo> &Args,
233                                      ValueHandler &Handler,
234                                      CallingConv::ID CallConv, bool IsVarArg,
235                                      Register ThisReturnReg) const {
236   MachineFunction &MF = MIRBuilder.getMF();
237   const Function &F = MF.getFunction();
238   SmallVector<CCValAssign, 16> ArgLocs;
239 
240   CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs, F.getContext());
241   return handleAssignments(CCInfo, ArgLocs, MIRBuilder, Args, Handler,
242                            ThisReturnReg);
243 }
244 
245 bool CallLowering::handleAssignments(CCState &CCInfo,
246                                      SmallVectorImpl<CCValAssign> &ArgLocs,
247                                      MachineIRBuilder &MIRBuilder,
248                                      SmallVectorImpl<ArgInfo> &Args,
249                                      ValueHandler &Handler,
250                                      Register ThisReturnReg) const {
251   MachineFunction &MF = MIRBuilder.getMF();
252   const Function &F = MF.getFunction();
253   const DataLayout &DL = F.getParent()->getDataLayout();
254 
255   unsigned NumArgs = Args.size();
256   for (unsigned i = 0; i != NumArgs; ++i) {
257     EVT CurVT = EVT::getEVT(Args[i].Ty);
258     if (CurVT.isSimple() &&
259         !Handler.assignArg(i, CurVT.getSimpleVT(), CurVT.getSimpleVT(),
260                            CCValAssign::Full, Args[i], Args[i].Flags[0],
261                            CCInfo))
262       continue;
263 
264     MVT NewVT = TLI->getRegisterTypeForCallingConv(
265         F.getContext(), CCInfo.getCallingConv(), EVT(CurVT));
266 
267     // If we need to split the type over multiple regs, check it's a scenario
268     // we currently support.
269     unsigned NumParts = TLI->getNumRegistersForCallingConv(
270         F.getContext(), CCInfo.getCallingConv(), CurVT);
271 
272     if (NumParts == 1) {
273       // Try to use the register type if we couldn't assign the VT.
274       if (Handler.assignArg(i, NewVT, NewVT, CCValAssign::Full, Args[i],
275                             Args[i].Flags[0], CCInfo))
276         return false;
277       continue;
278     }
279 
280     assert(NumParts > 1);
281     // For now only handle exact splits.
282     if (NewVT.getSizeInBits() * NumParts != CurVT.getSizeInBits())
283       return false;
284 
285     // For incoming arguments (physregs to vregs), we could have values in
286     // physregs (or memlocs) which we want to extract and copy to vregs.
287     // During this, we might have to deal with the LLT being split across
288     // multiple regs, so we have to record this information for later.
289     //
290     // If we have outgoing args, then we have the opposite case. We have a
291     // vreg with an LLT which we want to assign to a physical location, and
292     // we might have to record that the value has to be split later.
293     if (Handler.isIncomingArgumentHandler()) {
294       // We're handling an incoming arg which is split over multiple regs.
295       // E.g. passing an s128 on AArch64.
296       ISD::ArgFlagsTy OrigFlags = Args[i].Flags[0];
297       Args[i].OrigRegs.push_back(Args[i].Regs[0]);
298       Args[i].Regs.clear();
299       Args[i].Flags.clear();
300       LLT NewLLT = getLLTForMVT(NewVT);
301       // For each split register, create and assign a vreg that will store
302       // the incoming component of the larger value. These will later be
303       // merged to form the final vreg.
304       for (unsigned Part = 0; Part < NumParts; ++Part) {
305         Register Reg =
306             MIRBuilder.getMRI()->createGenericVirtualRegister(NewLLT);
307         ISD::ArgFlagsTy Flags = OrigFlags;
308         if (Part == 0) {
309           Flags.setSplit();
310         } else {
311           Flags.setOrigAlign(Align(1));
312           if (Part == NumParts - 1)
313             Flags.setSplitEnd();
314         }
315         Args[i].Regs.push_back(Reg);
316         Args[i].Flags.push_back(Flags);
317         if (Handler.assignArg(i, NewVT, NewVT, CCValAssign::Full, Args[i],
318                               Args[i].Flags[Part], CCInfo)) {
319           // Still couldn't assign this smaller part type for some reason.
320           return false;
321         }
322       }
323     } else {
324       // This type is passed via multiple registers in the calling convention.
325       // We need to extract the individual parts.
326       Register LargeReg = Args[i].Regs[0];
327       LLT SmallTy = LLT::scalar(NewVT.getSizeInBits());
328       auto Unmerge = MIRBuilder.buildUnmerge(SmallTy, LargeReg);
329       assert(Unmerge->getNumOperands() == NumParts + 1);
330       ISD::ArgFlagsTy OrigFlags = Args[i].Flags[0];
331       // We're going to replace the regs and flags with the split ones.
332       Args[i].Regs.clear();
333       Args[i].Flags.clear();
334       for (unsigned PartIdx = 0; PartIdx < NumParts; ++PartIdx) {
335         ISD::ArgFlagsTy Flags = OrigFlags;
336         if (PartIdx == 0) {
337           Flags.setSplit();
338         } else {
339           Flags.setOrigAlign(Align(1));
340           if (PartIdx == NumParts - 1)
341             Flags.setSplitEnd();
342         }
343 
344         // TODO: Also check if there is a valid extension that preserves the
345         // bits. However currently this call lowering doesn't support non-exact
346         // split parts, so that can't be tested.
347         if (OrigFlags.isReturned() &&
348             (NumParts * NewVT.getSizeInBits() != CurVT.getSizeInBits())) {
349           Flags.setReturned(false);
350         }
351 
352         Args[i].Regs.push_back(Unmerge.getReg(PartIdx));
353         Args[i].Flags.push_back(Flags);
354         if (Handler.assignArg(i, NewVT, NewVT, CCValAssign::Full,
355                               Args[i], Args[i].Flags[PartIdx], CCInfo))
356           return false;
357       }
358     }
359   }
360 
361   for (unsigned i = 0, e = Args.size(), j = 0; i != e; ++i, ++j) {
362     assert(j < ArgLocs.size() && "Skipped too many arg locs");
363 
364     CCValAssign &VA = ArgLocs[j];
365     assert(VA.getValNo() == i && "Location doesn't correspond to current arg");
366 
367     if (VA.needsCustom()) {
368       unsigned NumArgRegs =
369           Handler.assignCustomValue(Args[i], makeArrayRef(ArgLocs).slice(j));
370       if (!NumArgRegs)
371         return false;
372       j += NumArgRegs;
373       continue;
374     }
375 
376     // FIXME: Pack registers if we have more than one.
377     Register ArgReg = Args[i].Regs[0];
378 
379     EVT OrigVT = EVT::getEVT(Args[i].Ty);
380     EVT VAVT = VA.getValVT();
381     const LLT OrigTy = getLLTForType(*Args[i].Ty, DL);
382 
383     // Expected to be multiple regs for a single incoming arg.
384     // There should be Regs.size() ArgLocs per argument.
385     unsigned NumArgRegs = Args[i].Regs.size();
386 
387     assert((j + (NumArgRegs - 1)) < ArgLocs.size() &&
388            "Too many regs for number of args");
389     for (unsigned Part = 0; Part < NumArgRegs; ++Part) {
390       // There should be Regs.size() ArgLocs per argument.
391       VA = ArgLocs[j + Part];
392       if (VA.isMemLoc()) {
393         // Individual pieces may have been spilled to the stack and others
394         // passed in registers.
395 
396         // FIXME: Use correct address space for pointer size
397         EVT LocVT = VA.getValVT();
398         unsigned MemSize = LocVT == MVT::iPTR ? DL.getPointerSize()
399                                               : LocVT.getStoreSize();
400         unsigned Offset = VA.getLocMemOffset();
401         MachinePointerInfo MPO;
402         Register StackAddr = Handler.getStackAddress(MemSize, Offset, MPO);
403         Handler.assignValueToAddress(Args[i], Part, StackAddr, MemSize, MPO,
404                                      VA);
405         continue;
406       }
407 
408       assert(VA.isRegLoc() && "custom loc should have been handled already");
409 
410       if (i == 0 && ThisReturnReg.isValid() &&
411           Handler.isIncomingArgumentHandler() &&
412           isTypeIsValidForThisReturn(VAVT)) {
413         Handler.assignValueToReg(Args[i].Regs[i], ThisReturnReg, VA);
414         continue;
415       }
416 
417       // GlobalISel does not currently work for scalable vectors.
418       if (OrigVT.getFixedSizeInBits() >= VAVT.getFixedSizeInBits() ||
419           !Handler.isIncomingArgumentHandler()) {
420         // This is an argument that might have been split. There should be
421         // Regs.size() ArgLocs per argument.
422 
423         // Insert the argument copies. If VAVT < OrigVT, we'll insert the merge
424         // to the original register after handling all of the parts.
425         Handler.assignValueToReg(Args[i].Regs[Part], VA.getLocReg(), VA);
426         continue;
427       }
428 
429       // This ArgLoc covers multiple pieces, so we need to split it.
430       const LLT VATy(VAVT.getSimpleVT());
431       Register NewReg =
432         MIRBuilder.getMRI()->createGenericVirtualRegister(VATy);
433       Handler.assignValueToReg(NewReg, VA.getLocReg(), VA);
434       // If it's a vector type, we either need to truncate the elements
435       // or do an unmerge to get the lower block of elements.
436       if (VATy.isVector() &&
437           VATy.getNumElements() > OrigVT.getVectorNumElements()) {
438         // Just handle the case where the VA type is 2 * original type.
439         if (VATy.getNumElements() != OrigVT.getVectorNumElements() * 2) {
440           LLVM_DEBUG(dbgs()
441                      << "Incoming promoted vector arg has too many elts");
442           return false;
443         }
444         auto Unmerge = MIRBuilder.buildUnmerge({OrigTy, OrigTy}, {NewReg});
445         MIRBuilder.buildCopy(ArgReg, Unmerge.getReg(0));
446       } else {
447         MIRBuilder.buildTrunc(ArgReg, {NewReg}).getReg(0);
448       }
449     }
450 
451     // Now that all pieces have been handled, re-pack any arguments into any
452     // wider, original registers.
453     if (Handler.isIncomingArgumentHandler()) {
454       if (VAVT.getFixedSizeInBits() < OrigVT.getFixedSizeInBits()) {
455         assert(NumArgRegs >= 2);
456 
457         // Merge the split registers into the expected larger result vreg
458         // of the original call.
459         MIRBuilder.buildMerge(Args[i].OrigRegs[0], Args[i].Regs);
460       }
461     }
462 
463     j += NumArgRegs - 1;
464   }
465 
466   return true;
467 }
468 
469 void CallLowering::insertSRetLoads(MachineIRBuilder &MIRBuilder, Type *RetTy,
470                                    ArrayRef<Register> VRegs, Register DemoteReg,
471                                    int FI) const {
472   MachineFunction &MF = MIRBuilder.getMF();
473   MachineRegisterInfo &MRI = MF.getRegInfo();
474   const DataLayout &DL = MF.getDataLayout();
475 
476   SmallVector<EVT, 4> SplitVTs;
477   SmallVector<uint64_t, 4> Offsets;
478   ComputeValueVTs(*TLI, DL, RetTy, SplitVTs, &Offsets, 0);
479 
480   assert(VRegs.size() == SplitVTs.size());
481 
482   unsigned NumValues = SplitVTs.size();
483   Align BaseAlign = DL.getPrefTypeAlign(RetTy);
484   Type *RetPtrTy = RetTy->getPointerTo(DL.getAllocaAddrSpace());
485   LLT OffsetLLTy = getLLTForType(*DL.getIntPtrType(RetPtrTy), DL);
486 
487   MachinePointerInfo PtrInfo = MachinePointerInfo::getFixedStack(MF, FI);
488 
489   for (unsigned I = 0; I < NumValues; ++I) {
490     Register Addr;
491     MIRBuilder.materializePtrAdd(Addr, DemoteReg, OffsetLLTy, Offsets[I]);
492     auto *MMO = MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOLoad,
493                                         MRI.getType(VRegs[I]).getSizeInBytes(),
494                                         commonAlignment(BaseAlign, Offsets[I]));
495     MIRBuilder.buildLoad(VRegs[I], Addr, *MMO);
496   }
497 }
498 
499 void CallLowering::insertSRetStores(MachineIRBuilder &MIRBuilder, Type *RetTy,
500                                     ArrayRef<Register> VRegs,
501                                     Register DemoteReg) const {
502   MachineFunction &MF = MIRBuilder.getMF();
503   MachineRegisterInfo &MRI = MF.getRegInfo();
504   const DataLayout &DL = MF.getDataLayout();
505 
506   SmallVector<EVT, 4> SplitVTs;
507   SmallVector<uint64_t, 4> Offsets;
508   ComputeValueVTs(*TLI, DL, RetTy, SplitVTs, &Offsets, 0);
509 
510   assert(VRegs.size() == SplitVTs.size());
511 
512   unsigned NumValues = SplitVTs.size();
513   Align BaseAlign = DL.getPrefTypeAlign(RetTy);
514   unsigned AS = DL.getAllocaAddrSpace();
515   LLT OffsetLLTy =
516       getLLTForType(*DL.getIntPtrType(RetTy->getPointerTo(AS)), DL);
517 
518   MachinePointerInfo PtrInfo(AS);
519 
520   for (unsigned I = 0; I < NumValues; ++I) {
521     Register Addr;
522     MIRBuilder.materializePtrAdd(Addr, DemoteReg, OffsetLLTy, Offsets[I]);
523     auto *MMO = MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOStore,
524                                         MRI.getType(VRegs[I]).getSizeInBytes(),
525                                         commonAlignment(BaseAlign, Offsets[I]));
526     MIRBuilder.buildStore(VRegs[I], Addr, *MMO);
527   }
528 }
529 
530 void CallLowering::insertSRetIncomingArgument(
531     const Function &F, SmallVectorImpl<ArgInfo> &SplitArgs, Register &DemoteReg,
532     MachineRegisterInfo &MRI, const DataLayout &DL) const {
533   unsigned AS = DL.getAllocaAddrSpace();
534   DemoteReg = MRI.createGenericVirtualRegister(
535       LLT::pointer(AS, DL.getPointerSizeInBits(AS)));
536 
537   Type *PtrTy = PointerType::get(F.getReturnType(), AS);
538 
539   SmallVector<EVT, 1> ValueVTs;
540   ComputeValueVTs(*TLI, DL, PtrTy, ValueVTs);
541 
542   // NOTE: Assume that a pointer won't get split into more than one VT.
543   assert(ValueVTs.size() == 1);
544 
545   ArgInfo DemoteArg(DemoteReg, ValueVTs[0].getTypeForEVT(PtrTy->getContext()));
546   setArgFlags(DemoteArg, AttributeList::ReturnIndex, DL, F);
547   DemoteArg.Flags[0].setSRet();
548   SplitArgs.insert(SplitArgs.begin(), DemoteArg);
549 }
550 
551 void CallLowering::insertSRetOutgoingArgument(MachineIRBuilder &MIRBuilder,
552                                               const CallBase &CB,
553                                               CallLoweringInfo &Info) const {
554   const DataLayout &DL = MIRBuilder.getDataLayout();
555   Type *RetTy = CB.getType();
556   unsigned AS = DL.getAllocaAddrSpace();
557   LLT FramePtrTy = LLT::pointer(AS, DL.getPointerSizeInBits(AS));
558 
559   int FI = MIRBuilder.getMF().getFrameInfo().CreateStackObject(
560       DL.getTypeAllocSize(RetTy), DL.getPrefTypeAlign(RetTy), false);
561 
562   Register DemoteReg = MIRBuilder.buildFrameIndex(FramePtrTy, FI).getReg(0);
563   ArgInfo DemoteArg(DemoteReg, PointerType::get(RetTy, AS));
564   setArgFlags(DemoteArg, AttributeList::ReturnIndex, DL, CB);
565   DemoteArg.Flags[0].setSRet();
566 
567   Info.OrigArgs.insert(Info.OrigArgs.begin(), DemoteArg);
568   Info.DemoteStackIndex = FI;
569   Info.DemoteRegister = DemoteReg;
570 }
571 
572 bool CallLowering::checkReturn(CCState &CCInfo,
573                                SmallVectorImpl<BaseArgInfo> &Outs,
574                                CCAssignFn *Fn) const {
575   for (unsigned I = 0, E = Outs.size(); I < E; ++I) {
576     MVT VT = MVT::getVT(Outs[I].Ty);
577     if (Fn(I, VT, VT, CCValAssign::Full, Outs[I].Flags[0], CCInfo))
578       return false;
579   }
580   return true;
581 }
582 
583 void CallLowering::getReturnInfo(CallingConv::ID CallConv, Type *RetTy,
584                                  AttributeList Attrs,
585                                  SmallVectorImpl<BaseArgInfo> &Outs,
586                                  const DataLayout &DL) const {
587   LLVMContext &Context = RetTy->getContext();
588   ISD::ArgFlagsTy Flags = ISD::ArgFlagsTy();
589 
590   SmallVector<EVT, 4> SplitVTs;
591   ComputeValueVTs(*TLI, DL, RetTy, SplitVTs);
592   addArgFlagsFromAttributes(Flags, Attrs, AttributeList::ReturnIndex);
593 
594   for (EVT VT : SplitVTs) {
595     unsigned NumParts =
596         TLI->getNumRegistersForCallingConv(Context, CallConv, VT);
597     MVT RegVT = TLI->getRegisterTypeForCallingConv(Context, CallConv, VT);
598     Type *PartTy = EVT(RegVT).getTypeForEVT(Context);
599 
600     for (unsigned I = 0; I < NumParts; ++I) {
601       Outs.emplace_back(PartTy, Flags);
602     }
603   }
604 }
605 
606 bool CallLowering::checkReturnTypeForCallConv(MachineFunction &MF) const {
607   const auto &F = MF.getFunction();
608   Type *ReturnType = F.getReturnType();
609   CallingConv::ID CallConv = F.getCallingConv();
610 
611   SmallVector<BaseArgInfo, 4> SplitArgs;
612   getReturnInfo(CallConv, ReturnType, F.getAttributes(), SplitArgs,
613                 MF.getDataLayout());
614   return canLowerReturn(MF, CallConv, SplitArgs, F.isVarArg());
615 }
616 
617 bool CallLowering::analyzeArgInfo(CCState &CCState,
618                                   SmallVectorImpl<ArgInfo> &Args,
619                                   CCAssignFn &AssignFnFixed,
620                                   CCAssignFn &AssignFnVarArg) const {
621   for (unsigned i = 0, e = Args.size(); i < e; ++i) {
622     MVT VT = MVT::getVT(Args[i].Ty);
623     CCAssignFn &Fn = Args[i].IsFixed ? AssignFnFixed : AssignFnVarArg;
624     if (Fn(i, VT, VT, CCValAssign::Full, Args[i].Flags[0], CCState)) {
625       // Bail out on anything we can't handle.
626       LLVM_DEBUG(dbgs() << "Cannot analyze " << EVT(VT).getEVTString()
627                         << " (arg number = " << i << "\n");
628       return false;
629     }
630   }
631   return true;
632 }
633 
634 bool CallLowering::parametersInCSRMatch(
635     const MachineRegisterInfo &MRI, const uint32_t *CallerPreservedMask,
636     const SmallVectorImpl<CCValAssign> &OutLocs,
637     const SmallVectorImpl<ArgInfo> &OutArgs) const {
638   for (unsigned i = 0; i < OutLocs.size(); ++i) {
639     auto &ArgLoc = OutLocs[i];
640     // If it's not a register, it's fine.
641     if (!ArgLoc.isRegLoc())
642       continue;
643 
644     MCRegister PhysReg = ArgLoc.getLocReg();
645 
646     // Only look at callee-saved registers.
647     if (MachineOperand::clobbersPhysReg(CallerPreservedMask, PhysReg))
648       continue;
649 
650     LLVM_DEBUG(
651         dbgs()
652         << "... Call has an argument passed in a callee-saved register.\n");
653 
654     // Check if it was copied from.
655     const ArgInfo &OutInfo = OutArgs[i];
656 
657     if (OutInfo.Regs.size() > 1) {
658       LLVM_DEBUG(
659           dbgs() << "... Cannot handle arguments in multiple registers.\n");
660       return false;
661     }
662 
663     // Check if we copy the register, walking through copies from virtual
664     // registers. Note that getDefIgnoringCopies does not ignore copies from
665     // physical registers.
666     MachineInstr *RegDef = getDefIgnoringCopies(OutInfo.Regs[0], MRI);
667     if (!RegDef || RegDef->getOpcode() != TargetOpcode::COPY) {
668       LLVM_DEBUG(
669           dbgs()
670           << "... Parameter was not copied into a VReg, cannot tail call.\n");
671       return false;
672     }
673 
674     // Got a copy. Verify that it's the same as the register we want.
675     Register CopyRHS = RegDef->getOperand(1).getReg();
676     if (CopyRHS != PhysReg) {
677       LLVM_DEBUG(dbgs() << "... Callee-saved register was not copied into "
678                            "VReg, cannot tail call.\n");
679       return false;
680     }
681   }
682 
683   return true;
684 }
685 
686 bool CallLowering::resultsCompatible(CallLoweringInfo &Info,
687                                      MachineFunction &MF,
688                                      SmallVectorImpl<ArgInfo> &InArgs,
689                                      CCAssignFn &CalleeAssignFnFixed,
690                                      CCAssignFn &CalleeAssignFnVarArg,
691                                      CCAssignFn &CallerAssignFnFixed,
692                                      CCAssignFn &CallerAssignFnVarArg) const {
693   const Function &F = MF.getFunction();
694   CallingConv::ID CalleeCC = Info.CallConv;
695   CallingConv::ID CallerCC = F.getCallingConv();
696 
697   if (CallerCC == CalleeCC)
698     return true;
699 
700   SmallVector<CCValAssign, 16> ArgLocs1;
701   CCState CCInfo1(CalleeCC, false, MF, ArgLocs1, F.getContext());
702   if (!analyzeArgInfo(CCInfo1, InArgs, CalleeAssignFnFixed,
703                       CalleeAssignFnVarArg))
704     return false;
705 
706   SmallVector<CCValAssign, 16> ArgLocs2;
707   CCState CCInfo2(CallerCC, false, MF, ArgLocs2, F.getContext());
708   if (!analyzeArgInfo(CCInfo2, InArgs, CallerAssignFnFixed,
709                       CalleeAssignFnVarArg))
710     return false;
711 
712   // We need the argument locations to match up exactly. If there's more in
713   // one than the other, then we are done.
714   if (ArgLocs1.size() != ArgLocs2.size())
715     return false;
716 
717   // Make sure that each location is passed in exactly the same way.
718   for (unsigned i = 0, e = ArgLocs1.size(); i < e; ++i) {
719     const CCValAssign &Loc1 = ArgLocs1[i];
720     const CCValAssign &Loc2 = ArgLocs2[i];
721 
722     // We need both of them to be the same. So if one is a register and one
723     // isn't, we're done.
724     if (Loc1.isRegLoc() != Loc2.isRegLoc())
725       return false;
726 
727     if (Loc1.isRegLoc()) {
728       // If they don't have the same register location, we're done.
729       if (Loc1.getLocReg() != Loc2.getLocReg())
730         return false;
731 
732       // They matched, so we can move to the next ArgLoc.
733       continue;
734     }
735 
736     // Loc1 wasn't a RegLoc, so they both must be MemLocs. Check if they match.
737     if (Loc1.getLocMemOffset() != Loc2.getLocMemOffset())
738       return false;
739   }
740 
741   return true;
742 }
743 
744 Register CallLowering::ValueHandler::extendRegister(Register ValReg,
745                                                     CCValAssign &VA,
746                                                     unsigned MaxSizeBits) {
747   LLT LocTy{VA.getLocVT()};
748   LLT ValTy = MRI.getType(ValReg);
749   if (LocTy.getSizeInBits() == ValTy.getSizeInBits())
750     return ValReg;
751 
752   if (LocTy.isScalar() && MaxSizeBits && MaxSizeBits < LocTy.getSizeInBits()) {
753     if (MaxSizeBits <= ValTy.getSizeInBits())
754       return ValReg;
755     LocTy = LLT::scalar(MaxSizeBits);
756   }
757 
758   switch (VA.getLocInfo()) {
759   default: break;
760   case CCValAssign::Full:
761   case CCValAssign::BCvt:
762     // FIXME: bitconverting between vector types may or may not be a
763     // nop in big-endian situations.
764     return ValReg;
765   case CCValAssign::AExt: {
766     auto MIB = MIRBuilder.buildAnyExt(LocTy, ValReg);
767     return MIB.getReg(0);
768   }
769   case CCValAssign::SExt: {
770     Register NewReg = MRI.createGenericVirtualRegister(LocTy);
771     MIRBuilder.buildSExt(NewReg, ValReg);
772     return NewReg;
773   }
774   case CCValAssign::ZExt: {
775     Register NewReg = MRI.createGenericVirtualRegister(LocTy);
776     MIRBuilder.buildZExt(NewReg, ValReg);
777     return NewReg;
778   }
779   }
780   llvm_unreachable("unable to extend register");
781 }
782 
783 void CallLowering::ValueHandler::anchor() {}
784