1 //===-- lib/CodeGen/GlobalISel/CallLowering.cpp - Call lowering -----------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 ///
9 /// \file
10 /// This file implements some simple delegations needed for call lowering.
11 ///
12 //===----------------------------------------------------------------------===//
13 
14 #include "llvm/CodeGen/Analysis.h"
15 #include "llvm/CodeGen/GlobalISel/CallLowering.h"
16 #include "llvm/CodeGen/GlobalISel/Utils.h"
17 #include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"
18 #include "llvm/CodeGen/MachineOperand.h"
19 #include "llvm/CodeGen/MachineRegisterInfo.h"
20 #include "llvm/CodeGen/TargetLowering.h"
21 #include "llvm/IR/DataLayout.h"
22 #include "llvm/IR/Instructions.h"
23 #include "llvm/IR/LLVMContext.h"
24 #include "llvm/IR/Module.h"
25 #include "llvm/Target/TargetMachine.h"
26 
27 #define DEBUG_TYPE "call-lowering"
28 
29 using namespace llvm;
30 
31 void CallLowering::anchor() {}
32 
33 /// Helper function which updates \p Flags when \p AttrFn returns true.
34 static void
35 addFlagsUsingAttrFn(ISD::ArgFlagsTy &Flags,
36                     const std::function<bool(Attribute::AttrKind)> &AttrFn) {
37   if (AttrFn(Attribute::SExt))
38     Flags.setSExt();
39   if (AttrFn(Attribute::ZExt))
40     Flags.setZExt();
41   if (AttrFn(Attribute::InReg))
42     Flags.setInReg();
43   if (AttrFn(Attribute::StructRet))
44     Flags.setSRet();
45   if (AttrFn(Attribute::Nest))
46     Flags.setNest();
47   if (AttrFn(Attribute::ByVal))
48     Flags.setByVal();
49   if (AttrFn(Attribute::Preallocated))
50     Flags.setPreallocated();
51   if (AttrFn(Attribute::InAlloca))
52     Flags.setInAlloca();
53   if (AttrFn(Attribute::Returned))
54     Flags.setReturned();
55   if (AttrFn(Attribute::SwiftSelf))
56     Flags.setSwiftSelf();
57   if (AttrFn(Attribute::SwiftError))
58     Flags.setSwiftError();
59 }
60 
61 ISD::ArgFlagsTy CallLowering::getAttributesForArgIdx(const CallBase &Call,
62                                                      unsigned ArgIdx) const {
63   ISD::ArgFlagsTy Flags;
64   addFlagsUsingAttrFn(Flags, [&Call, &ArgIdx](Attribute::AttrKind Attr) {
65     return Call.paramHasAttr(ArgIdx, Attr);
66   });
67   return Flags;
68 }
69 
70 void CallLowering::addArgFlagsFromAttributes(ISD::ArgFlagsTy &Flags,
71                                              const AttributeList &Attrs,
72                                              unsigned OpIdx) const {
73   addFlagsUsingAttrFn(Flags, [&Attrs, &OpIdx](Attribute::AttrKind Attr) {
74     return Attrs.hasAttribute(OpIdx, Attr);
75   });
76 }
77 
78 bool CallLowering::lowerCall(MachineIRBuilder &MIRBuilder, const CallBase &CB,
79                              ArrayRef<Register> ResRegs,
80                              ArrayRef<ArrayRef<Register>> ArgRegs,
81                              Register SwiftErrorVReg,
82                              std::function<unsigned()> GetCalleeReg) const {
83   CallLoweringInfo Info;
84   const DataLayout &DL = MIRBuilder.getDataLayout();
85   MachineFunction &MF = MIRBuilder.getMF();
86   bool CanBeTailCalled = CB.isTailCall() &&
87                          isInTailCallPosition(CB, MF.getTarget()) &&
88                          (MF.getFunction()
89                               .getFnAttribute("disable-tail-calls")
90                               .getValueAsString() != "true");
91 
92   CallingConv::ID CallConv = CB.getCallingConv();
93   Type *RetTy = CB.getType();
94   bool IsVarArg = CB.getFunctionType()->isVarArg();
95 
96   SmallVector<BaseArgInfo, 4> SplitArgs;
97   getReturnInfo(CallConv, RetTy, CB.getAttributes(), SplitArgs, DL);
98   Info.CanLowerReturn = canLowerReturn(MF, CallConv, SplitArgs, IsVarArg);
99 
100   if (!Info.CanLowerReturn) {
101     // Callee requires sret demotion.
102     insertSRetOutgoingArgument(MIRBuilder, CB, Info);
103 
104     // The sret demotion isn't compatible with tail-calls, since the sret
105     // argument points into the caller's stack frame.
106     CanBeTailCalled = false;
107   }
108 
109   // First step is to marshall all the function's parameters into the correct
110   // physregs and memory locations. Gather the sequence of argument types that
111   // we'll pass to the assigner function.
112   unsigned i = 0;
113   unsigned NumFixedArgs = CB.getFunctionType()->getNumParams();
114   for (auto &Arg : CB.args()) {
115     ArgInfo OrigArg{ArgRegs[i], Arg->getType(), getAttributesForArgIdx(CB, i),
116                     i < NumFixedArgs};
117     setArgFlags(OrigArg, i + AttributeList::FirstArgIndex, DL, CB);
118 
119     // If we have an explicit sret argument that is an Instruction, (i.e., it
120     // might point to function-local memory), we can't meaningfully tail-call.
121     if (OrigArg.Flags[0].isSRet() && isa<Instruction>(&Arg))
122       CanBeTailCalled = false;
123 
124     Info.OrigArgs.push_back(OrigArg);
125     ++i;
126   }
127 
128   // Try looking through a bitcast from one function type to another.
129   // Commonly happens with calls to objc_msgSend().
130   const Value *CalleeV = CB.getCalledOperand()->stripPointerCasts();
131   if (const Function *F = dyn_cast<Function>(CalleeV))
132     Info.Callee = MachineOperand::CreateGA(F, 0);
133   else
134     Info.Callee = MachineOperand::CreateReg(GetCalleeReg(), false);
135 
136   Info.OrigRet = ArgInfo{ResRegs, RetTy, ISD::ArgFlagsTy{}};
137   if (!Info.OrigRet.Ty->isVoidTy())
138     setArgFlags(Info.OrigRet, AttributeList::ReturnIndex, DL, CB);
139 
140   Info.KnownCallees = CB.getMetadata(LLVMContext::MD_callees);
141   Info.CallConv = CallConv;
142   Info.SwiftErrorVReg = SwiftErrorVReg;
143   Info.IsMustTailCall = CB.isMustTailCall();
144   Info.IsTailCall = CanBeTailCalled;
145   Info.IsVarArg = IsVarArg;
146   return lowerCall(MIRBuilder, Info);
147 }
148 
149 template <typename FuncInfoTy>
150 void CallLowering::setArgFlags(CallLowering::ArgInfo &Arg, unsigned OpIdx,
151                                const DataLayout &DL,
152                                const FuncInfoTy &FuncInfo) const {
153   auto &Flags = Arg.Flags[0];
154   const AttributeList &Attrs = FuncInfo.getAttributes();
155   addArgFlagsFromAttributes(Flags, Attrs, OpIdx);
156 
157   if (Flags.isByVal() || Flags.isInAlloca() || Flags.isPreallocated()) {
158     Type *ElementTy = cast<PointerType>(Arg.Ty)->getElementType();
159 
160     auto Ty = Attrs.getAttribute(OpIdx, Attribute::ByVal).getValueAsType();
161     Flags.setByValSize(DL.getTypeAllocSize(Ty ? Ty : ElementTy));
162 
163     // For ByVal, alignment should be passed from FE.  BE will guess if
164     // this info is not there but there are cases it cannot get right.
165     Align FrameAlign;
166     if (auto ParamAlign = FuncInfo.getParamAlign(OpIdx - 2))
167       FrameAlign = *ParamAlign;
168     else
169       FrameAlign = Align(getTLI()->getByValTypeAlignment(ElementTy, DL));
170     Flags.setByValAlign(FrameAlign);
171   }
172   Flags.setOrigAlign(DL.getABITypeAlign(Arg.Ty));
173 
174   // Don't try to use the returned attribute if the argument is marked as
175   // swiftself, since it won't be passed in x0.
176   if (Flags.isSwiftSelf())
177     Flags.setReturned(false);
178 }
179 
180 template void
181 CallLowering::setArgFlags<Function>(CallLowering::ArgInfo &Arg, unsigned OpIdx,
182                                     const DataLayout &DL,
183                                     const Function &FuncInfo) const;
184 
185 template void
186 CallLowering::setArgFlags<CallBase>(CallLowering::ArgInfo &Arg, unsigned OpIdx,
187                                     const DataLayout &DL,
188                                     const CallBase &FuncInfo) const;
189 
190 Register CallLowering::packRegs(ArrayRef<Register> SrcRegs, Type *PackedTy,
191                                 MachineIRBuilder &MIRBuilder) const {
192   assert(SrcRegs.size() > 1 && "Nothing to pack");
193 
194   const DataLayout &DL = MIRBuilder.getMF().getDataLayout();
195   MachineRegisterInfo *MRI = MIRBuilder.getMRI();
196 
197   LLT PackedLLT = getLLTForType(*PackedTy, DL);
198 
199   SmallVector<LLT, 8> LLTs;
200   SmallVector<uint64_t, 8> Offsets;
201   computeValueLLTs(DL, *PackedTy, LLTs, &Offsets);
202   assert(LLTs.size() == SrcRegs.size() && "Regs / types mismatch");
203 
204   Register Dst = MRI->createGenericVirtualRegister(PackedLLT);
205   MIRBuilder.buildUndef(Dst);
206   for (unsigned i = 0; i < SrcRegs.size(); ++i) {
207     Register NewDst = MRI->createGenericVirtualRegister(PackedLLT);
208     MIRBuilder.buildInsert(NewDst, Dst, SrcRegs[i], Offsets[i]);
209     Dst = NewDst;
210   }
211 
212   return Dst;
213 }
214 
215 void CallLowering::unpackRegs(ArrayRef<Register> DstRegs, Register SrcReg,
216                               Type *PackedTy,
217                               MachineIRBuilder &MIRBuilder) const {
218   assert(DstRegs.size() > 1 && "Nothing to unpack");
219 
220   const DataLayout &DL = MIRBuilder.getDataLayout();
221 
222   SmallVector<LLT, 8> LLTs;
223   SmallVector<uint64_t, 8> Offsets;
224   computeValueLLTs(DL, *PackedTy, LLTs, &Offsets);
225   assert(LLTs.size() == DstRegs.size() && "Regs / types mismatch");
226 
227   for (unsigned i = 0; i < DstRegs.size(); ++i)
228     MIRBuilder.buildExtract(DstRegs[i], SrcReg, Offsets[i]);
229 }
230 
231 bool CallLowering::handleAssignments(MachineIRBuilder &MIRBuilder,
232                                      SmallVectorImpl<ArgInfo> &Args,
233                                      ValueHandler &Handler,
234                                      CallingConv::ID CallConv, bool IsVarArg,
235                                      Register ThisReturnReg) const {
236   MachineFunction &MF = MIRBuilder.getMF();
237   const Function &F = MF.getFunction();
238   SmallVector<CCValAssign, 16> ArgLocs;
239 
240   CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs, F.getContext());
241   return handleAssignments(CCInfo, ArgLocs, MIRBuilder, Args, Handler,
242                            ThisReturnReg);
243 }
244 
245 bool CallLowering::handleAssignments(CCState &CCInfo,
246                                      SmallVectorImpl<CCValAssign> &ArgLocs,
247                                      MachineIRBuilder &MIRBuilder,
248                                      SmallVectorImpl<ArgInfo> &Args,
249                                      ValueHandler &Handler,
250                                      Register ThisReturnReg) const {
251   MachineFunction &MF = MIRBuilder.getMF();
252   const Function &F = MF.getFunction();
253   const DataLayout &DL = F.getParent()->getDataLayout();
254 
255   unsigned NumArgs = Args.size();
256   for (unsigned i = 0; i != NumArgs; ++i) {
257     EVT CurVT = EVT::getEVT(Args[i].Ty);
258     if (CurVT.isSimple() &&
259         !Handler.assignArg(i, CurVT.getSimpleVT(), CurVT.getSimpleVT(),
260                            CCValAssign::Full, Args[i], Args[i].Flags[0],
261                            CCInfo))
262       continue;
263 
264     MVT NewVT = TLI->getRegisterTypeForCallingConv(
265         F.getContext(), CCInfo.getCallingConv(), EVT(CurVT));
266 
267     // If we need to split the type over multiple regs, check it's a scenario
268     // we currently support.
269     unsigned NumParts = TLI->getNumRegistersForCallingConv(
270         F.getContext(), CCInfo.getCallingConv(), CurVT);
271 
272     if (NumParts == 1) {
273       // Try to use the register type if we couldn't assign the VT.
274       if (Handler.assignArg(i, NewVT, NewVT, CCValAssign::Full, Args[i],
275                             Args[i].Flags[0], CCInfo))
276         return false;
277       continue;
278     }
279 
280     assert(NumParts > 1);
281     // For now only handle exact splits.
282     if (NewVT.getSizeInBits() * NumParts != CurVT.getSizeInBits())
283       return false;
284 
285     // For incoming arguments (physregs to vregs), we could have values in
286     // physregs (or memlocs) which we want to extract and copy to vregs.
287     // During this, we might have to deal with the LLT being split across
288     // multiple regs, so we have to record this information for later.
289     //
290     // If we have outgoing args, then we have the opposite case. We have a
291     // vreg with an LLT which we want to assign to a physical location, and
292     // we might have to record that the value has to be split later.
293     if (Handler.isIncomingArgumentHandler()) {
294       // We're handling an incoming arg which is split over multiple regs.
295       // E.g. passing an s128 on AArch64.
296       ISD::ArgFlagsTy OrigFlags = Args[i].Flags[0];
297       Args[i].OrigRegs.push_back(Args[i].Regs[0]);
298       Args[i].Regs.clear();
299       Args[i].Flags.clear();
300       LLT NewLLT = getLLTForMVT(NewVT);
301       // For each split register, create and assign a vreg that will store
302       // the incoming component of the larger value. These will later be
303       // merged to form the final vreg.
304       for (unsigned Part = 0; Part < NumParts; ++Part) {
305         Register Reg =
306             MIRBuilder.getMRI()->createGenericVirtualRegister(NewLLT);
307         ISD::ArgFlagsTy Flags = OrigFlags;
308         if (Part == 0) {
309           Flags.setSplit();
310         } else {
311           Flags.setOrigAlign(Align(1));
312           if (Part == NumParts - 1)
313             Flags.setSplitEnd();
314         }
315         Args[i].Regs.push_back(Reg);
316         Args[i].Flags.push_back(Flags);
317         if (Handler.assignArg(i, NewVT, NewVT, CCValAssign::Full, Args[i],
318                               Args[i].Flags[Part], CCInfo)) {
319           // Still couldn't assign this smaller part type for some reason.
320           return false;
321         }
322       }
323     } else {
324       // This type is passed via multiple registers in the calling convention.
325       // We need to extract the individual parts.
326       Register LargeReg = Args[i].Regs[0];
327       LLT SmallTy = LLT::scalar(NewVT.getSizeInBits());
328       auto Unmerge = MIRBuilder.buildUnmerge(SmallTy, LargeReg);
329       assert(Unmerge->getNumOperands() == NumParts + 1);
330       ISD::ArgFlagsTy OrigFlags = Args[i].Flags[0];
331       // We're going to replace the regs and flags with the split ones.
332       Args[i].Regs.clear();
333       Args[i].Flags.clear();
334       for (unsigned PartIdx = 0; PartIdx < NumParts; ++PartIdx) {
335         ISD::ArgFlagsTy Flags = OrigFlags;
336         if (PartIdx == 0) {
337           Flags.setSplit();
338         } else {
339           Flags.setOrigAlign(Align(1));
340           if (PartIdx == NumParts - 1)
341             Flags.setSplitEnd();
342         }
343 
344         // TODO: Also check if there is a valid extension that preserves the
345         // bits. However currently this call lowering doesn't support non-exact
346         // split parts, so that can't be tested.
347         if (OrigFlags.isReturned() &&
348             (NumParts * NewVT.getSizeInBits() != CurVT.getSizeInBits())) {
349           Flags.setReturned(false);
350         }
351 
352         Args[i].Regs.push_back(Unmerge.getReg(PartIdx));
353         Args[i].Flags.push_back(Flags);
354         if (Handler.assignArg(i, NewVT, NewVT, CCValAssign::Full,
355                               Args[i], Args[i].Flags[PartIdx], CCInfo))
356           return false;
357       }
358     }
359   }
360 
361   for (unsigned i = 0, e = Args.size(), j = 0; i != e; ++i, ++j) {
362     assert(j < ArgLocs.size() && "Skipped too many arg locs");
363 
364     CCValAssign &VA = ArgLocs[j];
365     assert(VA.getValNo() == i && "Location doesn't correspond to current arg");
366 
367     if (VA.needsCustom()) {
368       unsigned NumArgRegs =
369           Handler.assignCustomValue(Args[i], makeArrayRef(ArgLocs).slice(j));
370       if (!NumArgRegs)
371         return false;
372       j += NumArgRegs;
373       continue;
374     }
375 
376     // FIXME: Pack registers if we have more than one.
377     Register ArgReg = Args[i].Regs[0];
378 
379     EVT OrigVT = EVT::getEVT(Args[i].Ty);
380     EVT VAVT = VA.getValVT();
381     const LLT OrigTy = getLLTForType(*Args[i].Ty, DL);
382 
383     // Expected to be multiple regs for a single incoming arg.
384     // There should be Regs.size() ArgLocs per argument.
385     unsigned NumArgRegs = Args[i].Regs.size();
386 
387     assert((j + (NumArgRegs - 1)) < ArgLocs.size() &&
388            "Too many regs for number of args");
389     for (unsigned Part = 0; Part < NumArgRegs; ++Part) {
390       // There should be Regs.size() ArgLocs per argument.
391       VA = ArgLocs[j + Part];
392       if (VA.isMemLoc()) {
393         // Don't currently support loading/storing a type that needs to be split
394         // to the stack. Should be easy, just not implemented yet.
395         if (NumArgRegs > 1) {
396           LLVM_DEBUG(
397             dbgs()
398             << "Load/store a split arg to/from the stack not implemented yet\n");
399           return false;
400         }
401 
402         // FIXME: Use correct address space for pointer size
403         EVT LocVT = VA.getValVT();
404         unsigned MemSize = LocVT == MVT::iPTR ? DL.getPointerSize()
405                                               : LocVT.getStoreSize();
406         unsigned Offset = VA.getLocMemOffset();
407         MachinePointerInfo MPO;
408         Register StackAddr = Handler.getStackAddress(MemSize, Offset, MPO);
409         Handler.assignValueToAddress(Args[i], StackAddr,
410                                      MemSize, MPO, VA);
411         continue;
412       }
413 
414       assert(VA.isRegLoc() && "custom loc should have been handled already");
415 
416       if (i == 0 && ThisReturnReg.isValid() &&
417           Handler.isIncomingArgumentHandler() &&
418           isTypeIsValidForThisReturn(VAVT)) {
419         Handler.assignValueToReg(Args[i].Regs[i], ThisReturnReg, VA);
420         continue;
421       }
422 
423       // GlobalISel does not currently work for scalable vectors.
424       if (OrigVT.getFixedSizeInBits() >= VAVT.getFixedSizeInBits() ||
425           !Handler.isIncomingArgumentHandler()) {
426         // This is an argument that might have been split. There should be
427         // Regs.size() ArgLocs per argument.
428 
429         // Insert the argument copies. If VAVT < OrigVT, we'll insert the merge
430         // to the original register after handling all of the parts.
431         Handler.assignValueToReg(Args[i].Regs[Part], VA.getLocReg(), VA);
432         continue;
433       }
434 
435       // This ArgLoc covers multiple pieces, so we need to split it.
436       const LLT VATy(VAVT.getSimpleVT());
437       Register NewReg =
438         MIRBuilder.getMRI()->createGenericVirtualRegister(VATy);
439       Handler.assignValueToReg(NewReg, VA.getLocReg(), VA);
440       // If it's a vector type, we either need to truncate the elements
441       // or do an unmerge to get the lower block of elements.
442       if (VATy.isVector() &&
443           VATy.getNumElements() > OrigVT.getVectorNumElements()) {
444         // Just handle the case where the VA type is 2 * original type.
445         if (VATy.getNumElements() != OrigVT.getVectorNumElements() * 2) {
446           LLVM_DEBUG(dbgs()
447                      << "Incoming promoted vector arg has too many elts");
448           return false;
449         }
450         auto Unmerge = MIRBuilder.buildUnmerge({OrigTy, OrigTy}, {NewReg});
451         MIRBuilder.buildCopy(ArgReg, Unmerge.getReg(0));
452       } else {
453         MIRBuilder.buildTrunc(ArgReg, {NewReg}).getReg(0);
454       }
455     }
456 
457     // Now that all pieces have been handled, re-pack any arguments into any
458     // wider, original registers.
459     if (Handler.isIncomingArgumentHandler()) {
460       if (VAVT.getFixedSizeInBits() < OrigVT.getFixedSizeInBits()) {
461         assert(NumArgRegs >= 2);
462 
463         // Merge the split registers into the expected larger result vreg
464         // of the original call.
465         MIRBuilder.buildMerge(Args[i].OrigRegs[0], Args[i].Regs);
466       }
467     }
468 
469     j += NumArgRegs - 1;
470   }
471 
472   return true;
473 }
474 
475 void CallLowering::insertSRetLoads(MachineIRBuilder &MIRBuilder, Type *RetTy,
476                                    ArrayRef<Register> VRegs, Register DemoteReg,
477                                    int FI) const {
478   MachineFunction &MF = MIRBuilder.getMF();
479   MachineRegisterInfo &MRI = MF.getRegInfo();
480   const DataLayout &DL = MF.getDataLayout();
481 
482   SmallVector<EVT, 4> SplitVTs;
483   SmallVector<uint64_t, 4> Offsets;
484   ComputeValueVTs(*TLI, DL, RetTy, SplitVTs, &Offsets, 0);
485 
486   assert(VRegs.size() == SplitVTs.size());
487 
488   unsigned NumValues = SplitVTs.size();
489   Align BaseAlign = DL.getPrefTypeAlign(RetTy);
490   Type *RetPtrTy = RetTy->getPointerTo(DL.getAllocaAddrSpace());
491   LLT OffsetLLTy = getLLTForType(*DL.getIntPtrType(RetPtrTy), DL);
492 
493   MachinePointerInfo PtrInfo = MachinePointerInfo::getFixedStack(MF, FI);
494 
495   for (unsigned I = 0; I < NumValues; ++I) {
496     Register Addr;
497     MIRBuilder.materializePtrAdd(Addr, DemoteReg, OffsetLLTy, Offsets[I]);
498     auto *MMO = MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOLoad,
499                                         MRI.getType(VRegs[I]).getSizeInBytes(),
500                                         commonAlignment(BaseAlign, Offsets[I]));
501     MIRBuilder.buildLoad(VRegs[I], Addr, *MMO);
502   }
503 }
504 
505 void CallLowering::insertSRetStores(MachineIRBuilder &MIRBuilder, Type *RetTy,
506                                     ArrayRef<Register> VRegs,
507                                     Register DemoteReg) const {
508   MachineFunction &MF = MIRBuilder.getMF();
509   MachineRegisterInfo &MRI = MF.getRegInfo();
510   const DataLayout &DL = MF.getDataLayout();
511 
512   SmallVector<EVT, 4> SplitVTs;
513   SmallVector<uint64_t, 4> Offsets;
514   ComputeValueVTs(*TLI, DL, RetTy, SplitVTs, &Offsets, 0);
515 
516   assert(VRegs.size() == SplitVTs.size());
517 
518   unsigned NumValues = SplitVTs.size();
519   Align BaseAlign = DL.getPrefTypeAlign(RetTy);
520   unsigned AS = DL.getAllocaAddrSpace();
521   LLT OffsetLLTy =
522       getLLTForType(*DL.getIntPtrType(RetTy->getPointerTo(AS)), DL);
523 
524   MachinePointerInfo PtrInfo(AS);
525 
526   for (unsigned I = 0; I < NumValues; ++I) {
527     Register Addr;
528     MIRBuilder.materializePtrAdd(Addr, DemoteReg, OffsetLLTy, Offsets[I]);
529     auto *MMO = MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOStore,
530                                         MRI.getType(VRegs[I]).getSizeInBytes(),
531                                         commonAlignment(BaseAlign, Offsets[I]));
532     MIRBuilder.buildStore(VRegs[I], Addr, *MMO);
533   }
534 }
535 
536 void CallLowering::insertSRetIncomingArgument(
537     const Function &F, SmallVectorImpl<ArgInfo> &SplitArgs, Register &DemoteReg,
538     MachineRegisterInfo &MRI, const DataLayout &DL) const {
539   unsigned AS = DL.getAllocaAddrSpace();
540   DemoteReg = MRI.createGenericVirtualRegister(
541       LLT::pointer(AS, DL.getPointerSizeInBits(AS)));
542 
543   Type *PtrTy = PointerType::get(F.getReturnType(), AS);
544 
545   SmallVector<EVT, 1> ValueVTs;
546   ComputeValueVTs(*TLI, DL, PtrTy, ValueVTs);
547 
548   // NOTE: Assume that a pointer won't get split into more than one VT.
549   assert(ValueVTs.size() == 1);
550 
551   ArgInfo DemoteArg(DemoteReg, ValueVTs[0].getTypeForEVT(PtrTy->getContext()));
552   setArgFlags(DemoteArg, AttributeList::ReturnIndex, DL, F);
553   DemoteArg.Flags[0].setSRet();
554   SplitArgs.insert(SplitArgs.begin(), DemoteArg);
555 }
556 
557 void CallLowering::insertSRetOutgoingArgument(MachineIRBuilder &MIRBuilder,
558                                               const CallBase &CB,
559                                               CallLoweringInfo &Info) const {
560   const DataLayout &DL = MIRBuilder.getDataLayout();
561   Type *RetTy = CB.getType();
562   unsigned AS = DL.getAllocaAddrSpace();
563   LLT FramePtrTy = LLT::pointer(AS, DL.getPointerSizeInBits(AS));
564 
565   int FI = MIRBuilder.getMF().getFrameInfo().CreateStackObject(
566       DL.getTypeAllocSize(RetTy), DL.getPrefTypeAlign(RetTy), false);
567 
568   Register DemoteReg = MIRBuilder.buildFrameIndex(FramePtrTy, FI).getReg(0);
569   ArgInfo DemoteArg(DemoteReg, PointerType::get(RetTy, AS));
570   setArgFlags(DemoteArg, AttributeList::ReturnIndex, DL, CB);
571   DemoteArg.Flags[0].setSRet();
572 
573   Info.OrigArgs.insert(Info.OrigArgs.begin(), DemoteArg);
574   Info.DemoteStackIndex = FI;
575   Info.DemoteRegister = DemoteReg;
576 }
577 
578 bool CallLowering::checkReturn(CCState &CCInfo,
579                                SmallVectorImpl<BaseArgInfo> &Outs,
580                                CCAssignFn *Fn) const {
581   for (unsigned I = 0, E = Outs.size(); I < E; ++I) {
582     MVT VT = MVT::getVT(Outs[I].Ty);
583     if (Fn(I, VT, VT, CCValAssign::Full, Outs[I].Flags[0], CCInfo))
584       return false;
585   }
586   return true;
587 }
588 
589 void CallLowering::getReturnInfo(CallingConv::ID CallConv, Type *RetTy,
590                                  AttributeList Attrs,
591                                  SmallVectorImpl<BaseArgInfo> &Outs,
592                                  const DataLayout &DL) const {
593   LLVMContext &Context = RetTy->getContext();
594   ISD::ArgFlagsTy Flags = ISD::ArgFlagsTy();
595 
596   SmallVector<EVT, 4> SplitVTs;
597   ComputeValueVTs(*TLI, DL, RetTy, SplitVTs);
598   addArgFlagsFromAttributes(Flags, Attrs, AttributeList::ReturnIndex);
599 
600   for (EVT VT : SplitVTs) {
601     unsigned NumParts =
602         TLI->getNumRegistersForCallingConv(Context, CallConv, VT);
603     MVT RegVT = TLI->getRegisterTypeForCallingConv(Context, CallConv, VT);
604     Type *PartTy = EVT(RegVT).getTypeForEVT(Context);
605 
606     for (unsigned I = 0; I < NumParts; ++I) {
607       Outs.emplace_back(PartTy, Flags);
608     }
609   }
610 }
611 
612 bool CallLowering::checkReturnTypeForCallConv(MachineFunction &MF) const {
613   const auto &F = MF.getFunction();
614   Type *ReturnType = F.getReturnType();
615   CallingConv::ID CallConv = F.getCallingConv();
616 
617   SmallVector<BaseArgInfo, 4> SplitArgs;
618   getReturnInfo(CallConv, ReturnType, F.getAttributes(), SplitArgs,
619                 MF.getDataLayout());
620   return canLowerReturn(MF, CallConv, SplitArgs, F.isVarArg());
621 }
622 
623 bool CallLowering::analyzeArgInfo(CCState &CCState,
624                                   SmallVectorImpl<ArgInfo> &Args,
625                                   CCAssignFn &AssignFnFixed,
626                                   CCAssignFn &AssignFnVarArg) const {
627   for (unsigned i = 0, e = Args.size(); i < e; ++i) {
628     MVT VT = MVT::getVT(Args[i].Ty);
629     CCAssignFn &Fn = Args[i].IsFixed ? AssignFnFixed : AssignFnVarArg;
630     if (Fn(i, VT, VT, CCValAssign::Full, Args[i].Flags[0], CCState)) {
631       // Bail out on anything we can't handle.
632       LLVM_DEBUG(dbgs() << "Cannot analyze " << EVT(VT).getEVTString()
633                         << " (arg number = " << i << "\n");
634       return false;
635     }
636   }
637   return true;
638 }
639 
640 bool CallLowering::parametersInCSRMatch(
641     const MachineRegisterInfo &MRI, const uint32_t *CallerPreservedMask,
642     const SmallVectorImpl<CCValAssign> &OutLocs,
643     const SmallVectorImpl<ArgInfo> &OutArgs) const {
644   for (unsigned i = 0; i < OutLocs.size(); ++i) {
645     auto &ArgLoc = OutLocs[i];
646     // If it's not a register, it's fine.
647     if (!ArgLoc.isRegLoc())
648       continue;
649 
650     MCRegister PhysReg = ArgLoc.getLocReg();
651 
652     // Only look at callee-saved registers.
653     if (MachineOperand::clobbersPhysReg(CallerPreservedMask, PhysReg))
654       continue;
655 
656     LLVM_DEBUG(
657         dbgs()
658         << "... Call has an argument passed in a callee-saved register.\n");
659 
660     // Check if it was copied from.
661     const ArgInfo &OutInfo = OutArgs[i];
662 
663     if (OutInfo.Regs.size() > 1) {
664       LLVM_DEBUG(
665           dbgs() << "... Cannot handle arguments in multiple registers.\n");
666       return false;
667     }
668 
669     // Check if we copy the register, walking through copies from virtual
670     // registers. Note that getDefIgnoringCopies does not ignore copies from
671     // physical registers.
672     MachineInstr *RegDef = getDefIgnoringCopies(OutInfo.Regs[0], MRI);
673     if (!RegDef || RegDef->getOpcode() != TargetOpcode::COPY) {
674       LLVM_DEBUG(
675           dbgs()
676           << "... Parameter was not copied into a VReg, cannot tail call.\n");
677       return false;
678     }
679 
680     // Got a copy. Verify that it's the same as the register we want.
681     Register CopyRHS = RegDef->getOperand(1).getReg();
682     if (CopyRHS != PhysReg) {
683       LLVM_DEBUG(dbgs() << "... Callee-saved register was not copied into "
684                            "VReg, cannot tail call.\n");
685       return false;
686     }
687   }
688 
689   return true;
690 }
691 
692 bool CallLowering::resultsCompatible(CallLoweringInfo &Info,
693                                      MachineFunction &MF,
694                                      SmallVectorImpl<ArgInfo> &InArgs,
695                                      CCAssignFn &CalleeAssignFnFixed,
696                                      CCAssignFn &CalleeAssignFnVarArg,
697                                      CCAssignFn &CallerAssignFnFixed,
698                                      CCAssignFn &CallerAssignFnVarArg) const {
699   const Function &F = MF.getFunction();
700   CallingConv::ID CalleeCC = Info.CallConv;
701   CallingConv::ID CallerCC = F.getCallingConv();
702 
703   if (CallerCC == CalleeCC)
704     return true;
705 
706   SmallVector<CCValAssign, 16> ArgLocs1;
707   CCState CCInfo1(CalleeCC, false, MF, ArgLocs1, F.getContext());
708   if (!analyzeArgInfo(CCInfo1, InArgs, CalleeAssignFnFixed,
709                       CalleeAssignFnVarArg))
710     return false;
711 
712   SmallVector<CCValAssign, 16> ArgLocs2;
713   CCState CCInfo2(CallerCC, false, MF, ArgLocs2, F.getContext());
714   if (!analyzeArgInfo(CCInfo2, InArgs, CallerAssignFnFixed,
715                       CalleeAssignFnVarArg))
716     return false;
717 
718   // We need the argument locations to match up exactly. If there's more in
719   // one than the other, then we are done.
720   if (ArgLocs1.size() != ArgLocs2.size())
721     return false;
722 
723   // Make sure that each location is passed in exactly the same way.
724   for (unsigned i = 0, e = ArgLocs1.size(); i < e; ++i) {
725     const CCValAssign &Loc1 = ArgLocs1[i];
726     const CCValAssign &Loc2 = ArgLocs2[i];
727 
728     // We need both of them to be the same. So if one is a register and one
729     // isn't, we're done.
730     if (Loc1.isRegLoc() != Loc2.isRegLoc())
731       return false;
732 
733     if (Loc1.isRegLoc()) {
734       // If they don't have the same register location, we're done.
735       if (Loc1.getLocReg() != Loc2.getLocReg())
736         return false;
737 
738       // They matched, so we can move to the next ArgLoc.
739       continue;
740     }
741 
742     // Loc1 wasn't a RegLoc, so they both must be MemLocs. Check if they match.
743     if (Loc1.getLocMemOffset() != Loc2.getLocMemOffset())
744       return false;
745   }
746 
747   return true;
748 }
749 
750 Register CallLowering::ValueHandler::extendRegister(Register ValReg,
751                                                     CCValAssign &VA,
752                                                     unsigned MaxSizeBits) {
753   LLT LocTy{VA.getLocVT()};
754   LLT ValTy = MRI.getType(ValReg);
755   if (LocTy.getSizeInBits() == ValTy.getSizeInBits())
756     return ValReg;
757 
758   if (LocTy.isScalar() && MaxSizeBits && MaxSizeBits < LocTy.getSizeInBits()) {
759     if (MaxSizeBits <= ValTy.getSizeInBits())
760       return ValReg;
761     LocTy = LLT::scalar(MaxSizeBits);
762   }
763 
764   switch (VA.getLocInfo()) {
765   default: break;
766   case CCValAssign::Full:
767   case CCValAssign::BCvt:
768     // FIXME: bitconverting between vector types may or may not be a
769     // nop in big-endian situations.
770     return ValReg;
771   case CCValAssign::AExt: {
772     auto MIB = MIRBuilder.buildAnyExt(LocTy, ValReg);
773     return MIB.getReg(0);
774   }
775   case CCValAssign::SExt: {
776     Register NewReg = MRI.createGenericVirtualRegister(LocTy);
777     MIRBuilder.buildSExt(NewReg, ValReg);
778     return NewReg;
779   }
780   case CCValAssign::ZExt: {
781     Register NewReg = MRI.createGenericVirtualRegister(LocTy);
782     MIRBuilder.buildZExt(NewReg, ValReg);
783     return NewReg;
784   }
785   }
786   llvm_unreachable("unable to extend register");
787 }
788 
789 void CallLowering::ValueHandler::anchor() {}
790