1 //===-- FixupStatepointCallerSaved.cpp - Fixup caller saved registers  ----===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 ///
10 /// \file
11 /// Statepoint instruction in deopt parameters contains values which are
12 /// meaningful to the runtime and should be able to be read at the moment the
13 /// call returns. So we can say that we need to encode the fact that these
14 /// values are "late read" by runtime. If we could express this notion for
15 /// register allocator it would produce the right form for us.
16 /// The need to fixup (i.e this pass) is specifically handling the fact that
17 /// we cannot describe such a late read for the register allocator.
18 /// Register allocator may put the value on a register clobbered by the call.
19 /// This pass forces the spill of such registers and replaces corresponding
20 /// statepoint operands to added spill slots.
21 ///
22 //===----------------------------------------------------------------------===//
23 
24 #include "llvm/ADT/SmallSet.h"
25 #include "llvm/ADT/Statistic.h"
26 #include "llvm/CodeGen/MachineFrameInfo.h"
27 #include "llvm/CodeGen/MachineFunctionPass.h"
28 #include "llvm/CodeGen/MachineRegisterInfo.h"
29 #include "llvm/CodeGen/Passes.h"
30 #include "llvm/CodeGen/StackMaps.h"
31 #include "llvm/CodeGen/TargetFrameLowering.h"
32 #include "llvm/CodeGen/TargetInstrInfo.h"
33 #include "llvm/IR/Statepoint.h"
34 #include "llvm/InitializePasses.h"
35 #include "llvm/Support/Debug.h"
36 
37 using namespace llvm;
38 
39 #define DEBUG_TYPE "fixup-statepoint-caller-saved"
40 STATISTIC(NumSpilledRegisters, "Number of spilled register");
41 STATISTIC(NumSpillSlotsAllocated, "Number of spill slots allocated");
42 STATISTIC(NumSpillSlotsExtended, "Number of spill slots extended");
43 
44 static cl::opt<bool> FixupSCSExtendSlotSize(
45     "fixup-scs-extend-slot-size", cl::Hidden, cl::init(false),
46     cl::desc("Allow spill in spill slot of greater size than register size"),
47     cl::Hidden);
48 
49 static cl::opt<bool> PassGCPtrInCSR(
50     "fixup-allow-gcptr-in-csr", cl::Hidden, cl::init(false),
51     cl::desc("Allow passing GC Pointer arguments in callee saved registers"));
52 
53 static cl::opt<bool> EnableCopyProp(
54     "fixup-scs-enable-copy-propagation", cl::Hidden, cl::init(true),
55     cl::desc("Enable simple copy propagation during register reloading"));
56 
57 // This is purely debugging option.
58 // It may be handy for investigating statepoint spilling issues.
59 static cl::opt<unsigned> MaxStatepointsWithRegs(
60     "fixup-max-csr-statepoints", cl::Hidden,
61     cl::desc("Max number of statepoints allowed to pass GC Ptrs in registers"));
62 
63 namespace {
64 
65 class FixupStatepointCallerSaved : public MachineFunctionPass {
66 public:
67   static char ID;
68 
69   FixupStatepointCallerSaved() : MachineFunctionPass(ID) {
70     initializeFixupStatepointCallerSavedPass(*PassRegistry::getPassRegistry());
71   }
72 
73   void getAnalysisUsage(AnalysisUsage &AU) const override {
74     AU.setPreservesCFG();
75     MachineFunctionPass::getAnalysisUsage(AU);
76   }
77 
78   StringRef getPassName() const override {
79     return "Fixup Statepoint Caller Saved";
80   }
81 
82   bool runOnMachineFunction(MachineFunction &MF) override;
83 };
84 
85 } // End anonymous namespace.
86 
87 char FixupStatepointCallerSaved::ID = 0;
88 char &llvm::FixupStatepointCallerSavedID = FixupStatepointCallerSaved::ID;
89 
90 INITIALIZE_PASS_BEGIN(FixupStatepointCallerSaved, DEBUG_TYPE,
91                       "Fixup Statepoint Caller Saved", false, false)
92 INITIALIZE_PASS_END(FixupStatepointCallerSaved, DEBUG_TYPE,
93                     "Fixup Statepoint Caller Saved", false, false)
94 
95 // Utility function to get size of the register.
96 static unsigned getRegisterSize(const TargetRegisterInfo &TRI, Register Reg) {
97   const TargetRegisterClass *RC = TRI.getMinimalPhysRegClass(Reg);
98   return TRI.getSpillSize(*RC);
99 }
100 
101 // Advance iterator to the next stack map entry
102 static MachineInstr::const_mop_iterator
103 advanceToNextStackMapElt(MachineInstr::const_mop_iterator MOI) {
104   if (MOI->isImm()) {
105     switch (MOI->getImm()) {
106     default:
107       llvm_unreachable("Unrecognized operand type.");
108     case StackMaps::DirectMemRefOp:
109       MOI += 2; // <Reg>, <Imm>
110       break;
111     case StackMaps::IndirectMemRefOp:
112       MOI += 3; // <Size>, <Reg>, <Imm>
113       break;
114     case StackMaps::ConstantOp:
115       MOI += 1;
116       break;
117     }
118   }
119   return ++MOI;
120 }
121 
122 // Return statepoint GC args as a set
123 static SmallSet<Register, 8> collectGCRegs(MachineInstr &MI) {
124   StatepointOpers SO(&MI);
125   unsigned NumDeoptIdx = SO.getNumDeoptArgsIdx();
126   unsigned NumDeoptArgs = MI.getOperand(NumDeoptIdx).getImm();
127   MachineInstr::const_mop_iterator MOI(MI.operands_begin() + NumDeoptIdx + 1),
128       MOE(MI.operands_end());
129 
130   // Skip deopt args
131   while (NumDeoptArgs--)
132     MOI = advanceToNextStackMapElt(MOI);
133 
134   SmallSet<Register, 8> Result;
135   while (MOI != MOE) {
136     if (MOI->isReg() && !MOI->isImplicit())
137       Result.insert(MOI->getReg());
138     MOI = advanceToNextStackMapElt(MOI);
139   }
140   return Result;
141 }
142 
143 // Try to eliminate redundant copy to register which we're going to
144 // spill, i.e. try to change:
145 //    X = COPY Y
146 //    SPILL X
147 //  to
148 //    SPILL Y
149 //  If there are no uses of X between copy and STATEPOINT, that COPY
150 //  may be eliminated.
151 //  Reg - register we're about to spill
152 //  RI - On entry points to statepoint.
153 //       On successful copy propagation set to new spill point.
154 //  IsKill - set to true if COPY is Kill (there are no uses of Y)
155 //  Returns either found source copy register or original one.
156 static Register performCopyPropagation(Register Reg,
157                                        MachineBasicBlock::iterator &RI,
158                                        bool &IsKill, const TargetInstrInfo &TII,
159                                        const TargetRegisterInfo &TRI) {
160   if (!EnableCopyProp)
161     return Reg;
162 
163   // First check if statepoint itself uses Reg in non-meta operands.
164   int Idx = RI->findRegisterUseOperandIdx(Reg, false, &TRI);
165   if (Idx >= 0 && (unsigned)Idx < StatepointOpers(&*RI).getNumDeoptArgsIdx())
166     return Reg;
167 
168   MachineBasicBlock *MBB = RI->getParent();
169   MachineBasicBlock::reverse_iterator E = MBB->rend();
170   MachineInstr *Def = nullptr, *Use = nullptr;
171   for (auto It = ++(RI.getReverse()); It != E; ++It) {
172     if (It->readsRegister(Reg, &TRI) && !Use)
173       Use = &*It;
174     if (It->modifiesRegister(Reg, &TRI)) {
175       Def = &*It;
176       break;
177     }
178   }
179 
180   if (!Def)
181     return Reg;
182 
183   auto DestSrc = TII.isCopyInstr(*Def);
184   if (!DestSrc || DestSrc->Destination->getReg() != Reg)
185     return Reg;
186 
187   Register SrcReg = DestSrc->Source->getReg();
188 
189   if (getRegisterSize(TRI, Reg) != getRegisterSize(TRI, SrcReg))
190     return Reg;
191 
192   LLVM_DEBUG(dbgs() << "spillRegisters: perform copy propagation "
193                     << printReg(Reg, &TRI) << " -> " << printReg(SrcReg, &TRI)
194                     << "\n");
195 
196   // Insert spill immediately after Def
197   RI = ++MachineBasicBlock::iterator(Def);
198   IsKill = DestSrc->Source->isKill();
199 
200   // There are no uses of original register between COPY and STATEPOINT.
201   // There can't be any after STATEPOINT, so we can eliminate Def.
202   if (!Use) {
203     LLVM_DEBUG(dbgs() << "spillRegisters: removing dead copy " << *Def);
204     Def->eraseFromParent();
205   }
206   return SrcReg;
207 }
208 
209 namespace {
210 // Pair {Register, FrameIndex}
211 using RegSlotPair = std::pair<Register, int>;
212 
213 // Keeps track of what reloads were inserted in MBB.
214 class RegReloadCache {
215   using ReloadSet = SmallSet<RegSlotPair, 8>;
216   DenseMap<const MachineBasicBlock *, ReloadSet> Reloads;
217 
218 public:
219   RegReloadCache() = default;
220 
221   // Record reload of Reg from FI in block MBB
222   void recordReload(Register Reg, int FI, const MachineBasicBlock *MBB) {
223     RegSlotPair RSP(Reg, FI);
224     auto Res = Reloads[MBB].insert(RSP);
225     assert(Res.second && "reload already exists");
226   }
227 
228   // Does basic block MBB contains reload of Reg from FI?
229   bool hasReload(Register Reg, int FI, const MachineBasicBlock *MBB) {
230     RegSlotPair RSP(Reg, FI);
231     return Reloads.count(MBB) && Reloads[MBB].count(RSP);
232   }
233 };
234 
235 // Cache used frame indexes during statepoint re-write to re-use them in
236 // processing next statepoint instruction.
237 // Two strategies. One is to preserve the size of spill slot while another one
238 // extends the size of spill slots to reduce the number of them, causing
239 // the less total frame size. But unspill will have "implicit" any extend.
240 class FrameIndexesCache {
241 private:
242   struct FrameIndexesPerSize {
243     // List of used frame indexes during processing previous statepoints.
244     SmallVector<int, 8> Slots;
245     // Current index of un-used yet frame index.
246     unsigned Index = 0;
247   };
248   MachineFrameInfo &MFI;
249   const TargetRegisterInfo &TRI;
250   // Map size to list of frame indexes of this size. If the mode is
251   // FixupSCSExtendSlotSize then the key 0 is used to keep all frame indexes.
252   // If the size of required spill slot is greater than in a cache then the
253   // size will be increased.
254   DenseMap<unsigned, FrameIndexesPerSize> Cache;
255 
256   // Keeps track of slots reserved for the shared landing pad processing.
257   // Initialized from GlobalIndices for the current EHPad.
258   SmallSet<int, 8> ReservedSlots;
259 
260   // Landing pad can be destination of several statepoints. Every register
261   // defined by such statepoints must be spilled to the same stack slot.
262   // This map keeps that information.
263   DenseMap<const MachineBasicBlock *, SmallVector<RegSlotPair, 8>>
264       GlobalIndices;
265 
266   FrameIndexesPerSize &getCacheBucket(unsigned Size) {
267     // In FixupSCSExtendSlotSize mode the bucket with 0 index is used
268     // for all sizes.
269     return Cache[FixupSCSExtendSlotSize ? 0 : Size];
270   }
271 
272 public:
273   FrameIndexesCache(MachineFrameInfo &MFI, const TargetRegisterInfo &TRI)
274       : MFI(MFI), TRI(TRI) {}
275   // Reset the current state of used frame indexes. After invocation of
276   // this function all frame indexes are available for allocation with
277   // the exception of slots reserved for landing pad processing (if any).
278   void reset(const MachineBasicBlock *EHPad) {
279     for (auto &It : Cache)
280       It.second.Index = 0;
281 
282     ReservedSlots.clear();
283     if (EHPad && GlobalIndices.count(EHPad))
284       for (auto &RSP : GlobalIndices[EHPad])
285         ReservedSlots.insert(RSP.second);
286   }
287 
288   // Get frame index to spill the register.
289   int getFrameIndex(Register Reg, MachineBasicBlock *EHPad) {
290     // Check if slot for Reg is already reserved at EHPad.
291     auto It = GlobalIndices.find(EHPad);
292     if (It != GlobalIndices.end()) {
293       auto &Vec = It->second;
294       auto Idx = llvm::find_if(
295           Vec, [Reg](RegSlotPair &RSP) { return Reg == RSP.first; });
296       if (Idx != Vec.end()) {
297         int FI = Idx->second;
298         LLVM_DEBUG(dbgs() << "Found global FI " << FI << " for register "
299                           << printReg(Reg, &TRI) << " at "
300                           << printMBBReference(*EHPad) << "\n");
301         assert(ReservedSlots.count(FI) && "using unreserved slot");
302         return FI;
303       }
304     }
305 
306     unsigned Size = getRegisterSize(TRI, Reg);
307     FrameIndexesPerSize &Line = getCacheBucket(Size);
308     while (Line.Index < Line.Slots.size()) {
309       int FI = Line.Slots[Line.Index++];
310       if (ReservedSlots.count(FI))
311         continue;
312       // If all sizes are kept together we probably need to extend the
313       // spill slot size.
314       if (MFI.getObjectSize(FI) < Size) {
315         MFI.setObjectSize(FI, Size);
316         MFI.setObjectAlignment(FI, Align(Size));
317         NumSpillSlotsExtended++;
318       }
319       return FI;
320     }
321     int FI = MFI.CreateSpillStackObject(Size, Align(Size));
322     NumSpillSlotsAllocated++;
323     Line.Slots.push_back(FI);
324     ++Line.Index;
325 
326     // Remember assignment {Reg, FI} for EHPad
327     if (EHPad) {
328       GlobalIndices[EHPad].push_back(std::make_pair(Reg, FI));
329       LLVM_DEBUG(dbgs() << "Reserved FI " << FI << " for spilling reg "
330                         << printReg(Reg, &TRI) << " at landing pad "
331                         << printMBBReference(*EHPad) << "\n");
332     }
333 
334     return FI;
335   }
336 
337   // Sort all registers to spill in descendent order. In the
338   // FixupSCSExtendSlotSize mode it will minimize the total frame size.
339   // In non FixupSCSExtendSlotSize mode we can skip this step.
340   void sortRegisters(SmallVectorImpl<Register> &Regs) {
341     if (!FixupSCSExtendSlotSize)
342       return;
343     llvm::sort(Regs.begin(), Regs.end(), [&](Register &A, Register &B) {
344       return getRegisterSize(TRI, A) > getRegisterSize(TRI, B);
345     });
346   }
347 };
348 
349 // Describes the state of the current processing statepoint instruction.
350 class StatepointState {
351 private:
352   // statepoint instruction.
353   MachineInstr &MI;
354   MachineFunction &MF;
355   // If non-null then statepoint is invoke, and this points to the landing pad.
356   MachineBasicBlock *EHPad;
357   const TargetRegisterInfo &TRI;
358   const TargetInstrInfo &TII;
359   MachineFrameInfo &MFI;
360   // Mask with callee saved registers.
361   const uint32_t *Mask;
362   // Cache of frame indexes used on previous instruction processing.
363   FrameIndexesCache &CacheFI;
364   bool AllowGCPtrInCSR;
365   // Operands with physical registers requiring spilling.
366   SmallVector<unsigned, 8> OpsToSpill;
367   // Set of register to spill.
368   SmallVector<Register, 8> RegsToSpill;
369   // Set of registers to reload after statepoint.
370   SmallVector<Register, 8> RegsToReload;
371   // Map Register to Frame Slot index.
372   DenseMap<Register, int> RegToSlotIdx;
373 
374 public:
375   StatepointState(MachineInstr &MI, const uint32_t *Mask,
376                   FrameIndexesCache &CacheFI, bool AllowGCPtrInCSR)
377       : MI(MI), MF(*MI.getMF()), TRI(*MF.getSubtarget().getRegisterInfo()),
378         TII(*MF.getSubtarget().getInstrInfo()), MFI(MF.getFrameInfo()),
379         Mask(Mask), CacheFI(CacheFI), AllowGCPtrInCSR(AllowGCPtrInCSR) {
380 
381     // Find statepoint's landing pad, if any.
382     EHPad = nullptr;
383     MachineBasicBlock *MBB = MI.getParent();
384     // Invoke statepoint must be last one in block.
385     bool Last = std::none_of(++MI.getIterator(), MBB->end().getInstrIterator(),
386                              [](MachineInstr &I) {
387                                return I.getOpcode() == TargetOpcode::STATEPOINT;
388                              });
389 
390     if (!Last)
391       return;
392 
393     auto IsEHPad = [](MachineBasicBlock *B) { return B->isEHPad(); };
394 
395     assert(llvm::count_if(MBB->successors(), IsEHPad) < 2 && "multiple EHPads");
396 
397     auto It = llvm::find_if(MBB->successors(), IsEHPad);
398     if (It != MBB->succ_end())
399       EHPad = *It;
400   }
401 
402   MachineBasicBlock *getEHPad() const { return EHPad; }
403 
404   // Return true if register is callee saved.
405   bool isCalleeSaved(Register Reg) { return (Mask[Reg / 32] >> Reg % 32) & 1; }
406 
407   // Iterates over statepoint meta args to find caller saver registers.
408   // Also cache the size of found registers.
409   // Returns true if caller save registers found.
410   bool findRegistersToSpill() {
411     SmallSet<Register, 8> VisitedRegs;
412     SmallSet<Register, 8> GCRegs = collectGCRegs(MI);
413     for (unsigned Idx = StatepointOpers(&MI).getVarIdx(),
414                   EndIdx = MI.getNumOperands();
415          Idx < EndIdx; ++Idx) {
416       MachineOperand &MO = MI.getOperand(Idx);
417       if (!MO.isReg() || MO.isImplicit())
418         continue;
419       Register Reg = MO.getReg();
420       assert(Reg.isPhysical() && "Only physical regs are expected");
421 
422       if (isCalleeSaved(Reg) && (AllowGCPtrInCSR || !is_contained(GCRegs, Reg)))
423         continue;
424 
425       LLVM_DEBUG(dbgs() << "Will spill " << printReg(Reg, &TRI) << " at index "
426                         << Idx << "\n");
427 
428       if (VisitedRegs.insert(Reg).second)
429         RegsToSpill.push_back(Reg);
430       OpsToSpill.push_back(Idx);
431     }
432     CacheFI.sortRegisters(RegsToSpill);
433     return !RegsToSpill.empty();
434   }
435 
436   // Spill all caller saved registers right before statepoint instruction.
437   // Remember frame index where register is spilled.
438   void spillRegisters() {
439     for (Register Reg : RegsToSpill) {
440       int FI = CacheFI.getFrameIndex(Reg, EHPad);
441       const TargetRegisterClass *RC = TRI.getMinimalPhysRegClass(Reg);
442 
443       NumSpilledRegisters++;
444       RegToSlotIdx[Reg] = FI;
445 
446       LLVM_DEBUG(dbgs() << "Spilling " << printReg(Reg, &TRI) << " to FI " << FI
447                         << "\n");
448 
449       // Perform trivial copy propagation
450       bool IsKill = true;
451       MachineBasicBlock::iterator InsertBefore(MI);
452       Reg = performCopyPropagation(Reg, InsertBefore, IsKill, TII, TRI);
453 
454       LLVM_DEBUG(dbgs() << "Insert spill before " << *InsertBefore);
455       TII.storeRegToStackSlot(*MI.getParent(), InsertBefore, Reg, IsKill, FI,
456                               RC, &TRI);
457     }
458   }
459 
460   void insertReloadBefore(unsigned Reg, MachineBasicBlock::iterator It,
461                           MachineBasicBlock *MBB) {
462     const TargetRegisterClass *RC = TRI.getMinimalPhysRegClass(Reg);
463     int FI = RegToSlotIdx[Reg];
464     if (It != MBB->end()) {
465       TII.loadRegFromStackSlot(*MBB, It, Reg, FI, RC, &TRI);
466       return;
467     }
468 
469     // To insert reload at the end of MBB, insert it before last instruction
470     // and then swap them.
471     assert(MBB->begin() != MBB->end() && "Empty block");
472     --It;
473     TII.loadRegFromStackSlot(*MBB, It, Reg, FI, RC, &TRI);
474     MachineInstr *Reload = It->getPrevNode();
475     int Dummy = 0;
476     assert(TII.isLoadFromStackSlot(*Reload, Dummy) == Reg);
477     assert(Dummy == FI);
478     MBB->remove(Reload);
479     MBB->insertAfter(It, Reload);
480   }
481 
482   // Insert reloads of (relocated) registers spilled in statepoint.
483   void insertReloads(MachineInstr *NewStatepoint, RegReloadCache &RC) {
484     MachineBasicBlock *MBB = NewStatepoint->getParent();
485     auto InsertPoint = std::next(NewStatepoint->getIterator());
486 
487     for (auto Reg : RegsToReload) {
488       insertReloadBefore(Reg, InsertPoint, MBB);
489       LLVM_DEBUG(dbgs() << "Reloading " << printReg(Reg, &TRI) << " from FI "
490                         << RegToSlotIdx[Reg] << " after statepoint\n");
491 
492       if (EHPad && !RC.hasReload(Reg, RegToSlotIdx[Reg], EHPad)) {
493         RC.recordReload(Reg, RegToSlotIdx[Reg], EHPad);
494         auto EHPadInsertPoint = EHPad->SkipPHIsLabelsAndDebug(EHPad->begin());
495         insertReloadBefore(Reg, EHPadInsertPoint, EHPad);
496         LLVM_DEBUG(dbgs() << "...also reload at EHPad "
497                           << printMBBReference(*EHPad) << "\n");
498       }
499     }
500   }
501 
502   // Re-write statepoint machine instruction to replace caller saved operands
503   // with indirect memory location (frame index).
504   MachineInstr *rewriteStatepoint() {
505     MachineInstr *NewMI =
506         MF.CreateMachineInstr(TII.get(MI.getOpcode()), MI.getDebugLoc(), true);
507     MachineInstrBuilder MIB(MF, NewMI);
508 
509     unsigned NumOps = MI.getNumOperands();
510 
511     // New indices for the remaining defs.
512     SmallVector<unsigned, 8> NewIndices;
513     unsigned NumDefs = MI.getNumDefs();
514     for (unsigned I = 0; I < NumDefs; ++I) {
515       MachineOperand &DefMO = MI.getOperand(I);
516       assert(DefMO.isReg() && DefMO.isDef() && "Expected Reg Def operand");
517       Register Reg = DefMO.getReg();
518       if (!AllowGCPtrInCSR) {
519         assert(is_contained(RegsToSpill, Reg));
520         RegsToReload.push_back(Reg);
521       } else {
522         if (isCalleeSaved(Reg)) {
523           NewIndices.push_back(NewMI->getNumOperands());
524           MIB.addReg(Reg, RegState::Define);
525         } else {
526           NewIndices.push_back(NumOps);
527           RegsToReload.push_back(Reg);
528         }
529       }
530     }
531 
532     // Add End marker.
533     OpsToSpill.push_back(MI.getNumOperands());
534     unsigned CurOpIdx = 0;
535 
536     for (unsigned I = NumDefs; I < MI.getNumOperands(); ++I) {
537       MachineOperand &MO = MI.getOperand(I);
538       if (I == OpsToSpill[CurOpIdx]) {
539         int FI = RegToSlotIdx[MO.getReg()];
540         MIB.addImm(StackMaps::IndirectMemRefOp);
541         MIB.addImm(getRegisterSize(TRI, MO.getReg()));
542         assert(MO.isReg() && "Should be register");
543         assert(MO.getReg().isPhysical() && "Should be physical register");
544         MIB.addFrameIndex(FI);
545         MIB.addImm(0);
546         ++CurOpIdx;
547       } else {
548         MIB.add(MO);
549         unsigned OldDef;
550         if (AllowGCPtrInCSR && MI.isRegTiedToDefOperand(I, &OldDef)) {
551           assert(OldDef < NumDefs);
552           assert(NewIndices[OldDef] < NumOps);
553           MIB->tieOperands(NewIndices[OldDef], MIB->getNumOperands() - 1);
554         }
555       }
556     }
557     assert(CurOpIdx == (OpsToSpill.size() - 1) && "Not all operands processed");
558     // Add mem operands.
559     NewMI->setMemRefs(MF, MI.memoperands());
560     for (auto It : RegToSlotIdx) {
561       Register R = It.first;
562       int FrameIndex = It.second;
563       auto PtrInfo = MachinePointerInfo::getFixedStack(MF, FrameIndex);
564       MachineMemOperand::Flags Flags = MachineMemOperand::MOLoad;
565       if (is_contained(RegsToReload, R))
566         Flags |= MachineMemOperand::MOStore;
567       auto *MMO =
568           MF.getMachineMemOperand(PtrInfo, Flags, getRegisterSize(TRI, R),
569                                   MFI.getObjectAlign(FrameIndex));
570       NewMI->addMemOperand(MF, MMO);
571     }
572 
573     // Insert new statepoint and erase old one.
574     MI.getParent()->insert(MI, NewMI);
575 
576     LLVM_DEBUG(dbgs() << "rewritten statepoint to : " << *NewMI << "\n");
577     MI.eraseFromParent();
578     return NewMI;
579   }
580 };
581 
582 class StatepointProcessor {
583 private:
584   MachineFunction &MF;
585   const TargetRegisterInfo &TRI;
586   FrameIndexesCache CacheFI;
587   RegReloadCache ReloadCache;
588 
589 public:
590   StatepointProcessor(MachineFunction &MF)
591       : MF(MF), TRI(*MF.getSubtarget().getRegisterInfo()),
592         CacheFI(MF.getFrameInfo(), TRI) {}
593 
594   bool process(MachineInstr &MI, bool AllowGCPtrInCSR) {
595     StatepointOpers SO(&MI);
596     uint64_t Flags = SO.getFlags();
597     // Do nothing for LiveIn, it supports all registers.
598     if (Flags & (uint64_t)StatepointFlags::DeoptLiveIn)
599       return false;
600     LLVM_DEBUG(dbgs() << "\nMBB " << MI.getParent()->getNumber() << " "
601                       << MI.getParent()->getName() << " : process statepoint "
602                       << MI);
603     CallingConv::ID CC = SO.getCallingConv();
604     const uint32_t *Mask = TRI.getCallPreservedMask(MF, CC);
605     StatepointState SS(MI, Mask, CacheFI, AllowGCPtrInCSR);
606     CacheFI.reset(SS.getEHPad());
607 
608     if (!SS.findRegistersToSpill())
609       return false;
610 
611     SS.spillRegisters();
612     auto *NewStatepoint = SS.rewriteStatepoint();
613     SS.insertReloads(NewStatepoint, ReloadCache);
614     return true;
615   }
616 };
617 } // namespace
618 
619 bool FixupStatepointCallerSaved::runOnMachineFunction(MachineFunction &MF) {
620   if (skipFunction(MF.getFunction()))
621     return false;
622 
623   const Function &F = MF.getFunction();
624   if (!F.hasGC())
625     return false;
626 
627   SmallVector<MachineInstr *, 16> Statepoints;
628   for (MachineBasicBlock &BB : MF)
629     for (MachineInstr &I : BB)
630       if (I.getOpcode() == TargetOpcode::STATEPOINT)
631         Statepoints.push_back(&I);
632 
633   if (Statepoints.empty())
634     return false;
635 
636   bool Changed = false;
637   StatepointProcessor SPP(MF);
638   unsigned NumStatepoints = 0;
639   bool AllowGCPtrInCSR = PassGCPtrInCSR;
640   for (MachineInstr *I : Statepoints) {
641     ++NumStatepoints;
642     if (MaxStatepointsWithRegs.getNumOccurrences() &&
643         NumStatepoints >= MaxStatepointsWithRegs)
644       AllowGCPtrInCSR = false;
645     Changed |= SPP.process(*I, AllowGCPtrInCSR);
646   }
647   return Changed;
648 }
649