1*0b57cec5SDimitry Andric //===- ResourcePriorityQueue.cpp - A DFA-oriented priority queue -*- C++ -*-==//
2*0b57cec5SDimitry Andric //
3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*0b57cec5SDimitry Andric //
7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
8*0b57cec5SDimitry Andric //
9*0b57cec5SDimitry Andric // This file implements the ResourcePriorityQueue class, which is a
10*0b57cec5SDimitry Andric // SchedulingPriorityQueue that prioritizes instructions using DFA state to
11*0b57cec5SDimitry Andric // reduce the length of the critical path through the basic block
12*0b57cec5SDimitry Andric // on VLIW platforms.
13*0b57cec5SDimitry Andric // The scheduler is basically a top-down adaptable list scheduler with DFA
14*0b57cec5SDimitry Andric // resource tracking added to the cost function.
15*0b57cec5SDimitry Andric // DFA is queried as a state machine to model "packets/bundles" during
16*0b57cec5SDimitry Andric // schedule. Currently packets/bundles are discarded at the end of
17*0b57cec5SDimitry Andric // scheduling, affecting only order of instructions.
18*0b57cec5SDimitry Andric //
19*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
20*0b57cec5SDimitry Andric 
21*0b57cec5SDimitry Andric #include "llvm/CodeGen/ResourcePriorityQueue.h"
22*0b57cec5SDimitry Andric #include "llvm/CodeGen/DFAPacketizer.h"
23*0b57cec5SDimitry Andric #include "llvm/CodeGen/MachineInstr.h"
24*0b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGISel.h"
25*0b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGNodes.h"
26*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetInstrInfo.h"
27*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetLowering.h"
28*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetRegisterInfo.h"
29*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetSubtargetInfo.h"
30*0b57cec5SDimitry Andric #include "llvm/Support/CommandLine.h"
31*0b57cec5SDimitry Andric #include "llvm/Support/Debug.h"
32*0b57cec5SDimitry Andric #include "llvm/Support/raw_ostream.h"
33*0b57cec5SDimitry Andric #include "llvm/Target/TargetMachine.h"
34*0b57cec5SDimitry Andric 
35*0b57cec5SDimitry Andric using namespace llvm;
36*0b57cec5SDimitry Andric 
37*0b57cec5SDimitry Andric #define DEBUG_TYPE "scheduler"
38*0b57cec5SDimitry Andric 
39*0b57cec5SDimitry Andric static cl::opt<bool> DisableDFASched("disable-dfa-sched", cl::Hidden,
40*0b57cec5SDimitry Andric   cl::ZeroOrMore, cl::init(false),
41*0b57cec5SDimitry Andric   cl::desc("Disable use of DFA during scheduling"));
42*0b57cec5SDimitry Andric 
43*0b57cec5SDimitry Andric static cl::opt<int> RegPressureThreshold(
44*0b57cec5SDimitry Andric   "dfa-sched-reg-pressure-threshold", cl::Hidden, cl::ZeroOrMore, cl::init(5),
45*0b57cec5SDimitry Andric   cl::desc("Track reg pressure and switch priority to in-depth"));
46*0b57cec5SDimitry Andric 
ResourcePriorityQueue(SelectionDAGISel * IS)47*0b57cec5SDimitry Andric ResourcePriorityQueue::ResourcePriorityQueue(SelectionDAGISel *IS)
48*0b57cec5SDimitry Andric     : Picker(this), InstrItins(IS->MF->getSubtarget().getInstrItineraryData()) {
49*0b57cec5SDimitry Andric   const TargetSubtargetInfo &STI = IS->MF->getSubtarget();
50*0b57cec5SDimitry Andric   TRI = STI.getRegisterInfo();
51*0b57cec5SDimitry Andric   TLI = IS->TLI;
52*0b57cec5SDimitry Andric   TII = STI.getInstrInfo();
53*0b57cec5SDimitry Andric   ResourcesModel.reset(TII->CreateTargetScheduleState(STI));
54*0b57cec5SDimitry Andric   // This hard requirement could be relaxed, but for now
55*0b57cec5SDimitry Andric   // do not let it proceed.
56*0b57cec5SDimitry Andric   assert(ResourcesModel && "Unimplemented CreateTargetScheduleState.");
57*0b57cec5SDimitry Andric 
58*0b57cec5SDimitry Andric   unsigned NumRC = TRI->getNumRegClasses();
59*0b57cec5SDimitry Andric   RegLimit.resize(NumRC);
60*0b57cec5SDimitry Andric   RegPressure.resize(NumRC);
61*0b57cec5SDimitry Andric   std::fill(RegLimit.begin(), RegLimit.end(), 0);
62*0b57cec5SDimitry Andric   std::fill(RegPressure.begin(), RegPressure.end(), 0);
63*0b57cec5SDimitry Andric   for (const TargetRegisterClass *RC : TRI->regclasses())
64*0b57cec5SDimitry Andric     RegLimit[RC->getID()] = TRI->getRegPressureLimit(RC, *IS->MF);
65*0b57cec5SDimitry Andric 
66*0b57cec5SDimitry Andric   ParallelLiveRanges = 0;
67*0b57cec5SDimitry Andric   HorizontalVerticalBalance = 0;
68*0b57cec5SDimitry Andric }
69*0b57cec5SDimitry Andric 
70*0b57cec5SDimitry Andric unsigned
numberRCValPredInSU(SUnit * SU,unsigned RCId)71*0b57cec5SDimitry Andric ResourcePriorityQueue::numberRCValPredInSU(SUnit *SU, unsigned RCId) {
72*0b57cec5SDimitry Andric   unsigned NumberDeps = 0;
73*0b57cec5SDimitry Andric   for (SDep &Pred : SU->Preds) {
74*0b57cec5SDimitry Andric     if (Pred.isCtrl())
75*0b57cec5SDimitry Andric       continue;
76*0b57cec5SDimitry Andric 
77*0b57cec5SDimitry Andric     SUnit *PredSU = Pred.getSUnit();
78*0b57cec5SDimitry Andric     const SDNode *ScegN = PredSU->getNode();
79*0b57cec5SDimitry Andric 
80*0b57cec5SDimitry Andric     if (!ScegN)
81*0b57cec5SDimitry Andric       continue;
82*0b57cec5SDimitry Andric 
83*0b57cec5SDimitry Andric     // If value is passed to CopyToReg, it is probably
84*0b57cec5SDimitry Andric     // live outside BB.
85*0b57cec5SDimitry Andric     switch (ScegN->getOpcode()) {
86*0b57cec5SDimitry Andric       default:  break;
87*0b57cec5SDimitry Andric       case ISD::TokenFactor:    break;
88*0b57cec5SDimitry Andric       case ISD::CopyFromReg:    NumberDeps++;  break;
89*0b57cec5SDimitry Andric       case ISD::CopyToReg:      break;
90*0b57cec5SDimitry Andric       case ISD::INLINEASM:      break;
91*0b57cec5SDimitry Andric       case ISD::INLINEASM_BR:   break;
92*0b57cec5SDimitry Andric     }
93*0b57cec5SDimitry Andric     if (!ScegN->isMachineOpcode())
94*0b57cec5SDimitry Andric       continue;
95*0b57cec5SDimitry Andric 
96*0b57cec5SDimitry Andric     for (unsigned i = 0, e = ScegN->getNumValues(); i != e; ++i) {
97*0b57cec5SDimitry Andric       MVT VT = ScegN->getSimpleValueType(i);
98*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT)
99*0b57cec5SDimitry Andric           && (TLI->getRegClassFor(VT)->getID() == RCId)) {
100*0b57cec5SDimitry Andric         NumberDeps++;
101*0b57cec5SDimitry Andric         break;
102*0b57cec5SDimitry Andric       }
103*0b57cec5SDimitry Andric     }
104*0b57cec5SDimitry Andric   }
105*0b57cec5SDimitry Andric   return NumberDeps;
106*0b57cec5SDimitry Andric }
107*0b57cec5SDimitry Andric 
numberRCValSuccInSU(SUnit * SU,unsigned RCId)108*0b57cec5SDimitry Andric unsigned ResourcePriorityQueue::numberRCValSuccInSU(SUnit *SU,
109*0b57cec5SDimitry Andric                                                     unsigned RCId) {
110*0b57cec5SDimitry Andric   unsigned NumberDeps = 0;
111*0b57cec5SDimitry Andric   for (const SDep &Succ : SU->Succs) {
112*0b57cec5SDimitry Andric     if (Succ.isCtrl())
113*0b57cec5SDimitry Andric       continue;
114*0b57cec5SDimitry Andric 
115*0b57cec5SDimitry Andric     SUnit *SuccSU = Succ.getSUnit();
116*0b57cec5SDimitry Andric     const SDNode *ScegN = SuccSU->getNode();
117*0b57cec5SDimitry Andric     if (!ScegN)
118*0b57cec5SDimitry Andric       continue;
119*0b57cec5SDimitry Andric 
120*0b57cec5SDimitry Andric     // If value is passed to CopyToReg, it is probably
121*0b57cec5SDimitry Andric     // live outside BB.
122*0b57cec5SDimitry Andric     switch (ScegN->getOpcode()) {
123*0b57cec5SDimitry Andric       default:  break;
124*0b57cec5SDimitry Andric       case ISD::TokenFactor:    break;
125*0b57cec5SDimitry Andric       case ISD::CopyFromReg:    break;
126*0b57cec5SDimitry Andric       case ISD::CopyToReg:      NumberDeps++;  break;
127*0b57cec5SDimitry Andric       case ISD::INLINEASM:      break;
128*0b57cec5SDimitry Andric       case ISD::INLINEASM_BR:   break;
129*0b57cec5SDimitry Andric     }
130*0b57cec5SDimitry Andric     if (!ScegN->isMachineOpcode())
131*0b57cec5SDimitry Andric       continue;
132*0b57cec5SDimitry Andric 
133*0b57cec5SDimitry Andric     for (unsigned i = 0, e = ScegN->getNumOperands(); i != e; ++i) {
134*0b57cec5SDimitry Andric       const SDValue &Op = ScegN->getOperand(i);
135*0b57cec5SDimitry Andric       MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
136*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT)
137*0b57cec5SDimitry Andric           && (TLI->getRegClassFor(VT)->getID() == RCId)) {
138*0b57cec5SDimitry Andric         NumberDeps++;
139*0b57cec5SDimitry Andric         break;
140*0b57cec5SDimitry Andric       }
141*0b57cec5SDimitry Andric     }
142*0b57cec5SDimitry Andric   }
143*0b57cec5SDimitry Andric   return NumberDeps;
144*0b57cec5SDimitry Andric }
145*0b57cec5SDimitry Andric 
numberCtrlDepsInSU(SUnit * SU)146*0b57cec5SDimitry Andric static unsigned numberCtrlDepsInSU(SUnit *SU) {
147*0b57cec5SDimitry Andric   unsigned NumberDeps = 0;
148*0b57cec5SDimitry Andric   for (const SDep &Succ : SU->Succs)
149*0b57cec5SDimitry Andric     if (Succ.isCtrl())
150*0b57cec5SDimitry Andric       NumberDeps++;
151*0b57cec5SDimitry Andric 
152*0b57cec5SDimitry Andric   return NumberDeps;
153*0b57cec5SDimitry Andric }
154*0b57cec5SDimitry Andric 
numberCtrlPredInSU(SUnit * SU)155*0b57cec5SDimitry Andric static unsigned numberCtrlPredInSU(SUnit *SU) {
156*0b57cec5SDimitry Andric   unsigned NumberDeps = 0;
157*0b57cec5SDimitry Andric   for (SDep &Pred : SU->Preds)
158*0b57cec5SDimitry Andric     if (Pred.isCtrl())
159*0b57cec5SDimitry Andric       NumberDeps++;
160*0b57cec5SDimitry Andric 
161*0b57cec5SDimitry Andric   return NumberDeps;
162*0b57cec5SDimitry Andric }
163*0b57cec5SDimitry Andric 
164*0b57cec5SDimitry Andric ///
165*0b57cec5SDimitry Andric /// Initialize nodes.
166*0b57cec5SDimitry Andric ///
initNodes(std::vector<SUnit> & sunits)167*0b57cec5SDimitry Andric void ResourcePriorityQueue::initNodes(std::vector<SUnit> &sunits) {
168*0b57cec5SDimitry Andric   SUnits = &sunits;
169*0b57cec5SDimitry Andric   NumNodesSolelyBlocking.resize(SUnits->size(), 0);
170*0b57cec5SDimitry Andric 
171*0b57cec5SDimitry Andric   for (unsigned i = 0, e = SUnits->size(); i != e; ++i) {
172*0b57cec5SDimitry Andric     SUnit *SU = &(*SUnits)[i];
173*0b57cec5SDimitry Andric     initNumRegDefsLeft(SU);
174*0b57cec5SDimitry Andric     SU->NodeQueueId = 0;
175*0b57cec5SDimitry Andric   }
176*0b57cec5SDimitry Andric }
177*0b57cec5SDimitry Andric 
178*0b57cec5SDimitry Andric /// This heuristic is used if DFA scheduling is not desired
179*0b57cec5SDimitry Andric /// for some VLIW platform.
operator ()(const SUnit * LHS,const SUnit * RHS) const180*0b57cec5SDimitry Andric bool resource_sort::operator()(const SUnit *LHS, const SUnit *RHS) const {
181*0b57cec5SDimitry Andric   // The isScheduleHigh flag allows nodes with wraparound dependencies that
182*0b57cec5SDimitry Andric   // cannot easily be modeled as edges with latencies to be scheduled as
183*0b57cec5SDimitry Andric   // soon as possible in a top-down schedule.
184*0b57cec5SDimitry Andric   if (LHS->isScheduleHigh && !RHS->isScheduleHigh)
185*0b57cec5SDimitry Andric     return false;
186*0b57cec5SDimitry Andric 
187*0b57cec5SDimitry Andric   if (!LHS->isScheduleHigh && RHS->isScheduleHigh)
188*0b57cec5SDimitry Andric     return true;
189*0b57cec5SDimitry Andric 
190*0b57cec5SDimitry Andric   unsigned LHSNum = LHS->NodeNum;
191*0b57cec5SDimitry Andric   unsigned RHSNum = RHS->NodeNum;
192*0b57cec5SDimitry Andric 
193*0b57cec5SDimitry Andric   // The most important heuristic is scheduling the critical path.
194*0b57cec5SDimitry Andric   unsigned LHSLatency = PQ->getLatency(LHSNum);
195*0b57cec5SDimitry Andric   unsigned RHSLatency = PQ->getLatency(RHSNum);
196*0b57cec5SDimitry Andric   if (LHSLatency < RHSLatency) return true;
197*0b57cec5SDimitry Andric   if (LHSLatency > RHSLatency) return false;
198*0b57cec5SDimitry Andric 
199*0b57cec5SDimitry Andric   // After that, if two nodes have identical latencies, look to see if one will
200*0b57cec5SDimitry Andric   // unblock more other nodes than the other.
201*0b57cec5SDimitry Andric   unsigned LHSBlocked = PQ->getNumSolelyBlockNodes(LHSNum);
202*0b57cec5SDimitry Andric   unsigned RHSBlocked = PQ->getNumSolelyBlockNodes(RHSNum);
203*0b57cec5SDimitry Andric   if (LHSBlocked < RHSBlocked) return true;
204*0b57cec5SDimitry Andric   if (LHSBlocked > RHSBlocked) return false;
205*0b57cec5SDimitry Andric 
206*0b57cec5SDimitry Andric   // Finally, just to provide a stable ordering, use the node number as a
207*0b57cec5SDimitry Andric   // deciding factor.
208*0b57cec5SDimitry Andric   return LHSNum < RHSNum;
209*0b57cec5SDimitry Andric }
210*0b57cec5SDimitry Andric 
211*0b57cec5SDimitry Andric 
212*0b57cec5SDimitry Andric /// getSingleUnscheduledPred - If there is exactly one unscheduled predecessor
213*0b57cec5SDimitry Andric /// of SU, return it, otherwise return null.
getSingleUnscheduledPred(SUnit * SU)214*0b57cec5SDimitry Andric SUnit *ResourcePriorityQueue::getSingleUnscheduledPred(SUnit *SU) {
215*0b57cec5SDimitry Andric   SUnit *OnlyAvailablePred = nullptr;
216*0b57cec5SDimitry Andric   for (const SDep &Pred : SU->Preds) {
217*0b57cec5SDimitry Andric     SUnit &PredSU = *Pred.getSUnit();
218*0b57cec5SDimitry Andric     if (!PredSU.isScheduled) {
219*0b57cec5SDimitry Andric       // We found an available, but not scheduled, predecessor.  If it's the
220*0b57cec5SDimitry Andric       // only one we have found, keep track of it... otherwise give up.
221*0b57cec5SDimitry Andric       if (OnlyAvailablePred && OnlyAvailablePred != &PredSU)
222*0b57cec5SDimitry Andric         return nullptr;
223*0b57cec5SDimitry Andric       OnlyAvailablePred = &PredSU;
224*0b57cec5SDimitry Andric     }
225*0b57cec5SDimitry Andric   }
226*0b57cec5SDimitry Andric   return OnlyAvailablePred;
227*0b57cec5SDimitry Andric }
228*0b57cec5SDimitry Andric 
push(SUnit * SU)229*0b57cec5SDimitry Andric void ResourcePriorityQueue::push(SUnit *SU) {
230*0b57cec5SDimitry Andric   // Look at all of the successors of this node.  Count the number of nodes that
231*0b57cec5SDimitry Andric   // this node is the sole unscheduled node for.
232*0b57cec5SDimitry Andric   unsigned NumNodesBlocking = 0;
233*0b57cec5SDimitry Andric   for (const SDep &Succ : SU->Succs)
234*0b57cec5SDimitry Andric     if (getSingleUnscheduledPred(Succ.getSUnit()) == SU)
235*0b57cec5SDimitry Andric       ++NumNodesBlocking;
236*0b57cec5SDimitry Andric 
237*0b57cec5SDimitry Andric   NumNodesSolelyBlocking[SU->NodeNum] = NumNodesBlocking;
238*0b57cec5SDimitry Andric   Queue.push_back(SU);
239*0b57cec5SDimitry Andric }
240*0b57cec5SDimitry Andric 
241*0b57cec5SDimitry Andric /// Check if scheduling of this SU is possible
242*0b57cec5SDimitry Andric /// in the current packet.
isResourceAvailable(SUnit * SU)243*0b57cec5SDimitry Andric bool ResourcePriorityQueue::isResourceAvailable(SUnit *SU) {
244*0b57cec5SDimitry Andric   if (!SU || !SU->getNode())
245*0b57cec5SDimitry Andric     return false;
246*0b57cec5SDimitry Andric 
247*0b57cec5SDimitry Andric   // If this is a compound instruction,
248*0b57cec5SDimitry Andric   // it is likely to be a call. Do not delay it.
249*0b57cec5SDimitry Andric   if (SU->getNode()->getGluedNode())
250*0b57cec5SDimitry Andric     return true;
251*0b57cec5SDimitry Andric 
252*0b57cec5SDimitry Andric   // First see if the pipeline could receive this instruction
253*0b57cec5SDimitry Andric   // in the current cycle.
254*0b57cec5SDimitry Andric   if (SU->getNode()->isMachineOpcode())
255*0b57cec5SDimitry Andric     switch (SU->getNode()->getMachineOpcode()) {
256*0b57cec5SDimitry Andric     default:
257*0b57cec5SDimitry Andric       if (!ResourcesModel->canReserveResources(&TII->get(
258*0b57cec5SDimitry Andric           SU->getNode()->getMachineOpcode())))
259*0b57cec5SDimitry Andric            return false;
260*0b57cec5SDimitry Andric       break;
261*0b57cec5SDimitry Andric     case TargetOpcode::EXTRACT_SUBREG:
262*0b57cec5SDimitry Andric     case TargetOpcode::INSERT_SUBREG:
263*0b57cec5SDimitry Andric     case TargetOpcode::SUBREG_TO_REG:
264*0b57cec5SDimitry Andric     case TargetOpcode::REG_SEQUENCE:
265*0b57cec5SDimitry Andric     case TargetOpcode::IMPLICIT_DEF:
266*0b57cec5SDimitry Andric         break;
267*0b57cec5SDimitry Andric     }
268*0b57cec5SDimitry Andric 
269*0b57cec5SDimitry Andric   // Now see if there are no other dependencies
270*0b57cec5SDimitry Andric   // to instructions already in the packet.
271*0b57cec5SDimitry Andric   for (unsigned i = 0, e = Packet.size(); i != e; ++i)
272*0b57cec5SDimitry Andric     for (const SDep &Succ : Packet[i]->Succs) {
273*0b57cec5SDimitry Andric       // Since we do not add pseudos to packets, might as well
274*0b57cec5SDimitry Andric       // ignore order deps.
275*0b57cec5SDimitry Andric       if (Succ.isCtrl())
276*0b57cec5SDimitry Andric         continue;
277*0b57cec5SDimitry Andric 
278*0b57cec5SDimitry Andric       if (Succ.getSUnit() == SU)
279*0b57cec5SDimitry Andric         return false;
280*0b57cec5SDimitry Andric     }
281*0b57cec5SDimitry Andric 
282*0b57cec5SDimitry Andric   return true;
283*0b57cec5SDimitry Andric }
284*0b57cec5SDimitry Andric 
285*0b57cec5SDimitry Andric /// Keep track of available resources.
reserveResources(SUnit * SU)286*0b57cec5SDimitry Andric void ResourcePriorityQueue::reserveResources(SUnit *SU) {
287*0b57cec5SDimitry Andric   // If this SU does not fit in the packet
288*0b57cec5SDimitry Andric   // start a new one.
289*0b57cec5SDimitry Andric   if (!isResourceAvailable(SU) || SU->getNode()->getGluedNode()) {
290*0b57cec5SDimitry Andric     ResourcesModel->clearResources();
291*0b57cec5SDimitry Andric     Packet.clear();
292*0b57cec5SDimitry Andric   }
293*0b57cec5SDimitry Andric 
294*0b57cec5SDimitry Andric   if (SU->getNode() && SU->getNode()->isMachineOpcode()) {
295*0b57cec5SDimitry Andric     switch (SU->getNode()->getMachineOpcode()) {
296*0b57cec5SDimitry Andric     default:
297*0b57cec5SDimitry Andric       ResourcesModel->reserveResources(&TII->get(
298*0b57cec5SDimitry Andric         SU->getNode()->getMachineOpcode()));
299*0b57cec5SDimitry Andric       break;
300*0b57cec5SDimitry Andric     case TargetOpcode::EXTRACT_SUBREG:
301*0b57cec5SDimitry Andric     case TargetOpcode::INSERT_SUBREG:
302*0b57cec5SDimitry Andric     case TargetOpcode::SUBREG_TO_REG:
303*0b57cec5SDimitry Andric     case TargetOpcode::REG_SEQUENCE:
304*0b57cec5SDimitry Andric     case TargetOpcode::IMPLICIT_DEF:
305*0b57cec5SDimitry Andric       break;
306*0b57cec5SDimitry Andric     }
307*0b57cec5SDimitry Andric     Packet.push_back(SU);
308*0b57cec5SDimitry Andric   }
309*0b57cec5SDimitry Andric   // Forcefully end packet for PseudoOps.
310*0b57cec5SDimitry Andric   else {
311*0b57cec5SDimitry Andric     ResourcesModel->clearResources();
312*0b57cec5SDimitry Andric     Packet.clear();
313*0b57cec5SDimitry Andric   }
314*0b57cec5SDimitry Andric 
315*0b57cec5SDimitry Andric   // If packet is now full, reset the state so in the next cycle
316*0b57cec5SDimitry Andric   // we start fresh.
317*0b57cec5SDimitry Andric   if (Packet.size() >= InstrItins->SchedModel.IssueWidth) {
318*0b57cec5SDimitry Andric     ResourcesModel->clearResources();
319*0b57cec5SDimitry Andric     Packet.clear();
320*0b57cec5SDimitry Andric   }
321*0b57cec5SDimitry Andric }
322*0b57cec5SDimitry Andric 
rawRegPressureDelta(SUnit * SU,unsigned RCId)323*0b57cec5SDimitry Andric int ResourcePriorityQueue::rawRegPressureDelta(SUnit *SU, unsigned RCId) {
324*0b57cec5SDimitry Andric   int RegBalance = 0;
325*0b57cec5SDimitry Andric 
326*0b57cec5SDimitry Andric   if (!SU || !SU->getNode() || !SU->getNode()->isMachineOpcode())
327*0b57cec5SDimitry Andric     return RegBalance;
328*0b57cec5SDimitry Andric 
329*0b57cec5SDimitry Andric   // Gen estimate.
330*0b57cec5SDimitry Andric   for (unsigned i = 0, e = SU->getNode()->getNumValues(); i != e; ++i) {
331*0b57cec5SDimitry Andric       MVT VT = SU->getNode()->getSimpleValueType(i);
332*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT)
333*0b57cec5SDimitry Andric           && TLI->getRegClassFor(VT)
334*0b57cec5SDimitry Andric           && TLI->getRegClassFor(VT)->getID() == RCId)
335*0b57cec5SDimitry Andric         RegBalance += numberRCValSuccInSU(SU, RCId);
336*0b57cec5SDimitry Andric   }
337*0b57cec5SDimitry Andric   // Kill estimate.
338*0b57cec5SDimitry Andric   for (unsigned i = 0, e = SU->getNode()->getNumOperands(); i != e; ++i) {
339*0b57cec5SDimitry Andric       const SDValue &Op = SU->getNode()->getOperand(i);
340*0b57cec5SDimitry Andric       MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
341*0b57cec5SDimitry Andric       if (isa<ConstantSDNode>(Op.getNode()))
342*0b57cec5SDimitry Andric         continue;
343*0b57cec5SDimitry Andric 
344*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT) && TLI->getRegClassFor(VT)
345*0b57cec5SDimitry Andric           && TLI->getRegClassFor(VT)->getID() == RCId)
346*0b57cec5SDimitry Andric         RegBalance -= numberRCValPredInSU(SU, RCId);
347*0b57cec5SDimitry Andric   }
348*0b57cec5SDimitry Andric   return RegBalance;
349*0b57cec5SDimitry Andric }
350*0b57cec5SDimitry Andric 
351*0b57cec5SDimitry Andric /// Estimates change in reg pressure from this SU.
352*0b57cec5SDimitry Andric /// It is achieved by trivial tracking of defined
353*0b57cec5SDimitry Andric /// and used vregs in dependent instructions.
354*0b57cec5SDimitry Andric /// The RawPressure flag makes this function to ignore
355*0b57cec5SDimitry Andric /// existing reg file sizes, and report raw def/use
356*0b57cec5SDimitry Andric /// balance.
regPressureDelta(SUnit * SU,bool RawPressure)357*0b57cec5SDimitry Andric int ResourcePriorityQueue::regPressureDelta(SUnit *SU, bool RawPressure) {
358*0b57cec5SDimitry Andric   int RegBalance = 0;
359*0b57cec5SDimitry Andric 
360*0b57cec5SDimitry Andric   if (!SU || !SU->getNode() || !SU->getNode()->isMachineOpcode())
361*0b57cec5SDimitry Andric     return RegBalance;
362*0b57cec5SDimitry Andric 
363*0b57cec5SDimitry Andric   if (RawPressure) {
364*0b57cec5SDimitry Andric     for (const TargetRegisterClass *RC : TRI->regclasses())
365*0b57cec5SDimitry Andric       RegBalance += rawRegPressureDelta(SU, RC->getID());
366*0b57cec5SDimitry Andric   }
367*0b57cec5SDimitry Andric   else {
368*0b57cec5SDimitry Andric     for (const TargetRegisterClass *RC : TRI->regclasses()) {
369*0b57cec5SDimitry Andric       if ((RegPressure[RC->getID()] +
370*0b57cec5SDimitry Andric            rawRegPressureDelta(SU, RC->getID()) > 0) &&
371*0b57cec5SDimitry Andric           (RegPressure[RC->getID()] +
372*0b57cec5SDimitry Andric            rawRegPressureDelta(SU, RC->getID())  >= RegLimit[RC->getID()]))
373*0b57cec5SDimitry Andric         RegBalance += rawRegPressureDelta(SU, RC->getID());
374*0b57cec5SDimitry Andric     }
375*0b57cec5SDimitry Andric   }
376*0b57cec5SDimitry Andric 
377*0b57cec5SDimitry Andric   return RegBalance;
378*0b57cec5SDimitry Andric }
379*0b57cec5SDimitry Andric 
380*0b57cec5SDimitry Andric // Constants used to denote relative importance of
381*0b57cec5SDimitry Andric // heuristic components for cost computation.
382*0b57cec5SDimitry Andric static const unsigned PriorityOne = 200;
383*0b57cec5SDimitry Andric static const unsigned PriorityTwo = 50;
384*0b57cec5SDimitry Andric static const unsigned PriorityThree = 15;
385*0b57cec5SDimitry Andric static const unsigned PriorityFour = 5;
386*0b57cec5SDimitry Andric static const unsigned ScaleOne = 20;
387*0b57cec5SDimitry Andric static const unsigned ScaleTwo = 10;
388*0b57cec5SDimitry Andric static const unsigned ScaleThree = 5;
389*0b57cec5SDimitry Andric static const unsigned FactorOne = 2;
390*0b57cec5SDimitry Andric 
391*0b57cec5SDimitry Andric /// Returns single number reflecting benefit of scheduling SU
392*0b57cec5SDimitry Andric /// in the current cycle.
SUSchedulingCost(SUnit * SU)393*0b57cec5SDimitry Andric int ResourcePriorityQueue::SUSchedulingCost(SUnit *SU) {
394*0b57cec5SDimitry Andric   // Initial trivial priority.
395*0b57cec5SDimitry Andric   int ResCount = 1;
396*0b57cec5SDimitry Andric 
397*0b57cec5SDimitry Andric   // Do not waste time on a node that is already scheduled.
398*0b57cec5SDimitry Andric   if (SU->isScheduled)
399*0b57cec5SDimitry Andric     return ResCount;
400*0b57cec5SDimitry Andric 
401*0b57cec5SDimitry Andric   // Forced priority is high.
402*0b57cec5SDimitry Andric   if (SU->isScheduleHigh)
403*0b57cec5SDimitry Andric     ResCount += PriorityOne;
404*0b57cec5SDimitry Andric 
405*0b57cec5SDimitry Andric   // Adaptable scheduling
406*0b57cec5SDimitry Andric   // A small, but very parallel
407*0b57cec5SDimitry Andric   // region, where reg pressure is an issue.
408*0b57cec5SDimitry Andric   if (HorizontalVerticalBalance > RegPressureThreshold) {
409*0b57cec5SDimitry Andric     // Critical path first
410*0b57cec5SDimitry Andric     ResCount += (SU->getHeight() * ScaleTwo);
411*0b57cec5SDimitry Andric     // If resources are available for it, multiply the
412*0b57cec5SDimitry Andric     // chance of scheduling.
413*0b57cec5SDimitry Andric     if (isResourceAvailable(SU))
414*0b57cec5SDimitry Andric       ResCount <<= FactorOne;
415*0b57cec5SDimitry Andric 
416*0b57cec5SDimitry Andric     // Consider change to reg pressure from scheduling
417*0b57cec5SDimitry Andric     // this SU.
418*0b57cec5SDimitry Andric     ResCount -= (regPressureDelta(SU,true) * ScaleOne);
419*0b57cec5SDimitry Andric   }
420*0b57cec5SDimitry Andric   // Default heuristic, greeady and
421*0b57cec5SDimitry Andric   // critical path driven.
422*0b57cec5SDimitry Andric   else {
423*0b57cec5SDimitry Andric     // Critical path first.
424*0b57cec5SDimitry Andric     ResCount += (SU->getHeight() * ScaleTwo);
425*0b57cec5SDimitry Andric     // Now see how many instructions is blocked by this SU.
426*0b57cec5SDimitry Andric     ResCount += (NumNodesSolelyBlocking[SU->NodeNum] * ScaleTwo);
427*0b57cec5SDimitry Andric     // If resources are available for it, multiply the
428*0b57cec5SDimitry Andric     // chance of scheduling.
429*0b57cec5SDimitry Andric     if (isResourceAvailable(SU))
430*0b57cec5SDimitry Andric       ResCount <<= FactorOne;
431*0b57cec5SDimitry Andric 
432*0b57cec5SDimitry Andric     ResCount -= (regPressureDelta(SU) * ScaleTwo);
433*0b57cec5SDimitry Andric   }
434*0b57cec5SDimitry Andric 
435*0b57cec5SDimitry Andric   // These are platform-specific things.
436*0b57cec5SDimitry Andric   // Will need to go into the back end
437*0b57cec5SDimitry Andric   // and accessed from here via a hook.
438*0b57cec5SDimitry Andric   for (SDNode *N = SU->getNode(); N; N = N->getGluedNode()) {
439*0b57cec5SDimitry Andric     if (N->isMachineOpcode()) {
440*0b57cec5SDimitry Andric       const MCInstrDesc &TID = TII->get(N->getMachineOpcode());
441*0b57cec5SDimitry Andric       if (TID.isCall())
442*0b57cec5SDimitry Andric         ResCount += (PriorityTwo + (ScaleThree*N->getNumValues()));
443*0b57cec5SDimitry Andric     }
444*0b57cec5SDimitry Andric     else
445*0b57cec5SDimitry Andric       switch (N->getOpcode()) {
446*0b57cec5SDimitry Andric       default:  break;
447*0b57cec5SDimitry Andric       case ISD::TokenFactor:
448*0b57cec5SDimitry Andric       case ISD::CopyFromReg:
449*0b57cec5SDimitry Andric       case ISD::CopyToReg:
450*0b57cec5SDimitry Andric         ResCount += PriorityFour;
451*0b57cec5SDimitry Andric         break;
452*0b57cec5SDimitry Andric 
453*0b57cec5SDimitry Andric       case ISD::INLINEASM:
454*0b57cec5SDimitry Andric       case ISD::INLINEASM_BR:
455*0b57cec5SDimitry Andric         ResCount += PriorityThree;
456*0b57cec5SDimitry Andric         break;
457*0b57cec5SDimitry Andric       }
458*0b57cec5SDimitry Andric   }
459*0b57cec5SDimitry Andric   return ResCount;
460*0b57cec5SDimitry Andric }
461*0b57cec5SDimitry Andric 
462*0b57cec5SDimitry Andric 
463*0b57cec5SDimitry Andric /// Main resource tracking point.
scheduledNode(SUnit * SU)464*0b57cec5SDimitry Andric void ResourcePriorityQueue::scheduledNode(SUnit *SU) {
465*0b57cec5SDimitry Andric   // Use NULL entry as an event marker to reset
466*0b57cec5SDimitry Andric   // the DFA state.
467*0b57cec5SDimitry Andric   if (!SU) {
468*0b57cec5SDimitry Andric     ResourcesModel->clearResources();
469*0b57cec5SDimitry Andric     Packet.clear();
470*0b57cec5SDimitry Andric     return;
471*0b57cec5SDimitry Andric   }
472*0b57cec5SDimitry Andric 
473*0b57cec5SDimitry Andric   const SDNode *ScegN = SU->getNode();
474*0b57cec5SDimitry Andric   // Update reg pressure tracking.
475*0b57cec5SDimitry Andric   // First update current node.
476*0b57cec5SDimitry Andric   if (ScegN->isMachineOpcode()) {
477*0b57cec5SDimitry Andric     // Estimate generated regs.
478*0b57cec5SDimitry Andric     for (unsigned i = 0, e = ScegN->getNumValues(); i != e; ++i) {
479*0b57cec5SDimitry Andric       MVT VT = ScegN->getSimpleValueType(i);
480*0b57cec5SDimitry Andric 
481*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT)) {
482*0b57cec5SDimitry Andric         const TargetRegisterClass *RC = TLI->getRegClassFor(VT);
483*0b57cec5SDimitry Andric         if (RC)
484*0b57cec5SDimitry Andric           RegPressure[RC->getID()] += numberRCValSuccInSU(SU, RC->getID());
485*0b57cec5SDimitry Andric       }
486*0b57cec5SDimitry Andric     }
487*0b57cec5SDimitry Andric     // Estimate killed regs.
488*0b57cec5SDimitry Andric     for (unsigned i = 0, e = ScegN->getNumOperands(); i != e; ++i) {
489*0b57cec5SDimitry Andric       const SDValue &Op = ScegN->getOperand(i);
490*0b57cec5SDimitry Andric       MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
491*0b57cec5SDimitry Andric 
492*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT)) {
493*0b57cec5SDimitry Andric         const TargetRegisterClass *RC = TLI->getRegClassFor(VT);
494*0b57cec5SDimitry Andric         if (RC) {
495*0b57cec5SDimitry Andric           if (RegPressure[RC->getID()] >
496*0b57cec5SDimitry Andric             (numberRCValPredInSU(SU, RC->getID())))
497*0b57cec5SDimitry Andric             RegPressure[RC->getID()] -= numberRCValPredInSU(SU, RC->getID());
498*0b57cec5SDimitry Andric           else RegPressure[RC->getID()] = 0;
499*0b57cec5SDimitry Andric         }
500*0b57cec5SDimitry Andric       }
501*0b57cec5SDimitry Andric     }
502*0b57cec5SDimitry Andric     for (SDep &Pred : SU->Preds) {
503*0b57cec5SDimitry Andric       if (Pred.isCtrl() || (Pred.getSUnit()->NumRegDefsLeft == 0))
504*0b57cec5SDimitry Andric         continue;
505*0b57cec5SDimitry Andric       --Pred.getSUnit()->NumRegDefsLeft;
506*0b57cec5SDimitry Andric     }
507*0b57cec5SDimitry Andric   }
508*0b57cec5SDimitry Andric 
509*0b57cec5SDimitry Andric   // Reserve resources for this SU.
510*0b57cec5SDimitry Andric   reserveResources(SU);
511*0b57cec5SDimitry Andric 
512*0b57cec5SDimitry Andric   // Adjust number of parallel live ranges.
513*0b57cec5SDimitry Andric   // Heuristic is simple - node with no data successors reduces
514*0b57cec5SDimitry Andric   // number of live ranges. All others, increase it.
515*0b57cec5SDimitry Andric   unsigned NumberNonControlDeps = 0;
516*0b57cec5SDimitry Andric 
517*0b57cec5SDimitry Andric   for (const SDep &Succ : SU->Succs) {
518*0b57cec5SDimitry Andric     adjustPriorityOfUnscheduledPreds(Succ.getSUnit());
519*0b57cec5SDimitry Andric     if (!Succ.isCtrl())
520*0b57cec5SDimitry Andric       NumberNonControlDeps++;
521*0b57cec5SDimitry Andric   }
522*0b57cec5SDimitry Andric 
523*0b57cec5SDimitry Andric   if (!NumberNonControlDeps) {
524*0b57cec5SDimitry Andric     if (ParallelLiveRanges >= SU->NumPreds)
525*0b57cec5SDimitry Andric       ParallelLiveRanges -= SU->NumPreds;
526*0b57cec5SDimitry Andric     else
527*0b57cec5SDimitry Andric       ParallelLiveRanges = 0;
528*0b57cec5SDimitry Andric 
529*0b57cec5SDimitry Andric   }
530*0b57cec5SDimitry Andric   else
531*0b57cec5SDimitry Andric     ParallelLiveRanges += SU->NumRegDefsLeft;
532*0b57cec5SDimitry Andric 
533*0b57cec5SDimitry Andric   // Track parallel live chains.
534*0b57cec5SDimitry Andric   HorizontalVerticalBalance += (SU->Succs.size() - numberCtrlDepsInSU(SU));
535*0b57cec5SDimitry Andric   HorizontalVerticalBalance -= (SU->Preds.size() - numberCtrlPredInSU(SU));
536*0b57cec5SDimitry Andric }
537*0b57cec5SDimitry Andric 
initNumRegDefsLeft(SUnit * SU)538*0b57cec5SDimitry Andric void ResourcePriorityQueue::initNumRegDefsLeft(SUnit *SU) {
539*0b57cec5SDimitry Andric   unsigned  NodeNumDefs = 0;
540*0b57cec5SDimitry Andric   for (SDNode *N = SU->getNode(); N; N = N->getGluedNode())
541*0b57cec5SDimitry Andric     if (N->isMachineOpcode()) {
542*0b57cec5SDimitry Andric       const MCInstrDesc &TID = TII->get(N->getMachineOpcode());
543*0b57cec5SDimitry Andric       // No register need be allocated for this.
544*0b57cec5SDimitry Andric       if (N->getMachineOpcode() == TargetOpcode::IMPLICIT_DEF) {
545*0b57cec5SDimitry Andric         NodeNumDefs = 0;
546*0b57cec5SDimitry Andric         break;
547*0b57cec5SDimitry Andric       }
548*0b57cec5SDimitry Andric       NodeNumDefs = std::min(N->getNumValues(), TID.getNumDefs());
549*0b57cec5SDimitry Andric     }
550*0b57cec5SDimitry Andric     else
551*0b57cec5SDimitry Andric       switch(N->getOpcode()) {
552*0b57cec5SDimitry Andric         default:     break;
553*0b57cec5SDimitry Andric         case ISD::CopyFromReg:
554*0b57cec5SDimitry Andric           NodeNumDefs++;
555*0b57cec5SDimitry Andric           break;
556*0b57cec5SDimitry Andric         case ISD::INLINEASM:
557*0b57cec5SDimitry Andric         case ISD::INLINEASM_BR:
558*0b57cec5SDimitry Andric           NodeNumDefs++;
559*0b57cec5SDimitry Andric           break;
560*0b57cec5SDimitry Andric       }
561*0b57cec5SDimitry Andric 
562*0b57cec5SDimitry Andric   SU->NumRegDefsLeft = NodeNumDefs;
563*0b57cec5SDimitry Andric }
564*0b57cec5SDimitry Andric 
565*0b57cec5SDimitry Andric /// adjustPriorityOfUnscheduledPreds - One of the predecessors of SU was just
566*0b57cec5SDimitry Andric /// scheduled.  If SU is not itself available, then there is at least one
567*0b57cec5SDimitry Andric /// predecessor node that has not been scheduled yet.  If SU has exactly ONE
568*0b57cec5SDimitry Andric /// unscheduled predecessor, we want to increase its priority: it getting
569*0b57cec5SDimitry Andric /// scheduled will make this node available, so it is better than some other
570*0b57cec5SDimitry Andric /// node of the same priority that will not make a node available.
adjustPriorityOfUnscheduledPreds(SUnit * SU)571*0b57cec5SDimitry Andric void ResourcePriorityQueue::adjustPriorityOfUnscheduledPreds(SUnit *SU) {
572*0b57cec5SDimitry Andric   if (SU->isAvailable) return;  // All preds scheduled.
573*0b57cec5SDimitry Andric 
574*0b57cec5SDimitry Andric   SUnit *OnlyAvailablePred = getSingleUnscheduledPred(SU);
575*0b57cec5SDimitry Andric   if (!OnlyAvailablePred || !OnlyAvailablePred->isAvailable)
576*0b57cec5SDimitry Andric     return;
577*0b57cec5SDimitry Andric 
578*0b57cec5SDimitry Andric   // Okay, we found a single predecessor that is available, but not scheduled.
579*0b57cec5SDimitry Andric   // Since it is available, it must be in the priority queue.  First remove it.
580*0b57cec5SDimitry Andric   remove(OnlyAvailablePred);
581*0b57cec5SDimitry Andric 
582*0b57cec5SDimitry Andric   // Reinsert the node into the priority queue, which recomputes its
583*0b57cec5SDimitry Andric   // NumNodesSolelyBlocking value.
584*0b57cec5SDimitry Andric   push(OnlyAvailablePred);
585*0b57cec5SDimitry Andric }
586*0b57cec5SDimitry Andric 
587*0b57cec5SDimitry Andric 
588*0b57cec5SDimitry Andric /// Main access point - returns next instructions
589*0b57cec5SDimitry Andric /// to be placed in scheduling sequence.
pop()590*0b57cec5SDimitry Andric SUnit *ResourcePriorityQueue::pop() {
591*0b57cec5SDimitry Andric   if (empty())
592*0b57cec5SDimitry Andric     return nullptr;
593*0b57cec5SDimitry Andric 
594*0b57cec5SDimitry Andric   std::vector<SUnit *>::iterator Best = Queue.begin();
595*0b57cec5SDimitry Andric   if (!DisableDFASched) {
596*0b57cec5SDimitry Andric     int BestCost = SUSchedulingCost(*Best);
597*0b57cec5SDimitry Andric     for (auto I = std::next(Queue.begin()), E = Queue.end(); I != E; ++I) {
598*0b57cec5SDimitry Andric 
599*0b57cec5SDimitry Andric       if (SUSchedulingCost(*I) > BestCost) {
600*0b57cec5SDimitry Andric         BestCost = SUSchedulingCost(*I);
601*0b57cec5SDimitry Andric         Best = I;
602*0b57cec5SDimitry Andric       }
603*0b57cec5SDimitry Andric     }
604*0b57cec5SDimitry Andric   }
605*0b57cec5SDimitry Andric   // Use default TD scheduling mechanism.
606*0b57cec5SDimitry Andric   else {
607*0b57cec5SDimitry Andric     for (auto I = std::next(Queue.begin()), E = Queue.end(); I != E; ++I)
608*0b57cec5SDimitry Andric       if (Picker(*Best, *I))
609*0b57cec5SDimitry Andric         Best = I;
610*0b57cec5SDimitry Andric   }
611*0b57cec5SDimitry Andric 
612*0b57cec5SDimitry Andric   SUnit *V = *Best;
613*0b57cec5SDimitry Andric   if (Best != std::prev(Queue.end()))
614*0b57cec5SDimitry Andric     std::swap(*Best, Queue.back());
615*0b57cec5SDimitry Andric 
616*0b57cec5SDimitry Andric   Queue.pop_back();
617*0b57cec5SDimitry Andric 
618*0b57cec5SDimitry Andric   return V;
619*0b57cec5SDimitry Andric }
620*0b57cec5SDimitry Andric 
621*0b57cec5SDimitry Andric 
remove(SUnit * SU)622*0b57cec5SDimitry Andric void ResourcePriorityQueue::remove(SUnit *SU) {
623*0b57cec5SDimitry Andric   assert(!Queue.empty() && "Queue is empty!");
624*0b57cec5SDimitry Andric   std::vector<SUnit *>::iterator I = find(Queue, SU);
625*0b57cec5SDimitry Andric   if (I != std::prev(Queue.end()))
626     std::swap(*I, Queue.back());
627 
628   Queue.pop_back();
629 }
630