1*0b57cec5SDimitry Andric //===- ResourcePriorityQueue.cpp - A DFA-oriented priority queue -*- C++ -*-==//
2*0b57cec5SDimitry Andric //
3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*0b57cec5SDimitry Andric //
7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
8*0b57cec5SDimitry Andric //
9*0b57cec5SDimitry Andric // This file implements the ResourcePriorityQueue class, which is a
10*0b57cec5SDimitry Andric // SchedulingPriorityQueue that prioritizes instructions using DFA state to
11*0b57cec5SDimitry Andric // reduce the length of the critical path through the basic block
12*0b57cec5SDimitry Andric // on VLIW platforms.
13*0b57cec5SDimitry Andric // The scheduler is basically a top-down adaptable list scheduler with DFA
14*0b57cec5SDimitry Andric // resource tracking added to the cost function.
15*0b57cec5SDimitry Andric // DFA is queried as a state machine to model "packets/bundles" during
16*0b57cec5SDimitry Andric // schedule. Currently packets/bundles are discarded at the end of
17*0b57cec5SDimitry Andric // scheduling, affecting only order of instructions.
18*0b57cec5SDimitry Andric //
19*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
20*0b57cec5SDimitry Andric 
21*0b57cec5SDimitry Andric #include "llvm/CodeGen/ResourcePriorityQueue.h"
22*0b57cec5SDimitry Andric #include "llvm/CodeGen/DFAPacketizer.h"
23*0b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGISel.h"
24*0b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGNodes.h"
25*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetInstrInfo.h"
26*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetLowering.h"
27*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetRegisterInfo.h"
28*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetSubtargetInfo.h"
29*0b57cec5SDimitry Andric #include "llvm/Support/CommandLine.h"
30*0b57cec5SDimitry Andric 
31*0b57cec5SDimitry Andric using namespace llvm;
32*0b57cec5SDimitry Andric 
33*0b57cec5SDimitry Andric #define DEBUG_TYPE "scheduler"
34*0b57cec5SDimitry Andric 
35*0b57cec5SDimitry Andric static cl::opt<bool>
36*0b57cec5SDimitry Andric     DisableDFASched("disable-dfa-sched", cl::Hidden,
37*0b57cec5SDimitry Andric                     cl::desc("Disable use of DFA during scheduling"));
38*0b57cec5SDimitry Andric 
39*0b57cec5SDimitry Andric static cl::opt<int> RegPressureThreshold(
40*0b57cec5SDimitry Andric     "dfa-sched-reg-pressure-threshold", cl::Hidden, cl::init(5),
41*0b57cec5SDimitry Andric     cl::desc("Track reg pressure and switch priority to in-depth"));
42*0b57cec5SDimitry Andric 
ResourcePriorityQueue(SelectionDAGISel * IS)43*0b57cec5SDimitry Andric ResourcePriorityQueue::ResourcePriorityQueue(SelectionDAGISel *IS)
44*0b57cec5SDimitry Andric     : Picker(this), InstrItins(IS->MF->getSubtarget().getInstrItineraryData()) {
45*0b57cec5SDimitry Andric   const TargetSubtargetInfo &STI = IS->MF->getSubtarget();
46*0b57cec5SDimitry Andric   TRI = STI.getRegisterInfo();
47*0b57cec5SDimitry Andric   TLI = IS->TLI;
48*0b57cec5SDimitry Andric   TII = STI.getInstrInfo();
49*0b57cec5SDimitry Andric   ResourcesModel.reset(TII->CreateTargetScheduleState(STI));
50*0b57cec5SDimitry Andric   // This hard requirement could be relaxed, but for now
51*0b57cec5SDimitry Andric   // do not let it proceed.
52*0b57cec5SDimitry Andric   assert(ResourcesModel && "Unimplemented CreateTargetScheduleState.");
53*0b57cec5SDimitry Andric 
54*0b57cec5SDimitry Andric   unsigned NumRC = TRI->getNumRegClasses();
55*0b57cec5SDimitry Andric   RegLimit.resize(NumRC);
56*0b57cec5SDimitry Andric   RegPressure.resize(NumRC);
57*0b57cec5SDimitry Andric   std::fill(RegLimit.begin(), RegLimit.end(), 0);
58*0b57cec5SDimitry Andric   std::fill(RegPressure.begin(), RegPressure.end(), 0);
59*0b57cec5SDimitry Andric   for (const TargetRegisterClass *RC : TRI->regclasses())
60*0b57cec5SDimitry Andric     RegLimit[RC->getID()] = TRI->getRegPressureLimit(RC, *IS->MF);
61*0b57cec5SDimitry Andric 
62*0b57cec5SDimitry Andric   ParallelLiveRanges = 0;
63*0b57cec5SDimitry Andric   HorizontalVerticalBalance = 0;
64*0b57cec5SDimitry Andric }
65*0b57cec5SDimitry Andric 
66*0b57cec5SDimitry Andric unsigned
numberRCValPredInSU(SUnit * SU,unsigned RCId)67*0b57cec5SDimitry Andric ResourcePriorityQueue::numberRCValPredInSU(SUnit *SU, unsigned RCId) {
68*0b57cec5SDimitry Andric   unsigned NumberDeps = 0;
69*0b57cec5SDimitry Andric   for (SDep &Pred : SU->Preds) {
70*0b57cec5SDimitry Andric     if (Pred.isCtrl())
71*0b57cec5SDimitry Andric       continue;
72*0b57cec5SDimitry Andric 
73*0b57cec5SDimitry Andric     SUnit *PredSU = Pred.getSUnit();
74*0b57cec5SDimitry Andric     const SDNode *ScegN = PredSU->getNode();
75*0b57cec5SDimitry Andric 
76*0b57cec5SDimitry Andric     if (!ScegN)
77*0b57cec5SDimitry Andric       continue;
78*0b57cec5SDimitry Andric 
79*0b57cec5SDimitry Andric     // If value is passed to CopyToReg, it is probably
80*0b57cec5SDimitry Andric     // live outside BB.
81*0b57cec5SDimitry Andric     switch (ScegN->getOpcode()) {
82*0b57cec5SDimitry Andric       default:  break;
83*0b57cec5SDimitry Andric       case ISD::TokenFactor:    break;
84*0b57cec5SDimitry Andric       case ISD::CopyFromReg:    NumberDeps++;  break;
85*0b57cec5SDimitry Andric       case ISD::CopyToReg:      break;
86*0b57cec5SDimitry Andric       case ISD::INLINEASM:      break;
87*0b57cec5SDimitry Andric       case ISD::INLINEASM_BR:   break;
88*0b57cec5SDimitry Andric     }
89*0b57cec5SDimitry Andric     if (!ScegN->isMachineOpcode())
90*0b57cec5SDimitry Andric       continue;
91*0b57cec5SDimitry Andric 
92*0b57cec5SDimitry Andric     for (unsigned i = 0, e = ScegN->getNumValues(); i != e; ++i) {
93*0b57cec5SDimitry Andric       MVT VT = ScegN->getSimpleValueType(i);
94*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT)
95*0b57cec5SDimitry Andric           && (TLI->getRegClassFor(VT)->getID() == RCId)) {
96*0b57cec5SDimitry Andric         NumberDeps++;
97*0b57cec5SDimitry Andric         break;
98*0b57cec5SDimitry Andric       }
99*0b57cec5SDimitry Andric     }
100*0b57cec5SDimitry Andric   }
101*0b57cec5SDimitry Andric   return NumberDeps;
102*0b57cec5SDimitry Andric }
103*0b57cec5SDimitry Andric 
numberRCValSuccInSU(SUnit * SU,unsigned RCId)104*0b57cec5SDimitry Andric unsigned ResourcePriorityQueue::numberRCValSuccInSU(SUnit *SU,
105*0b57cec5SDimitry Andric                                                     unsigned RCId) {
106*0b57cec5SDimitry Andric   unsigned NumberDeps = 0;
107*0b57cec5SDimitry Andric   for (const SDep &Succ : SU->Succs) {
108*0b57cec5SDimitry Andric     if (Succ.isCtrl())
109*0b57cec5SDimitry Andric       continue;
110*0b57cec5SDimitry Andric 
111*0b57cec5SDimitry Andric     SUnit *SuccSU = Succ.getSUnit();
112*0b57cec5SDimitry Andric     const SDNode *ScegN = SuccSU->getNode();
113*0b57cec5SDimitry Andric     if (!ScegN)
114*0b57cec5SDimitry Andric       continue;
115*0b57cec5SDimitry Andric 
116*0b57cec5SDimitry Andric     // If value is passed to CopyToReg, it is probably
117*0b57cec5SDimitry Andric     // live outside BB.
118*0b57cec5SDimitry Andric     switch (ScegN->getOpcode()) {
119*0b57cec5SDimitry Andric       default:  break;
120*0b57cec5SDimitry Andric       case ISD::TokenFactor:    break;
121*0b57cec5SDimitry Andric       case ISD::CopyFromReg:    break;
122*0b57cec5SDimitry Andric       case ISD::CopyToReg:      NumberDeps++;  break;
123*0b57cec5SDimitry Andric       case ISD::INLINEASM:      break;
124*0b57cec5SDimitry Andric       case ISD::INLINEASM_BR:   break;
125*0b57cec5SDimitry Andric     }
126*0b57cec5SDimitry Andric     if (!ScegN->isMachineOpcode())
127*0b57cec5SDimitry Andric       continue;
128*0b57cec5SDimitry Andric 
129*0b57cec5SDimitry Andric     for (unsigned i = 0, e = ScegN->getNumOperands(); i != e; ++i) {
130*0b57cec5SDimitry Andric       const SDValue &Op = ScegN->getOperand(i);
131*0b57cec5SDimitry Andric       MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
132*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT)
133*0b57cec5SDimitry Andric           && (TLI->getRegClassFor(VT)->getID() == RCId)) {
134*0b57cec5SDimitry Andric         NumberDeps++;
135*0b57cec5SDimitry Andric         break;
136*0b57cec5SDimitry Andric       }
137*0b57cec5SDimitry Andric     }
138*0b57cec5SDimitry Andric   }
139*0b57cec5SDimitry Andric   return NumberDeps;
140*0b57cec5SDimitry Andric }
141*0b57cec5SDimitry Andric 
numberCtrlDepsInSU(SUnit * SU)142*0b57cec5SDimitry Andric static unsigned numberCtrlDepsInSU(SUnit *SU) {
143*0b57cec5SDimitry Andric   unsigned NumberDeps = 0;
144*0b57cec5SDimitry Andric   for (const SDep &Succ : SU->Succs)
145*0b57cec5SDimitry Andric     if (Succ.isCtrl())
146*0b57cec5SDimitry Andric       NumberDeps++;
147*0b57cec5SDimitry Andric 
148*0b57cec5SDimitry Andric   return NumberDeps;
149*0b57cec5SDimitry Andric }
150*0b57cec5SDimitry Andric 
numberCtrlPredInSU(SUnit * SU)151*0b57cec5SDimitry Andric static unsigned numberCtrlPredInSU(SUnit *SU) {
152*0b57cec5SDimitry Andric   unsigned NumberDeps = 0;
153*0b57cec5SDimitry Andric   for (SDep &Pred : SU->Preds)
154*0b57cec5SDimitry Andric     if (Pred.isCtrl())
155*0b57cec5SDimitry Andric       NumberDeps++;
156*0b57cec5SDimitry Andric 
157*0b57cec5SDimitry Andric   return NumberDeps;
158*0b57cec5SDimitry Andric }
159*0b57cec5SDimitry Andric 
160*0b57cec5SDimitry Andric ///
161*0b57cec5SDimitry Andric /// Initialize nodes.
162*0b57cec5SDimitry Andric ///
initNodes(std::vector<SUnit> & sunits)163*0b57cec5SDimitry Andric void ResourcePriorityQueue::initNodes(std::vector<SUnit> &sunits) {
164*0b57cec5SDimitry Andric   SUnits = &sunits;
165*0b57cec5SDimitry Andric   NumNodesSolelyBlocking.resize(SUnits->size(), 0);
166*0b57cec5SDimitry Andric 
167*0b57cec5SDimitry Andric   for (SUnit &SU : *SUnits) {
168*0b57cec5SDimitry Andric     initNumRegDefsLeft(&SU);
169*0b57cec5SDimitry Andric     SU.NodeQueueId = 0;
170*0b57cec5SDimitry Andric   }
171*0b57cec5SDimitry Andric }
172*0b57cec5SDimitry Andric 
173*0b57cec5SDimitry Andric /// This heuristic is used if DFA scheduling is not desired
174*0b57cec5SDimitry Andric /// for some VLIW platform.
operator ()(const SUnit * LHS,const SUnit * RHS) const175*0b57cec5SDimitry Andric bool resource_sort::operator()(const SUnit *LHS, const SUnit *RHS) const {
176*0b57cec5SDimitry Andric   // The isScheduleHigh flag allows nodes with wraparound dependencies that
177*0b57cec5SDimitry Andric   // cannot easily be modeled as edges with latencies to be scheduled as
178*0b57cec5SDimitry Andric   // soon as possible in a top-down schedule.
179*0b57cec5SDimitry Andric   if (LHS->isScheduleHigh && !RHS->isScheduleHigh)
180*0b57cec5SDimitry Andric     return false;
181*0b57cec5SDimitry Andric 
182*0b57cec5SDimitry Andric   if (!LHS->isScheduleHigh && RHS->isScheduleHigh)
183*0b57cec5SDimitry Andric     return true;
184*0b57cec5SDimitry Andric 
185*0b57cec5SDimitry Andric   unsigned LHSNum = LHS->NodeNum;
186*0b57cec5SDimitry Andric   unsigned RHSNum = RHS->NodeNum;
187*0b57cec5SDimitry Andric 
188*0b57cec5SDimitry Andric   // The most important heuristic is scheduling the critical path.
189*0b57cec5SDimitry Andric   unsigned LHSLatency = PQ->getLatency(LHSNum);
190*0b57cec5SDimitry Andric   unsigned RHSLatency = PQ->getLatency(RHSNum);
191*0b57cec5SDimitry Andric   if (LHSLatency < RHSLatency) return true;
192*0b57cec5SDimitry Andric   if (LHSLatency > RHSLatency) return false;
193*0b57cec5SDimitry Andric 
194*0b57cec5SDimitry Andric   // After that, if two nodes have identical latencies, look to see if one will
195*0b57cec5SDimitry Andric   // unblock more other nodes than the other.
196*0b57cec5SDimitry Andric   unsigned LHSBlocked = PQ->getNumSolelyBlockNodes(LHSNum);
197*0b57cec5SDimitry Andric   unsigned RHSBlocked = PQ->getNumSolelyBlockNodes(RHSNum);
198*0b57cec5SDimitry Andric   if (LHSBlocked < RHSBlocked) return true;
199*0b57cec5SDimitry Andric   if (LHSBlocked > RHSBlocked) return false;
200*0b57cec5SDimitry Andric 
201*0b57cec5SDimitry Andric   // Finally, just to provide a stable ordering, use the node number as a
202*0b57cec5SDimitry Andric   // deciding factor.
203*0b57cec5SDimitry Andric   return LHSNum < RHSNum;
204*0b57cec5SDimitry Andric }
205*0b57cec5SDimitry Andric 
206*0b57cec5SDimitry Andric 
207*0b57cec5SDimitry Andric /// getSingleUnscheduledPred - If there is exactly one unscheduled predecessor
208*0b57cec5SDimitry Andric /// of SU, return it, otherwise return null.
getSingleUnscheduledPred(SUnit * SU)209*0b57cec5SDimitry Andric SUnit *ResourcePriorityQueue::getSingleUnscheduledPred(SUnit *SU) {
210*0b57cec5SDimitry Andric   SUnit *OnlyAvailablePred = nullptr;
211*0b57cec5SDimitry Andric   for (const SDep &Pred : SU->Preds) {
212*0b57cec5SDimitry Andric     SUnit &PredSU = *Pred.getSUnit();
213*0b57cec5SDimitry Andric     if (!PredSU.isScheduled) {
214*0b57cec5SDimitry Andric       // We found an available, but not scheduled, predecessor.  If it's the
215*0b57cec5SDimitry Andric       // only one we have found, keep track of it... otherwise give up.
216*0b57cec5SDimitry Andric       if (OnlyAvailablePred && OnlyAvailablePred != &PredSU)
217*0b57cec5SDimitry Andric         return nullptr;
218*0b57cec5SDimitry Andric       OnlyAvailablePred = &PredSU;
219*0b57cec5SDimitry Andric     }
220*0b57cec5SDimitry Andric   }
221*0b57cec5SDimitry Andric   return OnlyAvailablePred;
222*0b57cec5SDimitry Andric }
223*0b57cec5SDimitry Andric 
push(SUnit * SU)224*0b57cec5SDimitry Andric void ResourcePriorityQueue::push(SUnit *SU) {
225*0b57cec5SDimitry Andric   // Look at all of the successors of this node.  Count the number of nodes that
226*0b57cec5SDimitry Andric   // this node is the sole unscheduled node for.
227*0b57cec5SDimitry Andric   unsigned NumNodesBlocking = 0;
228*0b57cec5SDimitry Andric   for (const SDep &Succ : SU->Succs)
229*0b57cec5SDimitry Andric     if (getSingleUnscheduledPred(Succ.getSUnit()) == SU)
230*0b57cec5SDimitry Andric       ++NumNodesBlocking;
231*0b57cec5SDimitry Andric 
232*0b57cec5SDimitry Andric   NumNodesSolelyBlocking[SU->NodeNum] = NumNodesBlocking;
233*0b57cec5SDimitry Andric   Queue.push_back(SU);
234*0b57cec5SDimitry Andric }
235*0b57cec5SDimitry Andric 
236*0b57cec5SDimitry Andric /// Check if scheduling of this SU is possible
237*0b57cec5SDimitry Andric /// in the current packet.
isResourceAvailable(SUnit * SU)238*0b57cec5SDimitry Andric bool ResourcePriorityQueue::isResourceAvailable(SUnit *SU) {
239*0b57cec5SDimitry Andric   if (!SU || !SU->getNode())
240*0b57cec5SDimitry Andric     return false;
241*0b57cec5SDimitry Andric 
242*0b57cec5SDimitry Andric   // If this is a compound instruction,
243*0b57cec5SDimitry Andric   // it is likely to be a call. Do not delay it.
244*0b57cec5SDimitry Andric   if (SU->getNode()->getGluedNode())
245*0b57cec5SDimitry Andric     return true;
246*0b57cec5SDimitry Andric 
247*0b57cec5SDimitry Andric   // First see if the pipeline could receive this instruction
248*0b57cec5SDimitry Andric   // in the current cycle.
249*0b57cec5SDimitry Andric   if (SU->getNode()->isMachineOpcode())
250*0b57cec5SDimitry Andric     switch (SU->getNode()->getMachineOpcode()) {
251*0b57cec5SDimitry Andric     default:
252*0b57cec5SDimitry Andric       if (!ResourcesModel->canReserveResources(&TII->get(
253*0b57cec5SDimitry Andric           SU->getNode()->getMachineOpcode())))
254*0b57cec5SDimitry Andric            return false;
255*0b57cec5SDimitry Andric       break;
256*0b57cec5SDimitry Andric     case TargetOpcode::EXTRACT_SUBREG:
257*0b57cec5SDimitry Andric     case TargetOpcode::INSERT_SUBREG:
258*0b57cec5SDimitry Andric     case TargetOpcode::SUBREG_TO_REG:
259*0b57cec5SDimitry Andric     case TargetOpcode::REG_SEQUENCE:
260*0b57cec5SDimitry Andric     case TargetOpcode::IMPLICIT_DEF:
261*0b57cec5SDimitry Andric         break;
262*0b57cec5SDimitry Andric     }
263*0b57cec5SDimitry Andric 
264*0b57cec5SDimitry Andric   // Now see if there are no other dependencies
265*0b57cec5SDimitry Andric   // to instructions already in the packet.
266*0b57cec5SDimitry Andric   for (const SUnit *S : Packet)
267*0b57cec5SDimitry Andric     for (const SDep &Succ : S->Succs) {
268*0b57cec5SDimitry Andric       // Since we do not add pseudos to packets, might as well
269*0b57cec5SDimitry Andric       // ignore order deps.
270*0b57cec5SDimitry Andric       if (Succ.isCtrl())
271*0b57cec5SDimitry Andric         continue;
272*0b57cec5SDimitry Andric 
273*0b57cec5SDimitry Andric       if (Succ.getSUnit() == SU)
274*0b57cec5SDimitry Andric         return false;
275*0b57cec5SDimitry Andric     }
276*0b57cec5SDimitry Andric 
277*0b57cec5SDimitry Andric   return true;
278*0b57cec5SDimitry Andric }
279*0b57cec5SDimitry Andric 
280*0b57cec5SDimitry Andric /// Keep track of available resources.
reserveResources(SUnit * SU)281*0b57cec5SDimitry Andric void ResourcePriorityQueue::reserveResources(SUnit *SU) {
282*0b57cec5SDimitry Andric   // If this SU does not fit in the packet
283*0b57cec5SDimitry Andric   // start a new one.
284*0b57cec5SDimitry Andric   if (!isResourceAvailable(SU) || SU->getNode()->getGluedNode()) {
285*0b57cec5SDimitry Andric     ResourcesModel->clearResources();
286*0b57cec5SDimitry Andric     Packet.clear();
287*0b57cec5SDimitry Andric   }
288*0b57cec5SDimitry Andric 
289*0b57cec5SDimitry Andric   if (SU->getNode() && SU->getNode()->isMachineOpcode()) {
290*0b57cec5SDimitry Andric     switch (SU->getNode()->getMachineOpcode()) {
291*0b57cec5SDimitry Andric     default:
292*0b57cec5SDimitry Andric       ResourcesModel->reserveResources(&TII->get(
293*0b57cec5SDimitry Andric         SU->getNode()->getMachineOpcode()));
294*0b57cec5SDimitry Andric       break;
295*0b57cec5SDimitry Andric     case TargetOpcode::EXTRACT_SUBREG:
296*0b57cec5SDimitry Andric     case TargetOpcode::INSERT_SUBREG:
297*0b57cec5SDimitry Andric     case TargetOpcode::SUBREG_TO_REG:
298*0b57cec5SDimitry Andric     case TargetOpcode::REG_SEQUENCE:
299*0b57cec5SDimitry Andric     case TargetOpcode::IMPLICIT_DEF:
300*0b57cec5SDimitry Andric       break;
301*0b57cec5SDimitry Andric     }
302*0b57cec5SDimitry Andric     Packet.push_back(SU);
303*0b57cec5SDimitry Andric   }
304*0b57cec5SDimitry Andric   // Forcefully end packet for PseudoOps.
305*0b57cec5SDimitry Andric   else {
306*0b57cec5SDimitry Andric     ResourcesModel->clearResources();
307*0b57cec5SDimitry Andric     Packet.clear();
308*0b57cec5SDimitry Andric   }
309*0b57cec5SDimitry Andric 
310*0b57cec5SDimitry Andric   // If packet is now full, reset the state so in the next cycle
311*0b57cec5SDimitry Andric   // we start fresh.
312*0b57cec5SDimitry Andric   if (Packet.size() >= InstrItins->SchedModel.IssueWidth) {
313*0b57cec5SDimitry Andric     ResourcesModel->clearResources();
314*0b57cec5SDimitry Andric     Packet.clear();
315*0b57cec5SDimitry Andric   }
316*0b57cec5SDimitry Andric }
317*0b57cec5SDimitry Andric 
rawRegPressureDelta(SUnit * SU,unsigned RCId)318*0b57cec5SDimitry Andric int ResourcePriorityQueue::rawRegPressureDelta(SUnit *SU, unsigned RCId) {
319*0b57cec5SDimitry Andric   int RegBalance = 0;
320*0b57cec5SDimitry Andric 
321*0b57cec5SDimitry Andric   if (!SU || !SU->getNode() || !SU->getNode()->isMachineOpcode())
322*0b57cec5SDimitry Andric     return RegBalance;
323*0b57cec5SDimitry Andric 
324*0b57cec5SDimitry Andric   // Gen estimate.
325*0b57cec5SDimitry Andric   for (unsigned i = 0, e = SU->getNode()->getNumValues(); i != e; ++i) {
326*0b57cec5SDimitry Andric       MVT VT = SU->getNode()->getSimpleValueType(i);
327*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT)
328*0b57cec5SDimitry Andric           && TLI->getRegClassFor(VT)
329*0b57cec5SDimitry Andric           && TLI->getRegClassFor(VT)->getID() == RCId)
330*0b57cec5SDimitry Andric         RegBalance += numberRCValSuccInSU(SU, RCId);
331*0b57cec5SDimitry Andric   }
332*0b57cec5SDimitry Andric   // Kill estimate.
333*0b57cec5SDimitry Andric   for (unsigned i = 0, e = SU->getNode()->getNumOperands(); i != e; ++i) {
334*0b57cec5SDimitry Andric       const SDValue &Op = SU->getNode()->getOperand(i);
335*0b57cec5SDimitry Andric       MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
336*0b57cec5SDimitry Andric       if (isa<ConstantSDNode>(Op.getNode()))
337*0b57cec5SDimitry Andric         continue;
338*0b57cec5SDimitry Andric 
339*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT) && TLI->getRegClassFor(VT)
340*0b57cec5SDimitry Andric           && TLI->getRegClassFor(VT)->getID() == RCId)
341*0b57cec5SDimitry Andric         RegBalance -= numberRCValPredInSU(SU, RCId);
342*0b57cec5SDimitry Andric   }
343*0b57cec5SDimitry Andric   return RegBalance;
344*0b57cec5SDimitry Andric }
345*0b57cec5SDimitry Andric 
346*0b57cec5SDimitry Andric /// Estimates change in reg pressure from this SU.
347*0b57cec5SDimitry Andric /// It is achieved by trivial tracking of defined
348*0b57cec5SDimitry Andric /// and used vregs in dependent instructions.
349*0b57cec5SDimitry Andric /// The RawPressure flag makes this function to ignore
350*0b57cec5SDimitry Andric /// existing reg file sizes, and report raw def/use
351*0b57cec5SDimitry Andric /// balance.
regPressureDelta(SUnit * SU,bool RawPressure)352*0b57cec5SDimitry Andric int ResourcePriorityQueue::regPressureDelta(SUnit *SU, bool RawPressure) {
353*0b57cec5SDimitry Andric   int RegBalance = 0;
354*0b57cec5SDimitry Andric 
355*0b57cec5SDimitry Andric   if (!SU || !SU->getNode() || !SU->getNode()->isMachineOpcode())
356*0b57cec5SDimitry Andric     return RegBalance;
357*0b57cec5SDimitry Andric 
358*0b57cec5SDimitry Andric   if (RawPressure) {
359*0b57cec5SDimitry Andric     for (const TargetRegisterClass *RC : TRI->regclasses())
360*0b57cec5SDimitry Andric       RegBalance += rawRegPressureDelta(SU, RC->getID());
361*0b57cec5SDimitry Andric   }
362*0b57cec5SDimitry Andric   else {
363*0b57cec5SDimitry Andric     for (const TargetRegisterClass *RC : TRI->regclasses()) {
364*0b57cec5SDimitry Andric       if ((RegPressure[RC->getID()] +
365*0b57cec5SDimitry Andric            rawRegPressureDelta(SU, RC->getID()) > 0) &&
366*0b57cec5SDimitry Andric           (RegPressure[RC->getID()] +
367*0b57cec5SDimitry Andric            rawRegPressureDelta(SU, RC->getID())  >= RegLimit[RC->getID()]))
368*0b57cec5SDimitry Andric         RegBalance += rawRegPressureDelta(SU, RC->getID());
369*0b57cec5SDimitry Andric     }
370*0b57cec5SDimitry Andric   }
371*0b57cec5SDimitry Andric 
372*0b57cec5SDimitry Andric   return RegBalance;
373*0b57cec5SDimitry Andric }
374*0b57cec5SDimitry Andric 
375*0b57cec5SDimitry Andric // Constants used to denote relative importance of
376*0b57cec5SDimitry Andric // heuristic components for cost computation.
377*0b57cec5SDimitry Andric static const unsigned PriorityOne = 200;
378*0b57cec5SDimitry Andric static const unsigned PriorityTwo = 50;
379*0b57cec5SDimitry Andric static const unsigned PriorityThree = 15;
380*0b57cec5SDimitry Andric static const unsigned PriorityFour = 5;
381*0b57cec5SDimitry Andric static const unsigned ScaleOne = 20;
382*0b57cec5SDimitry Andric static const unsigned ScaleTwo = 10;
383*0b57cec5SDimitry Andric static const unsigned ScaleThree = 5;
384*0b57cec5SDimitry Andric static const unsigned FactorOne = 2;
385*0b57cec5SDimitry Andric 
386*0b57cec5SDimitry Andric /// Returns single number reflecting benefit of scheduling SU
387*0b57cec5SDimitry Andric /// in the current cycle.
SUSchedulingCost(SUnit * SU)388*0b57cec5SDimitry Andric int ResourcePriorityQueue::SUSchedulingCost(SUnit *SU) {
389*0b57cec5SDimitry Andric   // Initial trivial priority.
390*0b57cec5SDimitry Andric   int ResCount = 1;
391*0b57cec5SDimitry Andric 
392*0b57cec5SDimitry Andric   // Do not waste time on a node that is already scheduled.
393*0b57cec5SDimitry Andric   if (SU->isScheduled)
394*0b57cec5SDimitry Andric     return ResCount;
395*0b57cec5SDimitry Andric 
396*0b57cec5SDimitry Andric   // Forced priority is high.
397*0b57cec5SDimitry Andric   if (SU->isScheduleHigh)
398*0b57cec5SDimitry Andric     ResCount += PriorityOne;
399*0b57cec5SDimitry Andric 
400*0b57cec5SDimitry Andric   // Adaptable scheduling
401*0b57cec5SDimitry Andric   // A small, but very parallel
402*0b57cec5SDimitry Andric   // region, where reg pressure is an issue.
403*0b57cec5SDimitry Andric   if (HorizontalVerticalBalance > RegPressureThreshold) {
404*0b57cec5SDimitry Andric     // Critical path first
405*0b57cec5SDimitry Andric     ResCount += (SU->getHeight() * ScaleTwo);
406*0b57cec5SDimitry Andric     // If resources are available for it, multiply the
407*0b57cec5SDimitry Andric     // chance of scheduling.
408*0b57cec5SDimitry Andric     if (isResourceAvailable(SU))
409*0b57cec5SDimitry Andric       ResCount <<= FactorOne;
410*0b57cec5SDimitry Andric 
411*0b57cec5SDimitry Andric     // Consider change to reg pressure from scheduling
412*0b57cec5SDimitry Andric     // this SU.
413*0b57cec5SDimitry Andric     ResCount -= (regPressureDelta(SU,true) * ScaleOne);
414*0b57cec5SDimitry Andric   }
415*0b57cec5SDimitry Andric   // Default heuristic, greeady and
416*0b57cec5SDimitry Andric   // critical path driven.
417*0b57cec5SDimitry Andric   else {
418*0b57cec5SDimitry Andric     // Critical path first.
419*0b57cec5SDimitry Andric     ResCount += (SU->getHeight() * ScaleTwo);
420*0b57cec5SDimitry Andric     // Now see how many instructions is blocked by this SU.
421*0b57cec5SDimitry Andric     ResCount += (NumNodesSolelyBlocking[SU->NodeNum] * ScaleTwo);
422*0b57cec5SDimitry Andric     // If resources are available for it, multiply the
423*0b57cec5SDimitry Andric     // chance of scheduling.
424*0b57cec5SDimitry Andric     if (isResourceAvailable(SU))
425*0b57cec5SDimitry Andric       ResCount <<= FactorOne;
426*0b57cec5SDimitry Andric 
427*0b57cec5SDimitry Andric     ResCount -= (regPressureDelta(SU) * ScaleTwo);
428*0b57cec5SDimitry Andric   }
429*0b57cec5SDimitry Andric 
430*0b57cec5SDimitry Andric   // These are platform-specific things.
431*0b57cec5SDimitry Andric   // Will need to go into the back end
432*0b57cec5SDimitry Andric   // and accessed from here via a hook.
433*0b57cec5SDimitry Andric   for (SDNode *N = SU->getNode(); N; N = N->getGluedNode()) {
434*0b57cec5SDimitry Andric     if (N->isMachineOpcode()) {
435*0b57cec5SDimitry Andric       const MCInstrDesc &TID = TII->get(N->getMachineOpcode());
436*0b57cec5SDimitry Andric       if (TID.isCall())
437*0b57cec5SDimitry Andric         ResCount += (PriorityTwo + (ScaleThree*N->getNumValues()));
438*0b57cec5SDimitry Andric     }
439*0b57cec5SDimitry Andric     else
440*0b57cec5SDimitry Andric       switch (N->getOpcode()) {
441*0b57cec5SDimitry Andric       default:  break;
442*0b57cec5SDimitry Andric       case ISD::TokenFactor:
443*0b57cec5SDimitry Andric       case ISD::CopyFromReg:
444*0b57cec5SDimitry Andric       case ISD::CopyToReg:
445*0b57cec5SDimitry Andric         ResCount += PriorityFour;
446*0b57cec5SDimitry Andric         break;
447*0b57cec5SDimitry Andric 
448*0b57cec5SDimitry Andric       case ISD::INLINEASM:
449*0b57cec5SDimitry Andric       case ISD::INLINEASM_BR:
450*0b57cec5SDimitry Andric         ResCount += PriorityThree;
451*0b57cec5SDimitry Andric         break;
452*0b57cec5SDimitry Andric       }
453*0b57cec5SDimitry Andric   }
454*0b57cec5SDimitry Andric   return ResCount;
455*0b57cec5SDimitry Andric }
456*0b57cec5SDimitry Andric 
457*0b57cec5SDimitry Andric 
458*0b57cec5SDimitry Andric /// Main resource tracking point.
scheduledNode(SUnit * SU)459*0b57cec5SDimitry Andric void ResourcePriorityQueue::scheduledNode(SUnit *SU) {
460*0b57cec5SDimitry Andric   // Use NULL entry as an event marker to reset
461*0b57cec5SDimitry Andric   // the DFA state.
462*0b57cec5SDimitry Andric   if (!SU) {
463*0b57cec5SDimitry Andric     ResourcesModel->clearResources();
464*0b57cec5SDimitry Andric     Packet.clear();
465*0b57cec5SDimitry Andric     return;
466*0b57cec5SDimitry Andric   }
467*0b57cec5SDimitry Andric 
468*0b57cec5SDimitry Andric   const SDNode *ScegN = SU->getNode();
469*0b57cec5SDimitry Andric   // Update reg pressure tracking.
470*0b57cec5SDimitry Andric   // First update current node.
471*0b57cec5SDimitry Andric   if (ScegN->isMachineOpcode()) {
472*0b57cec5SDimitry Andric     // Estimate generated regs.
473*0b57cec5SDimitry Andric     for (unsigned i = 0, e = ScegN->getNumValues(); i != e; ++i) {
474*0b57cec5SDimitry Andric       MVT VT = ScegN->getSimpleValueType(i);
475*0b57cec5SDimitry Andric 
476*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT)) {
477*0b57cec5SDimitry Andric         const TargetRegisterClass *RC = TLI->getRegClassFor(VT);
478*0b57cec5SDimitry Andric         if (RC)
479*0b57cec5SDimitry Andric           RegPressure[RC->getID()] += numberRCValSuccInSU(SU, RC->getID());
480*0b57cec5SDimitry Andric       }
481*0b57cec5SDimitry Andric     }
482*0b57cec5SDimitry Andric     // Estimate killed regs.
483*0b57cec5SDimitry Andric     for (unsigned i = 0, e = ScegN->getNumOperands(); i != e; ++i) {
484*0b57cec5SDimitry Andric       const SDValue &Op = ScegN->getOperand(i);
485*0b57cec5SDimitry Andric       MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
486*0b57cec5SDimitry Andric 
487*0b57cec5SDimitry Andric       if (TLI->isTypeLegal(VT)) {
488*0b57cec5SDimitry Andric         const TargetRegisterClass *RC = TLI->getRegClassFor(VT);
489*0b57cec5SDimitry Andric         if (RC) {
490*0b57cec5SDimitry Andric           if (RegPressure[RC->getID()] >
491*0b57cec5SDimitry Andric             (numberRCValPredInSU(SU, RC->getID())))
492*0b57cec5SDimitry Andric             RegPressure[RC->getID()] -= numberRCValPredInSU(SU, RC->getID());
493*0b57cec5SDimitry Andric           else RegPressure[RC->getID()] = 0;
494*0b57cec5SDimitry Andric         }
495*0b57cec5SDimitry Andric       }
496*0b57cec5SDimitry Andric     }
497*0b57cec5SDimitry Andric     for (SDep &Pred : SU->Preds) {
498*0b57cec5SDimitry Andric       if (Pred.isCtrl() || (Pred.getSUnit()->NumRegDefsLeft == 0))
499*0b57cec5SDimitry Andric         continue;
500*0b57cec5SDimitry Andric       --Pred.getSUnit()->NumRegDefsLeft;
501*0b57cec5SDimitry Andric     }
502*0b57cec5SDimitry Andric   }
503*0b57cec5SDimitry Andric 
504*0b57cec5SDimitry Andric   // Reserve resources for this SU.
505*0b57cec5SDimitry Andric   reserveResources(SU);
506*0b57cec5SDimitry Andric 
507*0b57cec5SDimitry Andric   // Adjust number of parallel live ranges.
508*0b57cec5SDimitry Andric   // Heuristic is simple - node with no data successors reduces
509*0b57cec5SDimitry Andric   // number of live ranges. All others, increase it.
510*0b57cec5SDimitry Andric   unsigned NumberNonControlDeps = 0;
511*0b57cec5SDimitry Andric 
512*0b57cec5SDimitry Andric   for (const SDep &Succ : SU->Succs) {
513*0b57cec5SDimitry Andric     adjustPriorityOfUnscheduledPreds(Succ.getSUnit());
514*0b57cec5SDimitry Andric     if (!Succ.isCtrl())
515*0b57cec5SDimitry Andric       NumberNonControlDeps++;
516*0b57cec5SDimitry Andric   }
517*0b57cec5SDimitry Andric 
518*0b57cec5SDimitry Andric   if (!NumberNonControlDeps) {
519*0b57cec5SDimitry Andric     if (ParallelLiveRanges >= SU->NumPreds)
520*0b57cec5SDimitry Andric       ParallelLiveRanges -= SU->NumPreds;
521*0b57cec5SDimitry Andric     else
522*0b57cec5SDimitry Andric       ParallelLiveRanges = 0;
523*0b57cec5SDimitry Andric 
524*0b57cec5SDimitry Andric   }
525*0b57cec5SDimitry Andric   else
526*0b57cec5SDimitry Andric     ParallelLiveRanges += SU->NumRegDefsLeft;
527*0b57cec5SDimitry Andric 
528*0b57cec5SDimitry Andric   // Track parallel live chains.
529*0b57cec5SDimitry Andric   HorizontalVerticalBalance += (SU->Succs.size() - numberCtrlDepsInSU(SU));
530*0b57cec5SDimitry Andric   HorizontalVerticalBalance -= (SU->Preds.size() - numberCtrlPredInSU(SU));
531*0b57cec5SDimitry Andric }
532*0b57cec5SDimitry Andric 
initNumRegDefsLeft(SUnit * SU)533*0b57cec5SDimitry Andric void ResourcePriorityQueue::initNumRegDefsLeft(SUnit *SU) {
534*0b57cec5SDimitry Andric   unsigned  NodeNumDefs = 0;
535*0b57cec5SDimitry Andric   for (SDNode *N = SU->getNode(); N; N = N->getGluedNode())
536*0b57cec5SDimitry Andric     if (N->isMachineOpcode()) {
537*0b57cec5SDimitry Andric       const MCInstrDesc &TID = TII->get(N->getMachineOpcode());
538*0b57cec5SDimitry Andric       // No register need be allocated for this.
539*0b57cec5SDimitry Andric       if (N->getMachineOpcode() == TargetOpcode::IMPLICIT_DEF) {
540*0b57cec5SDimitry Andric         NodeNumDefs = 0;
541*0b57cec5SDimitry Andric         break;
542*0b57cec5SDimitry Andric       }
543*0b57cec5SDimitry Andric       NodeNumDefs = std::min(N->getNumValues(), TID.getNumDefs());
544*0b57cec5SDimitry Andric     }
545*0b57cec5SDimitry Andric     else
546*0b57cec5SDimitry Andric       switch(N->getOpcode()) {
547*0b57cec5SDimitry Andric         default:     break;
548*0b57cec5SDimitry Andric         case ISD::CopyFromReg:
549*0b57cec5SDimitry Andric           NodeNumDefs++;
550*0b57cec5SDimitry Andric           break;
551*0b57cec5SDimitry Andric         case ISD::INLINEASM:
552*0b57cec5SDimitry Andric         case ISD::INLINEASM_BR:
553*0b57cec5SDimitry Andric           NodeNumDefs++;
554*0b57cec5SDimitry Andric           break;
555*0b57cec5SDimitry Andric       }
556*0b57cec5SDimitry Andric 
557*0b57cec5SDimitry Andric   SU->NumRegDefsLeft = NodeNumDefs;
558*0b57cec5SDimitry Andric }
559*0b57cec5SDimitry Andric 
560*0b57cec5SDimitry Andric /// adjustPriorityOfUnscheduledPreds - One of the predecessors of SU was just
561*0b57cec5SDimitry Andric /// scheduled.  If SU is not itself available, then there is at least one
562*0b57cec5SDimitry Andric /// predecessor node that has not been scheduled yet.  If SU has exactly ONE
563*0b57cec5SDimitry Andric /// unscheduled predecessor, we want to increase its priority: it getting
564*0b57cec5SDimitry Andric /// scheduled will make this node available, so it is better than some other
565*0b57cec5SDimitry Andric /// node of the same priority that will not make a node available.
adjustPriorityOfUnscheduledPreds(SUnit * SU)566*0b57cec5SDimitry Andric void ResourcePriorityQueue::adjustPriorityOfUnscheduledPreds(SUnit *SU) {
567*0b57cec5SDimitry Andric   if (SU->isAvailable) return;  // All preds scheduled.
568*0b57cec5SDimitry Andric 
569*0b57cec5SDimitry Andric   SUnit *OnlyAvailablePred = getSingleUnscheduledPred(SU);
570*0b57cec5SDimitry Andric   if (!OnlyAvailablePred || !OnlyAvailablePred->isAvailable)
571*0b57cec5SDimitry Andric     return;
572*0b57cec5SDimitry Andric 
573*0b57cec5SDimitry Andric   // Okay, we found a single predecessor that is available, but not scheduled.
574*0b57cec5SDimitry Andric   // Since it is available, it must be in the priority queue.  First remove it.
575*0b57cec5SDimitry Andric   remove(OnlyAvailablePred);
576*0b57cec5SDimitry Andric 
577*0b57cec5SDimitry Andric   // Reinsert the node into the priority queue, which recomputes its
578*0b57cec5SDimitry Andric   // NumNodesSolelyBlocking value.
579*0b57cec5SDimitry Andric   push(OnlyAvailablePred);
580*0b57cec5SDimitry Andric }
581*0b57cec5SDimitry Andric 
582*0b57cec5SDimitry Andric 
583*0b57cec5SDimitry Andric /// Main access point - returns next instructions
584*0b57cec5SDimitry Andric /// to be placed in scheduling sequence.
pop()585*0b57cec5SDimitry Andric SUnit *ResourcePriorityQueue::pop() {
586*0b57cec5SDimitry Andric   if (empty())
587*0b57cec5SDimitry Andric     return nullptr;
588*0b57cec5SDimitry Andric 
589*0b57cec5SDimitry Andric   std::vector<SUnit *>::iterator Best = Queue.begin();
590*0b57cec5SDimitry Andric   if (!DisableDFASched) {
591*0b57cec5SDimitry Andric     int BestCost = SUSchedulingCost(*Best);
592*0b57cec5SDimitry Andric     for (auto I = std::next(Queue.begin()), E = Queue.end(); I != E; ++I) {
593*0b57cec5SDimitry Andric 
594*0b57cec5SDimitry Andric       if (SUSchedulingCost(*I) > BestCost) {
595*0b57cec5SDimitry Andric         BestCost = SUSchedulingCost(*I);
596*0b57cec5SDimitry Andric         Best = I;
597*0b57cec5SDimitry Andric       }
598*0b57cec5SDimitry Andric     }
599*0b57cec5SDimitry Andric   }
600*0b57cec5SDimitry Andric   // Use default TD scheduling mechanism.
601*0b57cec5SDimitry Andric   else {
602*0b57cec5SDimitry Andric     for (auto I = std::next(Queue.begin()), E = Queue.end(); I != E; ++I)
603*0b57cec5SDimitry Andric       if (Picker(*Best, *I))
604*0b57cec5SDimitry Andric         Best = I;
605*0b57cec5SDimitry Andric   }
606*0b57cec5SDimitry Andric 
607*0b57cec5SDimitry Andric   SUnit *V = *Best;
608*0b57cec5SDimitry Andric   if (Best != std::prev(Queue.end()))
609*0b57cec5SDimitry Andric     std::swap(*Best, Queue.back());
610*0b57cec5SDimitry Andric 
611*0b57cec5SDimitry Andric   Queue.pop_back();
612*0b57cec5SDimitry Andric 
613*0b57cec5SDimitry Andric   return V;
614*0b57cec5SDimitry Andric }
615*0b57cec5SDimitry Andric 
616*0b57cec5SDimitry Andric 
remove(SUnit * SU)617*0b57cec5SDimitry Andric void ResourcePriorityQueue::remove(SUnit *SU) {
618*0b57cec5SDimitry Andric   assert(!Queue.empty() && "Queue is empty!");
619*0b57cec5SDimitry Andric   std::vector<SUnit *>::iterator I = find(Queue, SU);
620*0b57cec5SDimitry Andric   if (I != std::prev(Queue.end()))
621*0b57cec5SDimitry Andric     std::swap(*I, Queue.back());
622*0b57cec5SDimitry Andric 
623*0b57cec5SDimitry Andric   Queue.pop_back();
624*0b57cec5SDimitry Andric }
625*0b57cec5SDimitry Andric