1*0b57cec5SDimitry Andric //===- ResourcePriorityQueue.cpp - A DFA-oriented priority queue -*- C++ -*-==//
2*0b57cec5SDimitry Andric //
3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*0b57cec5SDimitry Andric //
7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
8*0b57cec5SDimitry Andric //
9*0b57cec5SDimitry Andric // This file implements the ResourcePriorityQueue class, which is a
10*0b57cec5SDimitry Andric // SchedulingPriorityQueue that prioritizes instructions using DFA state to
11*0b57cec5SDimitry Andric // reduce the length of the critical path through the basic block
12*0b57cec5SDimitry Andric // on VLIW platforms.
13*0b57cec5SDimitry Andric // The scheduler is basically a top-down adaptable list scheduler with DFA
14*0b57cec5SDimitry Andric // resource tracking added to the cost function.
15*0b57cec5SDimitry Andric // DFA is queried as a state machine to model "packets/bundles" during
16*0b57cec5SDimitry Andric // schedule. Currently packets/bundles are discarded at the end of
17*0b57cec5SDimitry Andric // scheduling, affecting only order of instructions.
18*0b57cec5SDimitry Andric //
19*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
20*0b57cec5SDimitry Andric
21*0b57cec5SDimitry Andric #include "llvm/CodeGen/ResourcePriorityQueue.h"
22*0b57cec5SDimitry Andric #include "llvm/CodeGen/DFAPacketizer.h"
23*0b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGISel.h"
24*0b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGNodes.h"
25*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetInstrInfo.h"
26*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetLowering.h"
27*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetRegisterInfo.h"
28*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetSubtargetInfo.h"
29*0b57cec5SDimitry Andric #include "llvm/Support/CommandLine.h"
30*0b57cec5SDimitry Andric
31*0b57cec5SDimitry Andric using namespace llvm;
32*0b57cec5SDimitry Andric
33*0b57cec5SDimitry Andric #define DEBUG_TYPE "scheduler"
34*0b57cec5SDimitry Andric
35*0b57cec5SDimitry Andric static cl::opt<bool>
36*0b57cec5SDimitry Andric DisableDFASched("disable-dfa-sched", cl::Hidden,
37*0b57cec5SDimitry Andric cl::desc("Disable use of DFA during scheduling"));
38*0b57cec5SDimitry Andric
39*0b57cec5SDimitry Andric static cl::opt<int> RegPressureThreshold(
40*0b57cec5SDimitry Andric "dfa-sched-reg-pressure-threshold", cl::Hidden, cl::init(5),
41*0b57cec5SDimitry Andric cl::desc("Track reg pressure and switch priority to in-depth"));
42*0b57cec5SDimitry Andric
ResourcePriorityQueue(SelectionDAGISel * IS)43*0b57cec5SDimitry Andric ResourcePriorityQueue::ResourcePriorityQueue(SelectionDAGISel *IS)
44*0b57cec5SDimitry Andric : Picker(this), InstrItins(IS->MF->getSubtarget().getInstrItineraryData()) {
45*0b57cec5SDimitry Andric const TargetSubtargetInfo &STI = IS->MF->getSubtarget();
46*0b57cec5SDimitry Andric TRI = STI.getRegisterInfo();
47*0b57cec5SDimitry Andric TLI = IS->TLI;
48*0b57cec5SDimitry Andric TII = STI.getInstrInfo();
49*0b57cec5SDimitry Andric ResourcesModel.reset(TII->CreateTargetScheduleState(STI));
50*0b57cec5SDimitry Andric // This hard requirement could be relaxed, but for now
51*0b57cec5SDimitry Andric // do not let it proceed.
52*0b57cec5SDimitry Andric assert(ResourcesModel && "Unimplemented CreateTargetScheduleState.");
53*0b57cec5SDimitry Andric
54*0b57cec5SDimitry Andric unsigned NumRC = TRI->getNumRegClasses();
55*0b57cec5SDimitry Andric RegLimit.resize(NumRC);
56*0b57cec5SDimitry Andric RegPressure.resize(NumRC);
57*0b57cec5SDimitry Andric std::fill(RegLimit.begin(), RegLimit.end(), 0);
58*0b57cec5SDimitry Andric std::fill(RegPressure.begin(), RegPressure.end(), 0);
59*0b57cec5SDimitry Andric for (const TargetRegisterClass *RC : TRI->regclasses())
60*0b57cec5SDimitry Andric RegLimit[RC->getID()] = TRI->getRegPressureLimit(RC, *IS->MF);
61*0b57cec5SDimitry Andric
62*0b57cec5SDimitry Andric ParallelLiveRanges = 0;
63*0b57cec5SDimitry Andric HorizontalVerticalBalance = 0;
64*0b57cec5SDimitry Andric }
65*0b57cec5SDimitry Andric
66*0b57cec5SDimitry Andric unsigned
numberRCValPredInSU(SUnit * SU,unsigned RCId)67*0b57cec5SDimitry Andric ResourcePriorityQueue::numberRCValPredInSU(SUnit *SU, unsigned RCId) {
68*0b57cec5SDimitry Andric unsigned NumberDeps = 0;
69*0b57cec5SDimitry Andric for (SDep &Pred : SU->Preds) {
70*0b57cec5SDimitry Andric if (Pred.isCtrl())
71*0b57cec5SDimitry Andric continue;
72*0b57cec5SDimitry Andric
73*0b57cec5SDimitry Andric SUnit *PredSU = Pred.getSUnit();
74*0b57cec5SDimitry Andric const SDNode *ScegN = PredSU->getNode();
75*0b57cec5SDimitry Andric
76*0b57cec5SDimitry Andric if (!ScegN)
77*0b57cec5SDimitry Andric continue;
78*0b57cec5SDimitry Andric
79*0b57cec5SDimitry Andric // If value is passed to CopyToReg, it is probably
80*0b57cec5SDimitry Andric // live outside BB.
81*0b57cec5SDimitry Andric switch (ScegN->getOpcode()) {
82*0b57cec5SDimitry Andric default: break;
83*0b57cec5SDimitry Andric case ISD::TokenFactor: break;
84*0b57cec5SDimitry Andric case ISD::CopyFromReg: NumberDeps++; break;
85*0b57cec5SDimitry Andric case ISD::CopyToReg: break;
86*0b57cec5SDimitry Andric case ISD::INLINEASM: break;
87*0b57cec5SDimitry Andric case ISD::INLINEASM_BR: break;
88*0b57cec5SDimitry Andric }
89*0b57cec5SDimitry Andric if (!ScegN->isMachineOpcode())
90*0b57cec5SDimitry Andric continue;
91*0b57cec5SDimitry Andric
92*0b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumValues(); i != e; ++i) {
93*0b57cec5SDimitry Andric MVT VT = ScegN->getSimpleValueType(i);
94*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)
95*0b57cec5SDimitry Andric && (TLI->getRegClassFor(VT)->getID() == RCId)) {
96*0b57cec5SDimitry Andric NumberDeps++;
97*0b57cec5SDimitry Andric break;
98*0b57cec5SDimitry Andric }
99*0b57cec5SDimitry Andric }
100*0b57cec5SDimitry Andric }
101*0b57cec5SDimitry Andric return NumberDeps;
102*0b57cec5SDimitry Andric }
103*0b57cec5SDimitry Andric
numberRCValSuccInSU(SUnit * SU,unsigned RCId)104*0b57cec5SDimitry Andric unsigned ResourcePriorityQueue::numberRCValSuccInSU(SUnit *SU,
105*0b57cec5SDimitry Andric unsigned RCId) {
106*0b57cec5SDimitry Andric unsigned NumberDeps = 0;
107*0b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs) {
108*0b57cec5SDimitry Andric if (Succ.isCtrl())
109*0b57cec5SDimitry Andric continue;
110*0b57cec5SDimitry Andric
111*0b57cec5SDimitry Andric SUnit *SuccSU = Succ.getSUnit();
112*0b57cec5SDimitry Andric const SDNode *ScegN = SuccSU->getNode();
113*0b57cec5SDimitry Andric if (!ScegN)
114*0b57cec5SDimitry Andric continue;
115*0b57cec5SDimitry Andric
116*0b57cec5SDimitry Andric // If value is passed to CopyToReg, it is probably
117*0b57cec5SDimitry Andric // live outside BB.
118*0b57cec5SDimitry Andric switch (ScegN->getOpcode()) {
119*0b57cec5SDimitry Andric default: break;
120*0b57cec5SDimitry Andric case ISD::TokenFactor: break;
121*0b57cec5SDimitry Andric case ISD::CopyFromReg: break;
122*0b57cec5SDimitry Andric case ISD::CopyToReg: NumberDeps++; break;
123*0b57cec5SDimitry Andric case ISD::INLINEASM: break;
124*0b57cec5SDimitry Andric case ISD::INLINEASM_BR: break;
125*0b57cec5SDimitry Andric }
126*0b57cec5SDimitry Andric if (!ScegN->isMachineOpcode())
127*0b57cec5SDimitry Andric continue;
128*0b57cec5SDimitry Andric
129*0b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumOperands(); i != e; ++i) {
130*0b57cec5SDimitry Andric const SDValue &Op = ScegN->getOperand(i);
131*0b57cec5SDimitry Andric MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
132*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)
133*0b57cec5SDimitry Andric && (TLI->getRegClassFor(VT)->getID() == RCId)) {
134*0b57cec5SDimitry Andric NumberDeps++;
135*0b57cec5SDimitry Andric break;
136*0b57cec5SDimitry Andric }
137*0b57cec5SDimitry Andric }
138*0b57cec5SDimitry Andric }
139*0b57cec5SDimitry Andric return NumberDeps;
140*0b57cec5SDimitry Andric }
141*0b57cec5SDimitry Andric
numberCtrlDepsInSU(SUnit * SU)142*0b57cec5SDimitry Andric static unsigned numberCtrlDepsInSU(SUnit *SU) {
143*0b57cec5SDimitry Andric unsigned NumberDeps = 0;
144*0b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs)
145*0b57cec5SDimitry Andric if (Succ.isCtrl())
146*0b57cec5SDimitry Andric NumberDeps++;
147*0b57cec5SDimitry Andric
148*0b57cec5SDimitry Andric return NumberDeps;
149*0b57cec5SDimitry Andric }
150*0b57cec5SDimitry Andric
numberCtrlPredInSU(SUnit * SU)151*0b57cec5SDimitry Andric static unsigned numberCtrlPredInSU(SUnit *SU) {
152*0b57cec5SDimitry Andric unsigned NumberDeps = 0;
153*0b57cec5SDimitry Andric for (SDep &Pred : SU->Preds)
154*0b57cec5SDimitry Andric if (Pred.isCtrl())
155*0b57cec5SDimitry Andric NumberDeps++;
156*0b57cec5SDimitry Andric
157*0b57cec5SDimitry Andric return NumberDeps;
158*0b57cec5SDimitry Andric }
159*0b57cec5SDimitry Andric
160*0b57cec5SDimitry Andric ///
161*0b57cec5SDimitry Andric /// Initialize nodes.
162*0b57cec5SDimitry Andric ///
initNodes(std::vector<SUnit> & sunits)163*0b57cec5SDimitry Andric void ResourcePriorityQueue::initNodes(std::vector<SUnit> &sunits) {
164*0b57cec5SDimitry Andric SUnits = &sunits;
165*0b57cec5SDimitry Andric NumNodesSolelyBlocking.resize(SUnits->size(), 0);
166*0b57cec5SDimitry Andric
167*0b57cec5SDimitry Andric for (SUnit &SU : *SUnits) {
168*0b57cec5SDimitry Andric initNumRegDefsLeft(&SU);
169*0b57cec5SDimitry Andric SU.NodeQueueId = 0;
170*0b57cec5SDimitry Andric }
171*0b57cec5SDimitry Andric }
172*0b57cec5SDimitry Andric
173*0b57cec5SDimitry Andric /// This heuristic is used if DFA scheduling is not desired
174*0b57cec5SDimitry Andric /// for some VLIW platform.
operator ()(const SUnit * LHS,const SUnit * RHS) const175*0b57cec5SDimitry Andric bool resource_sort::operator()(const SUnit *LHS, const SUnit *RHS) const {
176*0b57cec5SDimitry Andric // The isScheduleHigh flag allows nodes with wraparound dependencies that
177*0b57cec5SDimitry Andric // cannot easily be modeled as edges with latencies to be scheduled as
178*0b57cec5SDimitry Andric // soon as possible in a top-down schedule.
179*0b57cec5SDimitry Andric if (LHS->isScheduleHigh && !RHS->isScheduleHigh)
180*0b57cec5SDimitry Andric return false;
181*0b57cec5SDimitry Andric
182*0b57cec5SDimitry Andric if (!LHS->isScheduleHigh && RHS->isScheduleHigh)
183*0b57cec5SDimitry Andric return true;
184*0b57cec5SDimitry Andric
185*0b57cec5SDimitry Andric unsigned LHSNum = LHS->NodeNum;
186*0b57cec5SDimitry Andric unsigned RHSNum = RHS->NodeNum;
187*0b57cec5SDimitry Andric
188*0b57cec5SDimitry Andric // The most important heuristic is scheduling the critical path.
189*0b57cec5SDimitry Andric unsigned LHSLatency = PQ->getLatency(LHSNum);
190*0b57cec5SDimitry Andric unsigned RHSLatency = PQ->getLatency(RHSNum);
191*0b57cec5SDimitry Andric if (LHSLatency < RHSLatency) return true;
192*0b57cec5SDimitry Andric if (LHSLatency > RHSLatency) return false;
193*0b57cec5SDimitry Andric
194*0b57cec5SDimitry Andric // After that, if two nodes have identical latencies, look to see if one will
195*0b57cec5SDimitry Andric // unblock more other nodes than the other.
196*0b57cec5SDimitry Andric unsigned LHSBlocked = PQ->getNumSolelyBlockNodes(LHSNum);
197*0b57cec5SDimitry Andric unsigned RHSBlocked = PQ->getNumSolelyBlockNodes(RHSNum);
198*0b57cec5SDimitry Andric if (LHSBlocked < RHSBlocked) return true;
199*0b57cec5SDimitry Andric if (LHSBlocked > RHSBlocked) return false;
200*0b57cec5SDimitry Andric
201*0b57cec5SDimitry Andric // Finally, just to provide a stable ordering, use the node number as a
202*0b57cec5SDimitry Andric // deciding factor.
203*0b57cec5SDimitry Andric return LHSNum < RHSNum;
204*0b57cec5SDimitry Andric }
205*0b57cec5SDimitry Andric
206*0b57cec5SDimitry Andric
207*0b57cec5SDimitry Andric /// getSingleUnscheduledPred - If there is exactly one unscheduled predecessor
208*0b57cec5SDimitry Andric /// of SU, return it, otherwise return null.
getSingleUnscheduledPred(SUnit * SU)209*0b57cec5SDimitry Andric SUnit *ResourcePriorityQueue::getSingleUnscheduledPred(SUnit *SU) {
210*0b57cec5SDimitry Andric SUnit *OnlyAvailablePred = nullptr;
211*0b57cec5SDimitry Andric for (const SDep &Pred : SU->Preds) {
212*0b57cec5SDimitry Andric SUnit &PredSU = *Pred.getSUnit();
213*0b57cec5SDimitry Andric if (!PredSU.isScheduled) {
214*0b57cec5SDimitry Andric // We found an available, but not scheduled, predecessor. If it's the
215*0b57cec5SDimitry Andric // only one we have found, keep track of it... otherwise give up.
216*0b57cec5SDimitry Andric if (OnlyAvailablePred && OnlyAvailablePred != &PredSU)
217*0b57cec5SDimitry Andric return nullptr;
218*0b57cec5SDimitry Andric OnlyAvailablePred = &PredSU;
219*0b57cec5SDimitry Andric }
220*0b57cec5SDimitry Andric }
221*0b57cec5SDimitry Andric return OnlyAvailablePred;
222*0b57cec5SDimitry Andric }
223*0b57cec5SDimitry Andric
push(SUnit * SU)224*0b57cec5SDimitry Andric void ResourcePriorityQueue::push(SUnit *SU) {
225*0b57cec5SDimitry Andric // Look at all of the successors of this node. Count the number of nodes that
226*0b57cec5SDimitry Andric // this node is the sole unscheduled node for.
227*0b57cec5SDimitry Andric unsigned NumNodesBlocking = 0;
228*0b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs)
229*0b57cec5SDimitry Andric if (getSingleUnscheduledPred(Succ.getSUnit()) == SU)
230*0b57cec5SDimitry Andric ++NumNodesBlocking;
231*0b57cec5SDimitry Andric
232*0b57cec5SDimitry Andric NumNodesSolelyBlocking[SU->NodeNum] = NumNodesBlocking;
233*0b57cec5SDimitry Andric Queue.push_back(SU);
234*0b57cec5SDimitry Andric }
235*0b57cec5SDimitry Andric
236*0b57cec5SDimitry Andric /// Check if scheduling of this SU is possible
237*0b57cec5SDimitry Andric /// in the current packet.
isResourceAvailable(SUnit * SU)238*0b57cec5SDimitry Andric bool ResourcePriorityQueue::isResourceAvailable(SUnit *SU) {
239*0b57cec5SDimitry Andric if (!SU || !SU->getNode())
240*0b57cec5SDimitry Andric return false;
241*0b57cec5SDimitry Andric
242*0b57cec5SDimitry Andric // If this is a compound instruction,
243*0b57cec5SDimitry Andric // it is likely to be a call. Do not delay it.
244*0b57cec5SDimitry Andric if (SU->getNode()->getGluedNode())
245*0b57cec5SDimitry Andric return true;
246*0b57cec5SDimitry Andric
247*0b57cec5SDimitry Andric // First see if the pipeline could receive this instruction
248*0b57cec5SDimitry Andric // in the current cycle.
249*0b57cec5SDimitry Andric if (SU->getNode()->isMachineOpcode())
250*0b57cec5SDimitry Andric switch (SU->getNode()->getMachineOpcode()) {
251*0b57cec5SDimitry Andric default:
252*0b57cec5SDimitry Andric if (!ResourcesModel->canReserveResources(&TII->get(
253*0b57cec5SDimitry Andric SU->getNode()->getMachineOpcode())))
254*0b57cec5SDimitry Andric return false;
255*0b57cec5SDimitry Andric break;
256*0b57cec5SDimitry Andric case TargetOpcode::EXTRACT_SUBREG:
257*0b57cec5SDimitry Andric case TargetOpcode::INSERT_SUBREG:
258*0b57cec5SDimitry Andric case TargetOpcode::SUBREG_TO_REG:
259*0b57cec5SDimitry Andric case TargetOpcode::REG_SEQUENCE:
260*0b57cec5SDimitry Andric case TargetOpcode::IMPLICIT_DEF:
261*0b57cec5SDimitry Andric break;
262*0b57cec5SDimitry Andric }
263*0b57cec5SDimitry Andric
264*0b57cec5SDimitry Andric // Now see if there are no other dependencies
265*0b57cec5SDimitry Andric // to instructions already in the packet.
266*0b57cec5SDimitry Andric for (const SUnit *S : Packet)
267*0b57cec5SDimitry Andric for (const SDep &Succ : S->Succs) {
268*0b57cec5SDimitry Andric // Since we do not add pseudos to packets, might as well
269*0b57cec5SDimitry Andric // ignore order deps.
270*0b57cec5SDimitry Andric if (Succ.isCtrl())
271*0b57cec5SDimitry Andric continue;
272*0b57cec5SDimitry Andric
273*0b57cec5SDimitry Andric if (Succ.getSUnit() == SU)
274*0b57cec5SDimitry Andric return false;
275*0b57cec5SDimitry Andric }
276*0b57cec5SDimitry Andric
277*0b57cec5SDimitry Andric return true;
278*0b57cec5SDimitry Andric }
279*0b57cec5SDimitry Andric
280*0b57cec5SDimitry Andric /// Keep track of available resources.
reserveResources(SUnit * SU)281*0b57cec5SDimitry Andric void ResourcePriorityQueue::reserveResources(SUnit *SU) {
282*0b57cec5SDimitry Andric // If this SU does not fit in the packet
283*0b57cec5SDimitry Andric // start a new one.
284*0b57cec5SDimitry Andric if (!isResourceAvailable(SU) || SU->getNode()->getGluedNode()) {
285*0b57cec5SDimitry Andric ResourcesModel->clearResources();
286*0b57cec5SDimitry Andric Packet.clear();
287*0b57cec5SDimitry Andric }
288*0b57cec5SDimitry Andric
289*0b57cec5SDimitry Andric if (SU->getNode() && SU->getNode()->isMachineOpcode()) {
290*0b57cec5SDimitry Andric switch (SU->getNode()->getMachineOpcode()) {
291*0b57cec5SDimitry Andric default:
292*0b57cec5SDimitry Andric ResourcesModel->reserveResources(&TII->get(
293*0b57cec5SDimitry Andric SU->getNode()->getMachineOpcode()));
294*0b57cec5SDimitry Andric break;
295*0b57cec5SDimitry Andric case TargetOpcode::EXTRACT_SUBREG:
296*0b57cec5SDimitry Andric case TargetOpcode::INSERT_SUBREG:
297*0b57cec5SDimitry Andric case TargetOpcode::SUBREG_TO_REG:
298*0b57cec5SDimitry Andric case TargetOpcode::REG_SEQUENCE:
299*0b57cec5SDimitry Andric case TargetOpcode::IMPLICIT_DEF:
300*0b57cec5SDimitry Andric break;
301*0b57cec5SDimitry Andric }
302*0b57cec5SDimitry Andric Packet.push_back(SU);
303*0b57cec5SDimitry Andric }
304*0b57cec5SDimitry Andric // Forcefully end packet for PseudoOps.
305*0b57cec5SDimitry Andric else {
306*0b57cec5SDimitry Andric ResourcesModel->clearResources();
307*0b57cec5SDimitry Andric Packet.clear();
308*0b57cec5SDimitry Andric }
309*0b57cec5SDimitry Andric
310*0b57cec5SDimitry Andric // If packet is now full, reset the state so in the next cycle
311*0b57cec5SDimitry Andric // we start fresh.
312*0b57cec5SDimitry Andric if (Packet.size() >= InstrItins->SchedModel.IssueWidth) {
313*0b57cec5SDimitry Andric ResourcesModel->clearResources();
314*0b57cec5SDimitry Andric Packet.clear();
315*0b57cec5SDimitry Andric }
316*0b57cec5SDimitry Andric }
317*0b57cec5SDimitry Andric
rawRegPressureDelta(SUnit * SU,unsigned RCId)318*0b57cec5SDimitry Andric int ResourcePriorityQueue::rawRegPressureDelta(SUnit *SU, unsigned RCId) {
319*0b57cec5SDimitry Andric int RegBalance = 0;
320*0b57cec5SDimitry Andric
321*0b57cec5SDimitry Andric if (!SU || !SU->getNode() || !SU->getNode()->isMachineOpcode())
322*0b57cec5SDimitry Andric return RegBalance;
323*0b57cec5SDimitry Andric
324*0b57cec5SDimitry Andric // Gen estimate.
325*0b57cec5SDimitry Andric for (unsigned i = 0, e = SU->getNode()->getNumValues(); i != e; ++i) {
326*0b57cec5SDimitry Andric MVT VT = SU->getNode()->getSimpleValueType(i);
327*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)
328*0b57cec5SDimitry Andric && TLI->getRegClassFor(VT)
329*0b57cec5SDimitry Andric && TLI->getRegClassFor(VT)->getID() == RCId)
330*0b57cec5SDimitry Andric RegBalance += numberRCValSuccInSU(SU, RCId);
331*0b57cec5SDimitry Andric }
332*0b57cec5SDimitry Andric // Kill estimate.
333*0b57cec5SDimitry Andric for (unsigned i = 0, e = SU->getNode()->getNumOperands(); i != e; ++i) {
334*0b57cec5SDimitry Andric const SDValue &Op = SU->getNode()->getOperand(i);
335*0b57cec5SDimitry Andric MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
336*0b57cec5SDimitry Andric if (isa<ConstantSDNode>(Op.getNode()))
337*0b57cec5SDimitry Andric continue;
338*0b57cec5SDimitry Andric
339*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT) && TLI->getRegClassFor(VT)
340*0b57cec5SDimitry Andric && TLI->getRegClassFor(VT)->getID() == RCId)
341*0b57cec5SDimitry Andric RegBalance -= numberRCValPredInSU(SU, RCId);
342*0b57cec5SDimitry Andric }
343*0b57cec5SDimitry Andric return RegBalance;
344*0b57cec5SDimitry Andric }
345*0b57cec5SDimitry Andric
346*0b57cec5SDimitry Andric /// Estimates change in reg pressure from this SU.
347*0b57cec5SDimitry Andric /// It is achieved by trivial tracking of defined
348*0b57cec5SDimitry Andric /// and used vregs in dependent instructions.
349*0b57cec5SDimitry Andric /// The RawPressure flag makes this function to ignore
350*0b57cec5SDimitry Andric /// existing reg file sizes, and report raw def/use
351*0b57cec5SDimitry Andric /// balance.
regPressureDelta(SUnit * SU,bool RawPressure)352*0b57cec5SDimitry Andric int ResourcePriorityQueue::regPressureDelta(SUnit *SU, bool RawPressure) {
353*0b57cec5SDimitry Andric int RegBalance = 0;
354*0b57cec5SDimitry Andric
355*0b57cec5SDimitry Andric if (!SU || !SU->getNode() || !SU->getNode()->isMachineOpcode())
356*0b57cec5SDimitry Andric return RegBalance;
357*0b57cec5SDimitry Andric
358*0b57cec5SDimitry Andric if (RawPressure) {
359*0b57cec5SDimitry Andric for (const TargetRegisterClass *RC : TRI->regclasses())
360*0b57cec5SDimitry Andric RegBalance += rawRegPressureDelta(SU, RC->getID());
361*0b57cec5SDimitry Andric }
362*0b57cec5SDimitry Andric else {
363*0b57cec5SDimitry Andric for (const TargetRegisterClass *RC : TRI->regclasses()) {
364*0b57cec5SDimitry Andric if ((RegPressure[RC->getID()] +
365*0b57cec5SDimitry Andric rawRegPressureDelta(SU, RC->getID()) > 0) &&
366*0b57cec5SDimitry Andric (RegPressure[RC->getID()] +
367*0b57cec5SDimitry Andric rawRegPressureDelta(SU, RC->getID()) >= RegLimit[RC->getID()]))
368*0b57cec5SDimitry Andric RegBalance += rawRegPressureDelta(SU, RC->getID());
369*0b57cec5SDimitry Andric }
370*0b57cec5SDimitry Andric }
371*0b57cec5SDimitry Andric
372*0b57cec5SDimitry Andric return RegBalance;
373*0b57cec5SDimitry Andric }
374*0b57cec5SDimitry Andric
375*0b57cec5SDimitry Andric // Constants used to denote relative importance of
376*0b57cec5SDimitry Andric // heuristic components for cost computation.
377*0b57cec5SDimitry Andric static const unsigned PriorityOne = 200;
378*0b57cec5SDimitry Andric static const unsigned PriorityTwo = 50;
379*0b57cec5SDimitry Andric static const unsigned PriorityThree = 15;
380*0b57cec5SDimitry Andric static const unsigned PriorityFour = 5;
381*0b57cec5SDimitry Andric static const unsigned ScaleOne = 20;
382*0b57cec5SDimitry Andric static const unsigned ScaleTwo = 10;
383*0b57cec5SDimitry Andric static const unsigned ScaleThree = 5;
384*0b57cec5SDimitry Andric static const unsigned FactorOne = 2;
385*0b57cec5SDimitry Andric
386*0b57cec5SDimitry Andric /// Returns single number reflecting benefit of scheduling SU
387*0b57cec5SDimitry Andric /// in the current cycle.
SUSchedulingCost(SUnit * SU)388*0b57cec5SDimitry Andric int ResourcePriorityQueue::SUSchedulingCost(SUnit *SU) {
389*0b57cec5SDimitry Andric // Initial trivial priority.
390*0b57cec5SDimitry Andric int ResCount = 1;
391*0b57cec5SDimitry Andric
392*0b57cec5SDimitry Andric // Do not waste time on a node that is already scheduled.
393*0b57cec5SDimitry Andric if (SU->isScheduled)
394*0b57cec5SDimitry Andric return ResCount;
395*0b57cec5SDimitry Andric
396*0b57cec5SDimitry Andric // Forced priority is high.
397*0b57cec5SDimitry Andric if (SU->isScheduleHigh)
398*0b57cec5SDimitry Andric ResCount += PriorityOne;
399*0b57cec5SDimitry Andric
400*0b57cec5SDimitry Andric // Adaptable scheduling
401*0b57cec5SDimitry Andric // A small, but very parallel
402*0b57cec5SDimitry Andric // region, where reg pressure is an issue.
403*0b57cec5SDimitry Andric if (HorizontalVerticalBalance > RegPressureThreshold) {
404*0b57cec5SDimitry Andric // Critical path first
405*0b57cec5SDimitry Andric ResCount += (SU->getHeight() * ScaleTwo);
406*0b57cec5SDimitry Andric // If resources are available for it, multiply the
407*0b57cec5SDimitry Andric // chance of scheduling.
408*0b57cec5SDimitry Andric if (isResourceAvailable(SU))
409*0b57cec5SDimitry Andric ResCount <<= FactorOne;
410*0b57cec5SDimitry Andric
411*0b57cec5SDimitry Andric // Consider change to reg pressure from scheduling
412*0b57cec5SDimitry Andric // this SU.
413*0b57cec5SDimitry Andric ResCount -= (regPressureDelta(SU,true) * ScaleOne);
414*0b57cec5SDimitry Andric }
415*0b57cec5SDimitry Andric // Default heuristic, greeady and
416*0b57cec5SDimitry Andric // critical path driven.
417*0b57cec5SDimitry Andric else {
418*0b57cec5SDimitry Andric // Critical path first.
419*0b57cec5SDimitry Andric ResCount += (SU->getHeight() * ScaleTwo);
420*0b57cec5SDimitry Andric // Now see how many instructions is blocked by this SU.
421*0b57cec5SDimitry Andric ResCount += (NumNodesSolelyBlocking[SU->NodeNum] * ScaleTwo);
422*0b57cec5SDimitry Andric // If resources are available for it, multiply the
423*0b57cec5SDimitry Andric // chance of scheduling.
424*0b57cec5SDimitry Andric if (isResourceAvailable(SU))
425*0b57cec5SDimitry Andric ResCount <<= FactorOne;
426*0b57cec5SDimitry Andric
427*0b57cec5SDimitry Andric ResCount -= (regPressureDelta(SU) * ScaleTwo);
428*0b57cec5SDimitry Andric }
429*0b57cec5SDimitry Andric
430*0b57cec5SDimitry Andric // These are platform-specific things.
431*0b57cec5SDimitry Andric // Will need to go into the back end
432*0b57cec5SDimitry Andric // and accessed from here via a hook.
433*0b57cec5SDimitry Andric for (SDNode *N = SU->getNode(); N; N = N->getGluedNode()) {
434*0b57cec5SDimitry Andric if (N->isMachineOpcode()) {
435*0b57cec5SDimitry Andric const MCInstrDesc &TID = TII->get(N->getMachineOpcode());
436*0b57cec5SDimitry Andric if (TID.isCall())
437*0b57cec5SDimitry Andric ResCount += (PriorityTwo + (ScaleThree*N->getNumValues()));
438*0b57cec5SDimitry Andric }
439*0b57cec5SDimitry Andric else
440*0b57cec5SDimitry Andric switch (N->getOpcode()) {
441*0b57cec5SDimitry Andric default: break;
442*0b57cec5SDimitry Andric case ISD::TokenFactor:
443*0b57cec5SDimitry Andric case ISD::CopyFromReg:
444*0b57cec5SDimitry Andric case ISD::CopyToReg:
445*0b57cec5SDimitry Andric ResCount += PriorityFour;
446*0b57cec5SDimitry Andric break;
447*0b57cec5SDimitry Andric
448*0b57cec5SDimitry Andric case ISD::INLINEASM:
449*0b57cec5SDimitry Andric case ISD::INLINEASM_BR:
450*0b57cec5SDimitry Andric ResCount += PriorityThree;
451*0b57cec5SDimitry Andric break;
452*0b57cec5SDimitry Andric }
453*0b57cec5SDimitry Andric }
454*0b57cec5SDimitry Andric return ResCount;
455*0b57cec5SDimitry Andric }
456*0b57cec5SDimitry Andric
457*0b57cec5SDimitry Andric
458*0b57cec5SDimitry Andric /// Main resource tracking point.
scheduledNode(SUnit * SU)459*0b57cec5SDimitry Andric void ResourcePriorityQueue::scheduledNode(SUnit *SU) {
460*0b57cec5SDimitry Andric // Use NULL entry as an event marker to reset
461*0b57cec5SDimitry Andric // the DFA state.
462*0b57cec5SDimitry Andric if (!SU) {
463*0b57cec5SDimitry Andric ResourcesModel->clearResources();
464*0b57cec5SDimitry Andric Packet.clear();
465*0b57cec5SDimitry Andric return;
466*0b57cec5SDimitry Andric }
467*0b57cec5SDimitry Andric
468*0b57cec5SDimitry Andric const SDNode *ScegN = SU->getNode();
469*0b57cec5SDimitry Andric // Update reg pressure tracking.
470*0b57cec5SDimitry Andric // First update current node.
471*0b57cec5SDimitry Andric if (ScegN->isMachineOpcode()) {
472*0b57cec5SDimitry Andric // Estimate generated regs.
473*0b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumValues(); i != e; ++i) {
474*0b57cec5SDimitry Andric MVT VT = ScegN->getSimpleValueType(i);
475*0b57cec5SDimitry Andric
476*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)) {
477*0b57cec5SDimitry Andric const TargetRegisterClass *RC = TLI->getRegClassFor(VT);
478*0b57cec5SDimitry Andric if (RC)
479*0b57cec5SDimitry Andric RegPressure[RC->getID()] += numberRCValSuccInSU(SU, RC->getID());
480*0b57cec5SDimitry Andric }
481*0b57cec5SDimitry Andric }
482*0b57cec5SDimitry Andric // Estimate killed regs.
483*0b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumOperands(); i != e; ++i) {
484*0b57cec5SDimitry Andric const SDValue &Op = ScegN->getOperand(i);
485*0b57cec5SDimitry Andric MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
486*0b57cec5SDimitry Andric
487*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)) {
488*0b57cec5SDimitry Andric const TargetRegisterClass *RC = TLI->getRegClassFor(VT);
489*0b57cec5SDimitry Andric if (RC) {
490*0b57cec5SDimitry Andric if (RegPressure[RC->getID()] >
491*0b57cec5SDimitry Andric (numberRCValPredInSU(SU, RC->getID())))
492*0b57cec5SDimitry Andric RegPressure[RC->getID()] -= numberRCValPredInSU(SU, RC->getID());
493*0b57cec5SDimitry Andric else RegPressure[RC->getID()] = 0;
494*0b57cec5SDimitry Andric }
495*0b57cec5SDimitry Andric }
496*0b57cec5SDimitry Andric }
497*0b57cec5SDimitry Andric for (SDep &Pred : SU->Preds) {
498*0b57cec5SDimitry Andric if (Pred.isCtrl() || (Pred.getSUnit()->NumRegDefsLeft == 0))
499*0b57cec5SDimitry Andric continue;
500*0b57cec5SDimitry Andric --Pred.getSUnit()->NumRegDefsLeft;
501*0b57cec5SDimitry Andric }
502*0b57cec5SDimitry Andric }
503*0b57cec5SDimitry Andric
504*0b57cec5SDimitry Andric // Reserve resources for this SU.
505*0b57cec5SDimitry Andric reserveResources(SU);
506*0b57cec5SDimitry Andric
507*0b57cec5SDimitry Andric // Adjust number of parallel live ranges.
508*0b57cec5SDimitry Andric // Heuristic is simple - node with no data successors reduces
509*0b57cec5SDimitry Andric // number of live ranges. All others, increase it.
510*0b57cec5SDimitry Andric unsigned NumberNonControlDeps = 0;
511*0b57cec5SDimitry Andric
512*0b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs) {
513*0b57cec5SDimitry Andric adjustPriorityOfUnscheduledPreds(Succ.getSUnit());
514*0b57cec5SDimitry Andric if (!Succ.isCtrl())
515*0b57cec5SDimitry Andric NumberNonControlDeps++;
516*0b57cec5SDimitry Andric }
517*0b57cec5SDimitry Andric
518*0b57cec5SDimitry Andric if (!NumberNonControlDeps) {
519*0b57cec5SDimitry Andric if (ParallelLiveRanges >= SU->NumPreds)
520*0b57cec5SDimitry Andric ParallelLiveRanges -= SU->NumPreds;
521*0b57cec5SDimitry Andric else
522*0b57cec5SDimitry Andric ParallelLiveRanges = 0;
523*0b57cec5SDimitry Andric
524*0b57cec5SDimitry Andric }
525*0b57cec5SDimitry Andric else
526*0b57cec5SDimitry Andric ParallelLiveRanges += SU->NumRegDefsLeft;
527*0b57cec5SDimitry Andric
528*0b57cec5SDimitry Andric // Track parallel live chains.
529*0b57cec5SDimitry Andric HorizontalVerticalBalance += (SU->Succs.size() - numberCtrlDepsInSU(SU));
530*0b57cec5SDimitry Andric HorizontalVerticalBalance -= (SU->Preds.size() - numberCtrlPredInSU(SU));
531*0b57cec5SDimitry Andric }
532*0b57cec5SDimitry Andric
initNumRegDefsLeft(SUnit * SU)533*0b57cec5SDimitry Andric void ResourcePriorityQueue::initNumRegDefsLeft(SUnit *SU) {
534*0b57cec5SDimitry Andric unsigned NodeNumDefs = 0;
535*0b57cec5SDimitry Andric for (SDNode *N = SU->getNode(); N; N = N->getGluedNode())
536*0b57cec5SDimitry Andric if (N->isMachineOpcode()) {
537*0b57cec5SDimitry Andric const MCInstrDesc &TID = TII->get(N->getMachineOpcode());
538*0b57cec5SDimitry Andric // No register need be allocated for this.
539*0b57cec5SDimitry Andric if (N->getMachineOpcode() == TargetOpcode::IMPLICIT_DEF) {
540*0b57cec5SDimitry Andric NodeNumDefs = 0;
541*0b57cec5SDimitry Andric break;
542*0b57cec5SDimitry Andric }
543*0b57cec5SDimitry Andric NodeNumDefs = std::min(N->getNumValues(), TID.getNumDefs());
544*0b57cec5SDimitry Andric }
545*0b57cec5SDimitry Andric else
546*0b57cec5SDimitry Andric switch(N->getOpcode()) {
547*0b57cec5SDimitry Andric default: break;
548*0b57cec5SDimitry Andric case ISD::CopyFromReg:
549*0b57cec5SDimitry Andric NodeNumDefs++;
550*0b57cec5SDimitry Andric break;
551*0b57cec5SDimitry Andric case ISD::INLINEASM:
552*0b57cec5SDimitry Andric case ISD::INLINEASM_BR:
553*0b57cec5SDimitry Andric NodeNumDefs++;
554*0b57cec5SDimitry Andric break;
555*0b57cec5SDimitry Andric }
556*0b57cec5SDimitry Andric
557*0b57cec5SDimitry Andric SU->NumRegDefsLeft = NodeNumDefs;
558*0b57cec5SDimitry Andric }
559*0b57cec5SDimitry Andric
560*0b57cec5SDimitry Andric /// adjustPriorityOfUnscheduledPreds - One of the predecessors of SU was just
561*0b57cec5SDimitry Andric /// scheduled. If SU is not itself available, then there is at least one
562*0b57cec5SDimitry Andric /// predecessor node that has not been scheduled yet. If SU has exactly ONE
563*0b57cec5SDimitry Andric /// unscheduled predecessor, we want to increase its priority: it getting
564*0b57cec5SDimitry Andric /// scheduled will make this node available, so it is better than some other
565*0b57cec5SDimitry Andric /// node of the same priority that will not make a node available.
adjustPriorityOfUnscheduledPreds(SUnit * SU)566*0b57cec5SDimitry Andric void ResourcePriorityQueue::adjustPriorityOfUnscheduledPreds(SUnit *SU) {
567*0b57cec5SDimitry Andric if (SU->isAvailable) return; // All preds scheduled.
568*0b57cec5SDimitry Andric
569*0b57cec5SDimitry Andric SUnit *OnlyAvailablePred = getSingleUnscheduledPred(SU);
570*0b57cec5SDimitry Andric if (!OnlyAvailablePred || !OnlyAvailablePred->isAvailable)
571*0b57cec5SDimitry Andric return;
572*0b57cec5SDimitry Andric
573*0b57cec5SDimitry Andric // Okay, we found a single predecessor that is available, but not scheduled.
574*0b57cec5SDimitry Andric // Since it is available, it must be in the priority queue. First remove it.
575*0b57cec5SDimitry Andric remove(OnlyAvailablePred);
576*0b57cec5SDimitry Andric
577*0b57cec5SDimitry Andric // Reinsert the node into the priority queue, which recomputes its
578*0b57cec5SDimitry Andric // NumNodesSolelyBlocking value.
579*0b57cec5SDimitry Andric push(OnlyAvailablePred);
580*0b57cec5SDimitry Andric }
581*0b57cec5SDimitry Andric
582*0b57cec5SDimitry Andric
583*0b57cec5SDimitry Andric /// Main access point - returns next instructions
584*0b57cec5SDimitry Andric /// to be placed in scheduling sequence.
pop()585*0b57cec5SDimitry Andric SUnit *ResourcePriorityQueue::pop() {
586*0b57cec5SDimitry Andric if (empty())
587*0b57cec5SDimitry Andric return nullptr;
588*0b57cec5SDimitry Andric
589*0b57cec5SDimitry Andric std::vector<SUnit *>::iterator Best = Queue.begin();
590*0b57cec5SDimitry Andric if (!DisableDFASched) {
591*0b57cec5SDimitry Andric int BestCost = SUSchedulingCost(*Best);
592*0b57cec5SDimitry Andric for (auto I = std::next(Queue.begin()), E = Queue.end(); I != E; ++I) {
593*0b57cec5SDimitry Andric
594*0b57cec5SDimitry Andric if (SUSchedulingCost(*I) > BestCost) {
595*0b57cec5SDimitry Andric BestCost = SUSchedulingCost(*I);
596*0b57cec5SDimitry Andric Best = I;
597*0b57cec5SDimitry Andric }
598*0b57cec5SDimitry Andric }
599*0b57cec5SDimitry Andric }
600*0b57cec5SDimitry Andric // Use default TD scheduling mechanism.
601*0b57cec5SDimitry Andric else {
602*0b57cec5SDimitry Andric for (auto I = std::next(Queue.begin()), E = Queue.end(); I != E; ++I)
603*0b57cec5SDimitry Andric if (Picker(*Best, *I))
604*0b57cec5SDimitry Andric Best = I;
605*0b57cec5SDimitry Andric }
606*0b57cec5SDimitry Andric
607*0b57cec5SDimitry Andric SUnit *V = *Best;
608*0b57cec5SDimitry Andric if (Best != std::prev(Queue.end()))
609*0b57cec5SDimitry Andric std::swap(*Best, Queue.back());
610*0b57cec5SDimitry Andric
611*0b57cec5SDimitry Andric Queue.pop_back();
612*0b57cec5SDimitry Andric
613*0b57cec5SDimitry Andric return V;
614*0b57cec5SDimitry Andric }
615*0b57cec5SDimitry Andric
616*0b57cec5SDimitry Andric
remove(SUnit * SU)617*0b57cec5SDimitry Andric void ResourcePriorityQueue::remove(SUnit *SU) {
618*0b57cec5SDimitry Andric assert(!Queue.empty() && "Queue is empty!");
619*0b57cec5SDimitry Andric std::vector<SUnit *>::iterator I = find(Queue, SU);
620*0b57cec5SDimitry Andric if (I != std::prev(Queue.end()))
621*0b57cec5SDimitry Andric std::swap(*I, Queue.back());
622*0b57cec5SDimitry Andric
623*0b57cec5SDimitry Andric Queue.pop_back();
624*0b57cec5SDimitry Andric }
625*0b57cec5SDimitry Andric