1*0b57cec5SDimitry Andric //===- ResourcePriorityQueue.cpp - A DFA-oriented priority queue -*- C++ -*-==//
2*0b57cec5SDimitry Andric //
3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*0b57cec5SDimitry Andric //
7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
8*0b57cec5SDimitry Andric //
9*0b57cec5SDimitry Andric // This file implements the ResourcePriorityQueue class, which is a
10*0b57cec5SDimitry Andric // SchedulingPriorityQueue that prioritizes instructions using DFA state to
11*0b57cec5SDimitry Andric // reduce the length of the critical path through the basic block
12*0b57cec5SDimitry Andric // on VLIW platforms.
13*0b57cec5SDimitry Andric // The scheduler is basically a top-down adaptable list scheduler with DFA
14*0b57cec5SDimitry Andric // resource tracking added to the cost function.
15*0b57cec5SDimitry Andric // DFA is queried as a state machine to model "packets/bundles" during
16*0b57cec5SDimitry Andric // schedule. Currently packets/bundles are discarded at the end of
17*0b57cec5SDimitry Andric // scheduling, affecting only order of instructions.
18*0b57cec5SDimitry Andric //
19*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
20*0b57cec5SDimitry Andric
21*0b57cec5SDimitry Andric #include "llvm/CodeGen/ResourcePriorityQueue.h"
22*0b57cec5SDimitry Andric #include "llvm/CodeGen/DFAPacketizer.h"
23*0b57cec5SDimitry Andric #include "llvm/CodeGen/MachineInstr.h"
24*0b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGISel.h"
25*0b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGNodes.h"
26*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetInstrInfo.h"
27*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetLowering.h"
28*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetRegisterInfo.h"
29*0b57cec5SDimitry Andric #include "llvm/CodeGen/TargetSubtargetInfo.h"
30*0b57cec5SDimitry Andric #include "llvm/Support/CommandLine.h"
31*0b57cec5SDimitry Andric #include "llvm/Support/Debug.h"
32*0b57cec5SDimitry Andric #include "llvm/Support/raw_ostream.h"
33*0b57cec5SDimitry Andric #include "llvm/Target/TargetMachine.h"
34*0b57cec5SDimitry Andric
35*0b57cec5SDimitry Andric using namespace llvm;
36*0b57cec5SDimitry Andric
37*0b57cec5SDimitry Andric #define DEBUG_TYPE "scheduler"
38*0b57cec5SDimitry Andric
39*0b57cec5SDimitry Andric static cl::opt<bool> DisableDFASched("disable-dfa-sched", cl::Hidden,
40*0b57cec5SDimitry Andric cl::ZeroOrMore, cl::init(false),
41*0b57cec5SDimitry Andric cl::desc("Disable use of DFA during scheduling"));
42*0b57cec5SDimitry Andric
43*0b57cec5SDimitry Andric static cl::opt<int> RegPressureThreshold(
44*0b57cec5SDimitry Andric "dfa-sched-reg-pressure-threshold", cl::Hidden, cl::ZeroOrMore, cl::init(5),
45*0b57cec5SDimitry Andric cl::desc("Track reg pressure and switch priority to in-depth"));
46*0b57cec5SDimitry Andric
ResourcePriorityQueue(SelectionDAGISel * IS)47*0b57cec5SDimitry Andric ResourcePriorityQueue::ResourcePriorityQueue(SelectionDAGISel *IS)
48*0b57cec5SDimitry Andric : Picker(this), InstrItins(IS->MF->getSubtarget().getInstrItineraryData()) {
49*0b57cec5SDimitry Andric const TargetSubtargetInfo &STI = IS->MF->getSubtarget();
50*0b57cec5SDimitry Andric TRI = STI.getRegisterInfo();
51*0b57cec5SDimitry Andric TLI = IS->TLI;
52*0b57cec5SDimitry Andric TII = STI.getInstrInfo();
53*0b57cec5SDimitry Andric ResourcesModel.reset(TII->CreateTargetScheduleState(STI));
54*0b57cec5SDimitry Andric // This hard requirement could be relaxed, but for now
55*0b57cec5SDimitry Andric // do not let it proceed.
56*0b57cec5SDimitry Andric assert(ResourcesModel && "Unimplemented CreateTargetScheduleState.");
57*0b57cec5SDimitry Andric
58*0b57cec5SDimitry Andric unsigned NumRC = TRI->getNumRegClasses();
59*0b57cec5SDimitry Andric RegLimit.resize(NumRC);
60*0b57cec5SDimitry Andric RegPressure.resize(NumRC);
61*0b57cec5SDimitry Andric std::fill(RegLimit.begin(), RegLimit.end(), 0);
62*0b57cec5SDimitry Andric std::fill(RegPressure.begin(), RegPressure.end(), 0);
63*0b57cec5SDimitry Andric for (const TargetRegisterClass *RC : TRI->regclasses())
64*0b57cec5SDimitry Andric RegLimit[RC->getID()] = TRI->getRegPressureLimit(RC, *IS->MF);
65*0b57cec5SDimitry Andric
66*0b57cec5SDimitry Andric ParallelLiveRanges = 0;
67*0b57cec5SDimitry Andric HorizontalVerticalBalance = 0;
68*0b57cec5SDimitry Andric }
69*0b57cec5SDimitry Andric
70*0b57cec5SDimitry Andric unsigned
numberRCValPredInSU(SUnit * SU,unsigned RCId)71*0b57cec5SDimitry Andric ResourcePriorityQueue::numberRCValPredInSU(SUnit *SU, unsigned RCId) {
72*0b57cec5SDimitry Andric unsigned NumberDeps = 0;
73*0b57cec5SDimitry Andric for (SDep &Pred : SU->Preds) {
74*0b57cec5SDimitry Andric if (Pred.isCtrl())
75*0b57cec5SDimitry Andric continue;
76*0b57cec5SDimitry Andric
77*0b57cec5SDimitry Andric SUnit *PredSU = Pred.getSUnit();
78*0b57cec5SDimitry Andric const SDNode *ScegN = PredSU->getNode();
79*0b57cec5SDimitry Andric
80*0b57cec5SDimitry Andric if (!ScegN)
81*0b57cec5SDimitry Andric continue;
82*0b57cec5SDimitry Andric
83*0b57cec5SDimitry Andric // If value is passed to CopyToReg, it is probably
84*0b57cec5SDimitry Andric // live outside BB.
85*0b57cec5SDimitry Andric switch (ScegN->getOpcode()) {
86*0b57cec5SDimitry Andric default: break;
87*0b57cec5SDimitry Andric case ISD::TokenFactor: break;
88*0b57cec5SDimitry Andric case ISD::CopyFromReg: NumberDeps++; break;
89*0b57cec5SDimitry Andric case ISD::CopyToReg: break;
90*0b57cec5SDimitry Andric case ISD::INLINEASM: break;
91*0b57cec5SDimitry Andric case ISD::INLINEASM_BR: break;
92*0b57cec5SDimitry Andric }
93*0b57cec5SDimitry Andric if (!ScegN->isMachineOpcode())
94*0b57cec5SDimitry Andric continue;
95*0b57cec5SDimitry Andric
96*0b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumValues(); i != e; ++i) {
97*0b57cec5SDimitry Andric MVT VT = ScegN->getSimpleValueType(i);
98*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)
99*0b57cec5SDimitry Andric && (TLI->getRegClassFor(VT)->getID() == RCId)) {
100*0b57cec5SDimitry Andric NumberDeps++;
101*0b57cec5SDimitry Andric break;
102*0b57cec5SDimitry Andric }
103*0b57cec5SDimitry Andric }
104*0b57cec5SDimitry Andric }
105*0b57cec5SDimitry Andric return NumberDeps;
106*0b57cec5SDimitry Andric }
107*0b57cec5SDimitry Andric
numberRCValSuccInSU(SUnit * SU,unsigned RCId)108*0b57cec5SDimitry Andric unsigned ResourcePriorityQueue::numberRCValSuccInSU(SUnit *SU,
109*0b57cec5SDimitry Andric unsigned RCId) {
110*0b57cec5SDimitry Andric unsigned NumberDeps = 0;
111*0b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs) {
112*0b57cec5SDimitry Andric if (Succ.isCtrl())
113*0b57cec5SDimitry Andric continue;
114*0b57cec5SDimitry Andric
115*0b57cec5SDimitry Andric SUnit *SuccSU = Succ.getSUnit();
116*0b57cec5SDimitry Andric const SDNode *ScegN = SuccSU->getNode();
117*0b57cec5SDimitry Andric if (!ScegN)
118*0b57cec5SDimitry Andric continue;
119*0b57cec5SDimitry Andric
120*0b57cec5SDimitry Andric // If value is passed to CopyToReg, it is probably
121*0b57cec5SDimitry Andric // live outside BB.
122*0b57cec5SDimitry Andric switch (ScegN->getOpcode()) {
123*0b57cec5SDimitry Andric default: break;
124*0b57cec5SDimitry Andric case ISD::TokenFactor: break;
125*0b57cec5SDimitry Andric case ISD::CopyFromReg: break;
126*0b57cec5SDimitry Andric case ISD::CopyToReg: NumberDeps++; break;
127*0b57cec5SDimitry Andric case ISD::INLINEASM: break;
128*0b57cec5SDimitry Andric case ISD::INLINEASM_BR: break;
129*0b57cec5SDimitry Andric }
130*0b57cec5SDimitry Andric if (!ScegN->isMachineOpcode())
131*0b57cec5SDimitry Andric continue;
132*0b57cec5SDimitry Andric
133*0b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumOperands(); i != e; ++i) {
134*0b57cec5SDimitry Andric const SDValue &Op = ScegN->getOperand(i);
135*0b57cec5SDimitry Andric MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
136*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)
137*0b57cec5SDimitry Andric && (TLI->getRegClassFor(VT)->getID() == RCId)) {
138*0b57cec5SDimitry Andric NumberDeps++;
139*0b57cec5SDimitry Andric break;
140*0b57cec5SDimitry Andric }
141*0b57cec5SDimitry Andric }
142*0b57cec5SDimitry Andric }
143*0b57cec5SDimitry Andric return NumberDeps;
144*0b57cec5SDimitry Andric }
145*0b57cec5SDimitry Andric
numberCtrlDepsInSU(SUnit * SU)146*0b57cec5SDimitry Andric static unsigned numberCtrlDepsInSU(SUnit *SU) {
147*0b57cec5SDimitry Andric unsigned NumberDeps = 0;
148*0b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs)
149*0b57cec5SDimitry Andric if (Succ.isCtrl())
150*0b57cec5SDimitry Andric NumberDeps++;
151*0b57cec5SDimitry Andric
152*0b57cec5SDimitry Andric return NumberDeps;
153*0b57cec5SDimitry Andric }
154*0b57cec5SDimitry Andric
numberCtrlPredInSU(SUnit * SU)155*0b57cec5SDimitry Andric static unsigned numberCtrlPredInSU(SUnit *SU) {
156*0b57cec5SDimitry Andric unsigned NumberDeps = 0;
157*0b57cec5SDimitry Andric for (SDep &Pred : SU->Preds)
158*0b57cec5SDimitry Andric if (Pred.isCtrl())
159*0b57cec5SDimitry Andric NumberDeps++;
160*0b57cec5SDimitry Andric
161*0b57cec5SDimitry Andric return NumberDeps;
162*0b57cec5SDimitry Andric }
163*0b57cec5SDimitry Andric
164*0b57cec5SDimitry Andric ///
165*0b57cec5SDimitry Andric /// Initialize nodes.
166*0b57cec5SDimitry Andric ///
initNodes(std::vector<SUnit> & sunits)167*0b57cec5SDimitry Andric void ResourcePriorityQueue::initNodes(std::vector<SUnit> &sunits) {
168*0b57cec5SDimitry Andric SUnits = &sunits;
169*0b57cec5SDimitry Andric NumNodesSolelyBlocking.resize(SUnits->size(), 0);
170*0b57cec5SDimitry Andric
171*0b57cec5SDimitry Andric for (unsigned i = 0, e = SUnits->size(); i != e; ++i) {
172*0b57cec5SDimitry Andric SUnit *SU = &(*SUnits)[i];
173*0b57cec5SDimitry Andric initNumRegDefsLeft(SU);
174*0b57cec5SDimitry Andric SU->NodeQueueId = 0;
175*0b57cec5SDimitry Andric }
176*0b57cec5SDimitry Andric }
177*0b57cec5SDimitry Andric
178*0b57cec5SDimitry Andric /// This heuristic is used if DFA scheduling is not desired
179*0b57cec5SDimitry Andric /// for some VLIW platform.
operator ()(const SUnit * LHS,const SUnit * RHS) const180*0b57cec5SDimitry Andric bool resource_sort::operator()(const SUnit *LHS, const SUnit *RHS) const {
181*0b57cec5SDimitry Andric // The isScheduleHigh flag allows nodes with wraparound dependencies that
182*0b57cec5SDimitry Andric // cannot easily be modeled as edges with latencies to be scheduled as
183*0b57cec5SDimitry Andric // soon as possible in a top-down schedule.
184*0b57cec5SDimitry Andric if (LHS->isScheduleHigh && !RHS->isScheduleHigh)
185*0b57cec5SDimitry Andric return false;
186*0b57cec5SDimitry Andric
187*0b57cec5SDimitry Andric if (!LHS->isScheduleHigh && RHS->isScheduleHigh)
188*0b57cec5SDimitry Andric return true;
189*0b57cec5SDimitry Andric
190*0b57cec5SDimitry Andric unsigned LHSNum = LHS->NodeNum;
191*0b57cec5SDimitry Andric unsigned RHSNum = RHS->NodeNum;
192*0b57cec5SDimitry Andric
193*0b57cec5SDimitry Andric // The most important heuristic is scheduling the critical path.
194*0b57cec5SDimitry Andric unsigned LHSLatency = PQ->getLatency(LHSNum);
195*0b57cec5SDimitry Andric unsigned RHSLatency = PQ->getLatency(RHSNum);
196*0b57cec5SDimitry Andric if (LHSLatency < RHSLatency) return true;
197*0b57cec5SDimitry Andric if (LHSLatency > RHSLatency) return false;
198*0b57cec5SDimitry Andric
199*0b57cec5SDimitry Andric // After that, if two nodes have identical latencies, look to see if one will
200*0b57cec5SDimitry Andric // unblock more other nodes than the other.
201*0b57cec5SDimitry Andric unsigned LHSBlocked = PQ->getNumSolelyBlockNodes(LHSNum);
202*0b57cec5SDimitry Andric unsigned RHSBlocked = PQ->getNumSolelyBlockNodes(RHSNum);
203*0b57cec5SDimitry Andric if (LHSBlocked < RHSBlocked) return true;
204*0b57cec5SDimitry Andric if (LHSBlocked > RHSBlocked) return false;
205*0b57cec5SDimitry Andric
206*0b57cec5SDimitry Andric // Finally, just to provide a stable ordering, use the node number as a
207*0b57cec5SDimitry Andric // deciding factor.
208*0b57cec5SDimitry Andric return LHSNum < RHSNum;
209*0b57cec5SDimitry Andric }
210*0b57cec5SDimitry Andric
211*0b57cec5SDimitry Andric
212*0b57cec5SDimitry Andric /// getSingleUnscheduledPred - If there is exactly one unscheduled predecessor
213*0b57cec5SDimitry Andric /// of SU, return it, otherwise return null.
getSingleUnscheduledPred(SUnit * SU)214*0b57cec5SDimitry Andric SUnit *ResourcePriorityQueue::getSingleUnscheduledPred(SUnit *SU) {
215*0b57cec5SDimitry Andric SUnit *OnlyAvailablePred = nullptr;
216*0b57cec5SDimitry Andric for (const SDep &Pred : SU->Preds) {
217*0b57cec5SDimitry Andric SUnit &PredSU = *Pred.getSUnit();
218*0b57cec5SDimitry Andric if (!PredSU.isScheduled) {
219*0b57cec5SDimitry Andric // We found an available, but not scheduled, predecessor. If it's the
220*0b57cec5SDimitry Andric // only one we have found, keep track of it... otherwise give up.
221*0b57cec5SDimitry Andric if (OnlyAvailablePred && OnlyAvailablePred != &PredSU)
222*0b57cec5SDimitry Andric return nullptr;
223*0b57cec5SDimitry Andric OnlyAvailablePred = &PredSU;
224*0b57cec5SDimitry Andric }
225*0b57cec5SDimitry Andric }
226*0b57cec5SDimitry Andric return OnlyAvailablePred;
227*0b57cec5SDimitry Andric }
228*0b57cec5SDimitry Andric
push(SUnit * SU)229*0b57cec5SDimitry Andric void ResourcePriorityQueue::push(SUnit *SU) {
230*0b57cec5SDimitry Andric // Look at all of the successors of this node. Count the number of nodes that
231*0b57cec5SDimitry Andric // this node is the sole unscheduled node for.
232*0b57cec5SDimitry Andric unsigned NumNodesBlocking = 0;
233*0b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs)
234*0b57cec5SDimitry Andric if (getSingleUnscheduledPred(Succ.getSUnit()) == SU)
235*0b57cec5SDimitry Andric ++NumNodesBlocking;
236*0b57cec5SDimitry Andric
237*0b57cec5SDimitry Andric NumNodesSolelyBlocking[SU->NodeNum] = NumNodesBlocking;
238*0b57cec5SDimitry Andric Queue.push_back(SU);
239*0b57cec5SDimitry Andric }
240*0b57cec5SDimitry Andric
241*0b57cec5SDimitry Andric /// Check if scheduling of this SU is possible
242*0b57cec5SDimitry Andric /// in the current packet.
isResourceAvailable(SUnit * SU)243*0b57cec5SDimitry Andric bool ResourcePriorityQueue::isResourceAvailable(SUnit *SU) {
244*0b57cec5SDimitry Andric if (!SU || !SU->getNode())
245*0b57cec5SDimitry Andric return false;
246*0b57cec5SDimitry Andric
247*0b57cec5SDimitry Andric // If this is a compound instruction,
248*0b57cec5SDimitry Andric // it is likely to be a call. Do not delay it.
249*0b57cec5SDimitry Andric if (SU->getNode()->getGluedNode())
250*0b57cec5SDimitry Andric return true;
251*0b57cec5SDimitry Andric
252*0b57cec5SDimitry Andric // First see if the pipeline could receive this instruction
253*0b57cec5SDimitry Andric // in the current cycle.
254*0b57cec5SDimitry Andric if (SU->getNode()->isMachineOpcode())
255*0b57cec5SDimitry Andric switch (SU->getNode()->getMachineOpcode()) {
256*0b57cec5SDimitry Andric default:
257*0b57cec5SDimitry Andric if (!ResourcesModel->canReserveResources(&TII->get(
258*0b57cec5SDimitry Andric SU->getNode()->getMachineOpcode())))
259*0b57cec5SDimitry Andric return false;
260*0b57cec5SDimitry Andric break;
261*0b57cec5SDimitry Andric case TargetOpcode::EXTRACT_SUBREG:
262*0b57cec5SDimitry Andric case TargetOpcode::INSERT_SUBREG:
263*0b57cec5SDimitry Andric case TargetOpcode::SUBREG_TO_REG:
264*0b57cec5SDimitry Andric case TargetOpcode::REG_SEQUENCE:
265*0b57cec5SDimitry Andric case TargetOpcode::IMPLICIT_DEF:
266*0b57cec5SDimitry Andric break;
267*0b57cec5SDimitry Andric }
268*0b57cec5SDimitry Andric
269*0b57cec5SDimitry Andric // Now see if there are no other dependencies
270*0b57cec5SDimitry Andric // to instructions already in the packet.
271*0b57cec5SDimitry Andric for (unsigned i = 0, e = Packet.size(); i != e; ++i)
272*0b57cec5SDimitry Andric for (const SDep &Succ : Packet[i]->Succs) {
273*0b57cec5SDimitry Andric // Since we do not add pseudos to packets, might as well
274*0b57cec5SDimitry Andric // ignore order deps.
275*0b57cec5SDimitry Andric if (Succ.isCtrl())
276*0b57cec5SDimitry Andric continue;
277*0b57cec5SDimitry Andric
278*0b57cec5SDimitry Andric if (Succ.getSUnit() == SU)
279*0b57cec5SDimitry Andric return false;
280*0b57cec5SDimitry Andric }
281*0b57cec5SDimitry Andric
282*0b57cec5SDimitry Andric return true;
283*0b57cec5SDimitry Andric }
284*0b57cec5SDimitry Andric
285*0b57cec5SDimitry Andric /// Keep track of available resources.
reserveResources(SUnit * SU)286*0b57cec5SDimitry Andric void ResourcePriorityQueue::reserveResources(SUnit *SU) {
287*0b57cec5SDimitry Andric // If this SU does not fit in the packet
288*0b57cec5SDimitry Andric // start a new one.
289*0b57cec5SDimitry Andric if (!isResourceAvailable(SU) || SU->getNode()->getGluedNode()) {
290*0b57cec5SDimitry Andric ResourcesModel->clearResources();
291*0b57cec5SDimitry Andric Packet.clear();
292*0b57cec5SDimitry Andric }
293*0b57cec5SDimitry Andric
294*0b57cec5SDimitry Andric if (SU->getNode() && SU->getNode()->isMachineOpcode()) {
295*0b57cec5SDimitry Andric switch (SU->getNode()->getMachineOpcode()) {
296*0b57cec5SDimitry Andric default:
297*0b57cec5SDimitry Andric ResourcesModel->reserveResources(&TII->get(
298*0b57cec5SDimitry Andric SU->getNode()->getMachineOpcode()));
299*0b57cec5SDimitry Andric break;
300*0b57cec5SDimitry Andric case TargetOpcode::EXTRACT_SUBREG:
301*0b57cec5SDimitry Andric case TargetOpcode::INSERT_SUBREG:
302*0b57cec5SDimitry Andric case TargetOpcode::SUBREG_TO_REG:
303*0b57cec5SDimitry Andric case TargetOpcode::REG_SEQUENCE:
304*0b57cec5SDimitry Andric case TargetOpcode::IMPLICIT_DEF:
305*0b57cec5SDimitry Andric break;
306*0b57cec5SDimitry Andric }
307*0b57cec5SDimitry Andric Packet.push_back(SU);
308*0b57cec5SDimitry Andric }
309*0b57cec5SDimitry Andric // Forcefully end packet for PseudoOps.
310*0b57cec5SDimitry Andric else {
311*0b57cec5SDimitry Andric ResourcesModel->clearResources();
312*0b57cec5SDimitry Andric Packet.clear();
313*0b57cec5SDimitry Andric }
314*0b57cec5SDimitry Andric
315*0b57cec5SDimitry Andric // If packet is now full, reset the state so in the next cycle
316*0b57cec5SDimitry Andric // we start fresh.
317*0b57cec5SDimitry Andric if (Packet.size() >= InstrItins->SchedModel.IssueWidth) {
318*0b57cec5SDimitry Andric ResourcesModel->clearResources();
319*0b57cec5SDimitry Andric Packet.clear();
320*0b57cec5SDimitry Andric }
321*0b57cec5SDimitry Andric }
322*0b57cec5SDimitry Andric
rawRegPressureDelta(SUnit * SU,unsigned RCId)323*0b57cec5SDimitry Andric int ResourcePriorityQueue::rawRegPressureDelta(SUnit *SU, unsigned RCId) {
324*0b57cec5SDimitry Andric int RegBalance = 0;
325*0b57cec5SDimitry Andric
326*0b57cec5SDimitry Andric if (!SU || !SU->getNode() || !SU->getNode()->isMachineOpcode())
327*0b57cec5SDimitry Andric return RegBalance;
328*0b57cec5SDimitry Andric
329*0b57cec5SDimitry Andric // Gen estimate.
330*0b57cec5SDimitry Andric for (unsigned i = 0, e = SU->getNode()->getNumValues(); i != e; ++i) {
331*0b57cec5SDimitry Andric MVT VT = SU->getNode()->getSimpleValueType(i);
332*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)
333*0b57cec5SDimitry Andric && TLI->getRegClassFor(VT)
334*0b57cec5SDimitry Andric && TLI->getRegClassFor(VT)->getID() == RCId)
335*0b57cec5SDimitry Andric RegBalance += numberRCValSuccInSU(SU, RCId);
336*0b57cec5SDimitry Andric }
337*0b57cec5SDimitry Andric // Kill estimate.
338*0b57cec5SDimitry Andric for (unsigned i = 0, e = SU->getNode()->getNumOperands(); i != e; ++i) {
339*0b57cec5SDimitry Andric const SDValue &Op = SU->getNode()->getOperand(i);
340*0b57cec5SDimitry Andric MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
341*0b57cec5SDimitry Andric if (isa<ConstantSDNode>(Op.getNode()))
342*0b57cec5SDimitry Andric continue;
343*0b57cec5SDimitry Andric
344*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT) && TLI->getRegClassFor(VT)
345*0b57cec5SDimitry Andric && TLI->getRegClassFor(VT)->getID() == RCId)
346*0b57cec5SDimitry Andric RegBalance -= numberRCValPredInSU(SU, RCId);
347*0b57cec5SDimitry Andric }
348*0b57cec5SDimitry Andric return RegBalance;
349*0b57cec5SDimitry Andric }
350*0b57cec5SDimitry Andric
351*0b57cec5SDimitry Andric /// Estimates change in reg pressure from this SU.
352*0b57cec5SDimitry Andric /// It is achieved by trivial tracking of defined
353*0b57cec5SDimitry Andric /// and used vregs in dependent instructions.
354*0b57cec5SDimitry Andric /// The RawPressure flag makes this function to ignore
355*0b57cec5SDimitry Andric /// existing reg file sizes, and report raw def/use
356*0b57cec5SDimitry Andric /// balance.
regPressureDelta(SUnit * SU,bool RawPressure)357*0b57cec5SDimitry Andric int ResourcePriorityQueue::regPressureDelta(SUnit *SU, bool RawPressure) {
358*0b57cec5SDimitry Andric int RegBalance = 0;
359*0b57cec5SDimitry Andric
360*0b57cec5SDimitry Andric if (!SU || !SU->getNode() || !SU->getNode()->isMachineOpcode())
361*0b57cec5SDimitry Andric return RegBalance;
362*0b57cec5SDimitry Andric
363*0b57cec5SDimitry Andric if (RawPressure) {
364*0b57cec5SDimitry Andric for (const TargetRegisterClass *RC : TRI->regclasses())
365*0b57cec5SDimitry Andric RegBalance += rawRegPressureDelta(SU, RC->getID());
366*0b57cec5SDimitry Andric }
367*0b57cec5SDimitry Andric else {
368*0b57cec5SDimitry Andric for (const TargetRegisterClass *RC : TRI->regclasses()) {
369*0b57cec5SDimitry Andric if ((RegPressure[RC->getID()] +
370*0b57cec5SDimitry Andric rawRegPressureDelta(SU, RC->getID()) > 0) &&
371*0b57cec5SDimitry Andric (RegPressure[RC->getID()] +
372*0b57cec5SDimitry Andric rawRegPressureDelta(SU, RC->getID()) >= RegLimit[RC->getID()]))
373*0b57cec5SDimitry Andric RegBalance += rawRegPressureDelta(SU, RC->getID());
374*0b57cec5SDimitry Andric }
375*0b57cec5SDimitry Andric }
376*0b57cec5SDimitry Andric
377*0b57cec5SDimitry Andric return RegBalance;
378*0b57cec5SDimitry Andric }
379*0b57cec5SDimitry Andric
380*0b57cec5SDimitry Andric // Constants used to denote relative importance of
381*0b57cec5SDimitry Andric // heuristic components for cost computation.
382*0b57cec5SDimitry Andric static const unsigned PriorityOne = 200;
383*0b57cec5SDimitry Andric static const unsigned PriorityTwo = 50;
384*0b57cec5SDimitry Andric static const unsigned PriorityThree = 15;
385*0b57cec5SDimitry Andric static const unsigned PriorityFour = 5;
386*0b57cec5SDimitry Andric static const unsigned ScaleOne = 20;
387*0b57cec5SDimitry Andric static const unsigned ScaleTwo = 10;
388*0b57cec5SDimitry Andric static const unsigned ScaleThree = 5;
389*0b57cec5SDimitry Andric static const unsigned FactorOne = 2;
390*0b57cec5SDimitry Andric
391*0b57cec5SDimitry Andric /// Returns single number reflecting benefit of scheduling SU
392*0b57cec5SDimitry Andric /// in the current cycle.
SUSchedulingCost(SUnit * SU)393*0b57cec5SDimitry Andric int ResourcePriorityQueue::SUSchedulingCost(SUnit *SU) {
394*0b57cec5SDimitry Andric // Initial trivial priority.
395*0b57cec5SDimitry Andric int ResCount = 1;
396*0b57cec5SDimitry Andric
397*0b57cec5SDimitry Andric // Do not waste time on a node that is already scheduled.
398*0b57cec5SDimitry Andric if (SU->isScheduled)
399*0b57cec5SDimitry Andric return ResCount;
400*0b57cec5SDimitry Andric
401*0b57cec5SDimitry Andric // Forced priority is high.
402*0b57cec5SDimitry Andric if (SU->isScheduleHigh)
403*0b57cec5SDimitry Andric ResCount += PriorityOne;
404*0b57cec5SDimitry Andric
405*0b57cec5SDimitry Andric // Adaptable scheduling
406*0b57cec5SDimitry Andric // A small, but very parallel
407*0b57cec5SDimitry Andric // region, where reg pressure is an issue.
408*0b57cec5SDimitry Andric if (HorizontalVerticalBalance > RegPressureThreshold) {
409*0b57cec5SDimitry Andric // Critical path first
410*0b57cec5SDimitry Andric ResCount += (SU->getHeight() * ScaleTwo);
411*0b57cec5SDimitry Andric // If resources are available for it, multiply the
412*0b57cec5SDimitry Andric // chance of scheduling.
413*0b57cec5SDimitry Andric if (isResourceAvailable(SU))
414*0b57cec5SDimitry Andric ResCount <<= FactorOne;
415*0b57cec5SDimitry Andric
416*0b57cec5SDimitry Andric // Consider change to reg pressure from scheduling
417*0b57cec5SDimitry Andric // this SU.
418*0b57cec5SDimitry Andric ResCount -= (regPressureDelta(SU,true) * ScaleOne);
419*0b57cec5SDimitry Andric }
420*0b57cec5SDimitry Andric // Default heuristic, greeady and
421*0b57cec5SDimitry Andric // critical path driven.
422*0b57cec5SDimitry Andric else {
423*0b57cec5SDimitry Andric // Critical path first.
424*0b57cec5SDimitry Andric ResCount += (SU->getHeight() * ScaleTwo);
425*0b57cec5SDimitry Andric // Now see how many instructions is blocked by this SU.
426*0b57cec5SDimitry Andric ResCount += (NumNodesSolelyBlocking[SU->NodeNum] * ScaleTwo);
427*0b57cec5SDimitry Andric // If resources are available for it, multiply the
428*0b57cec5SDimitry Andric // chance of scheduling.
429*0b57cec5SDimitry Andric if (isResourceAvailable(SU))
430*0b57cec5SDimitry Andric ResCount <<= FactorOne;
431*0b57cec5SDimitry Andric
432*0b57cec5SDimitry Andric ResCount -= (regPressureDelta(SU) * ScaleTwo);
433*0b57cec5SDimitry Andric }
434*0b57cec5SDimitry Andric
435*0b57cec5SDimitry Andric // These are platform-specific things.
436*0b57cec5SDimitry Andric // Will need to go into the back end
437*0b57cec5SDimitry Andric // and accessed from here via a hook.
438*0b57cec5SDimitry Andric for (SDNode *N = SU->getNode(); N; N = N->getGluedNode()) {
439*0b57cec5SDimitry Andric if (N->isMachineOpcode()) {
440*0b57cec5SDimitry Andric const MCInstrDesc &TID = TII->get(N->getMachineOpcode());
441*0b57cec5SDimitry Andric if (TID.isCall())
442*0b57cec5SDimitry Andric ResCount += (PriorityTwo + (ScaleThree*N->getNumValues()));
443*0b57cec5SDimitry Andric }
444*0b57cec5SDimitry Andric else
445*0b57cec5SDimitry Andric switch (N->getOpcode()) {
446*0b57cec5SDimitry Andric default: break;
447*0b57cec5SDimitry Andric case ISD::TokenFactor:
448*0b57cec5SDimitry Andric case ISD::CopyFromReg:
449*0b57cec5SDimitry Andric case ISD::CopyToReg:
450*0b57cec5SDimitry Andric ResCount += PriorityFour;
451*0b57cec5SDimitry Andric break;
452*0b57cec5SDimitry Andric
453*0b57cec5SDimitry Andric case ISD::INLINEASM:
454*0b57cec5SDimitry Andric case ISD::INLINEASM_BR:
455*0b57cec5SDimitry Andric ResCount += PriorityThree;
456*0b57cec5SDimitry Andric break;
457*0b57cec5SDimitry Andric }
458*0b57cec5SDimitry Andric }
459*0b57cec5SDimitry Andric return ResCount;
460*0b57cec5SDimitry Andric }
461*0b57cec5SDimitry Andric
462*0b57cec5SDimitry Andric
463*0b57cec5SDimitry Andric /// Main resource tracking point.
scheduledNode(SUnit * SU)464*0b57cec5SDimitry Andric void ResourcePriorityQueue::scheduledNode(SUnit *SU) {
465*0b57cec5SDimitry Andric // Use NULL entry as an event marker to reset
466*0b57cec5SDimitry Andric // the DFA state.
467*0b57cec5SDimitry Andric if (!SU) {
468*0b57cec5SDimitry Andric ResourcesModel->clearResources();
469*0b57cec5SDimitry Andric Packet.clear();
470*0b57cec5SDimitry Andric return;
471*0b57cec5SDimitry Andric }
472*0b57cec5SDimitry Andric
473*0b57cec5SDimitry Andric const SDNode *ScegN = SU->getNode();
474*0b57cec5SDimitry Andric // Update reg pressure tracking.
475*0b57cec5SDimitry Andric // First update current node.
476*0b57cec5SDimitry Andric if (ScegN->isMachineOpcode()) {
477*0b57cec5SDimitry Andric // Estimate generated regs.
478*0b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumValues(); i != e; ++i) {
479*0b57cec5SDimitry Andric MVT VT = ScegN->getSimpleValueType(i);
480*0b57cec5SDimitry Andric
481*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)) {
482*0b57cec5SDimitry Andric const TargetRegisterClass *RC = TLI->getRegClassFor(VT);
483*0b57cec5SDimitry Andric if (RC)
484*0b57cec5SDimitry Andric RegPressure[RC->getID()] += numberRCValSuccInSU(SU, RC->getID());
485*0b57cec5SDimitry Andric }
486*0b57cec5SDimitry Andric }
487*0b57cec5SDimitry Andric // Estimate killed regs.
488*0b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumOperands(); i != e; ++i) {
489*0b57cec5SDimitry Andric const SDValue &Op = ScegN->getOperand(i);
490*0b57cec5SDimitry Andric MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
491*0b57cec5SDimitry Andric
492*0b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)) {
493*0b57cec5SDimitry Andric const TargetRegisterClass *RC = TLI->getRegClassFor(VT);
494*0b57cec5SDimitry Andric if (RC) {
495*0b57cec5SDimitry Andric if (RegPressure[RC->getID()] >
496*0b57cec5SDimitry Andric (numberRCValPredInSU(SU, RC->getID())))
497*0b57cec5SDimitry Andric RegPressure[RC->getID()] -= numberRCValPredInSU(SU, RC->getID());
498*0b57cec5SDimitry Andric else RegPressure[RC->getID()] = 0;
499*0b57cec5SDimitry Andric }
500*0b57cec5SDimitry Andric }
501*0b57cec5SDimitry Andric }
502*0b57cec5SDimitry Andric for (SDep &Pred : SU->Preds) {
503*0b57cec5SDimitry Andric if (Pred.isCtrl() || (Pred.getSUnit()->NumRegDefsLeft == 0))
504*0b57cec5SDimitry Andric continue;
505*0b57cec5SDimitry Andric --Pred.getSUnit()->NumRegDefsLeft;
506*0b57cec5SDimitry Andric }
507*0b57cec5SDimitry Andric }
508*0b57cec5SDimitry Andric
509*0b57cec5SDimitry Andric // Reserve resources for this SU.
510*0b57cec5SDimitry Andric reserveResources(SU);
511*0b57cec5SDimitry Andric
512*0b57cec5SDimitry Andric // Adjust number of parallel live ranges.
513*0b57cec5SDimitry Andric // Heuristic is simple - node with no data successors reduces
514*0b57cec5SDimitry Andric // number of live ranges. All others, increase it.
515*0b57cec5SDimitry Andric unsigned NumberNonControlDeps = 0;
516*0b57cec5SDimitry Andric
517*0b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs) {
518*0b57cec5SDimitry Andric adjustPriorityOfUnscheduledPreds(Succ.getSUnit());
519*0b57cec5SDimitry Andric if (!Succ.isCtrl())
520*0b57cec5SDimitry Andric NumberNonControlDeps++;
521*0b57cec5SDimitry Andric }
522*0b57cec5SDimitry Andric
523*0b57cec5SDimitry Andric if (!NumberNonControlDeps) {
524*0b57cec5SDimitry Andric if (ParallelLiveRanges >= SU->NumPreds)
525*0b57cec5SDimitry Andric ParallelLiveRanges -= SU->NumPreds;
526*0b57cec5SDimitry Andric else
527*0b57cec5SDimitry Andric ParallelLiveRanges = 0;
528*0b57cec5SDimitry Andric
529*0b57cec5SDimitry Andric }
530*0b57cec5SDimitry Andric else
531*0b57cec5SDimitry Andric ParallelLiveRanges += SU->NumRegDefsLeft;
532*0b57cec5SDimitry Andric
533*0b57cec5SDimitry Andric // Track parallel live chains.
534*0b57cec5SDimitry Andric HorizontalVerticalBalance += (SU->Succs.size() - numberCtrlDepsInSU(SU));
535*0b57cec5SDimitry Andric HorizontalVerticalBalance -= (SU->Preds.size() - numberCtrlPredInSU(SU));
536*0b57cec5SDimitry Andric }
537*0b57cec5SDimitry Andric
initNumRegDefsLeft(SUnit * SU)538*0b57cec5SDimitry Andric void ResourcePriorityQueue::initNumRegDefsLeft(SUnit *SU) {
539*0b57cec5SDimitry Andric unsigned NodeNumDefs = 0;
540*0b57cec5SDimitry Andric for (SDNode *N = SU->getNode(); N; N = N->getGluedNode())
541*0b57cec5SDimitry Andric if (N->isMachineOpcode()) {
542*0b57cec5SDimitry Andric const MCInstrDesc &TID = TII->get(N->getMachineOpcode());
543*0b57cec5SDimitry Andric // No register need be allocated for this.
544*0b57cec5SDimitry Andric if (N->getMachineOpcode() == TargetOpcode::IMPLICIT_DEF) {
545*0b57cec5SDimitry Andric NodeNumDefs = 0;
546*0b57cec5SDimitry Andric break;
547*0b57cec5SDimitry Andric }
548*0b57cec5SDimitry Andric NodeNumDefs = std::min(N->getNumValues(), TID.getNumDefs());
549*0b57cec5SDimitry Andric }
550*0b57cec5SDimitry Andric else
551*0b57cec5SDimitry Andric switch(N->getOpcode()) {
552*0b57cec5SDimitry Andric default: break;
553*0b57cec5SDimitry Andric case ISD::CopyFromReg:
554*0b57cec5SDimitry Andric NodeNumDefs++;
555*0b57cec5SDimitry Andric break;
556*0b57cec5SDimitry Andric case ISD::INLINEASM:
557*0b57cec5SDimitry Andric case ISD::INLINEASM_BR:
558*0b57cec5SDimitry Andric NodeNumDefs++;
559*0b57cec5SDimitry Andric break;
560*0b57cec5SDimitry Andric }
561*0b57cec5SDimitry Andric
562*0b57cec5SDimitry Andric SU->NumRegDefsLeft = NodeNumDefs;
563*0b57cec5SDimitry Andric }
564*0b57cec5SDimitry Andric
565*0b57cec5SDimitry Andric /// adjustPriorityOfUnscheduledPreds - One of the predecessors of SU was just
566*0b57cec5SDimitry Andric /// scheduled. If SU is not itself available, then there is at least one
567*0b57cec5SDimitry Andric /// predecessor node that has not been scheduled yet. If SU has exactly ONE
568*0b57cec5SDimitry Andric /// unscheduled predecessor, we want to increase its priority: it getting
569*0b57cec5SDimitry Andric /// scheduled will make this node available, so it is better than some other
570*0b57cec5SDimitry Andric /// node of the same priority that will not make a node available.
adjustPriorityOfUnscheduledPreds(SUnit * SU)571*0b57cec5SDimitry Andric void ResourcePriorityQueue::adjustPriorityOfUnscheduledPreds(SUnit *SU) {
572*0b57cec5SDimitry Andric if (SU->isAvailable) return; // All preds scheduled.
573*0b57cec5SDimitry Andric
574*0b57cec5SDimitry Andric SUnit *OnlyAvailablePred = getSingleUnscheduledPred(SU);
575*0b57cec5SDimitry Andric if (!OnlyAvailablePred || !OnlyAvailablePred->isAvailable)
576*0b57cec5SDimitry Andric return;
577*0b57cec5SDimitry Andric
578*0b57cec5SDimitry Andric // Okay, we found a single predecessor that is available, but not scheduled.
579*0b57cec5SDimitry Andric // Since it is available, it must be in the priority queue. First remove it.
580*0b57cec5SDimitry Andric remove(OnlyAvailablePred);
581*0b57cec5SDimitry Andric
582*0b57cec5SDimitry Andric // Reinsert the node into the priority queue, which recomputes its
583*0b57cec5SDimitry Andric // NumNodesSolelyBlocking value.
584*0b57cec5SDimitry Andric push(OnlyAvailablePred);
585*0b57cec5SDimitry Andric }
586*0b57cec5SDimitry Andric
587*0b57cec5SDimitry Andric
588*0b57cec5SDimitry Andric /// Main access point - returns next instructions
589*0b57cec5SDimitry Andric /// to be placed in scheduling sequence.
pop()590*0b57cec5SDimitry Andric SUnit *ResourcePriorityQueue::pop() {
591*0b57cec5SDimitry Andric if (empty())
592*0b57cec5SDimitry Andric return nullptr;
593*0b57cec5SDimitry Andric
594*0b57cec5SDimitry Andric std::vector<SUnit *>::iterator Best = Queue.begin();
595*0b57cec5SDimitry Andric if (!DisableDFASched) {
596*0b57cec5SDimitry Andric int BestCost = SUSchedulingCost(*Best);
597*0b57cec5SDimitry Andric for (auto I = std::next(Queue.begin()), E = Queue.end(); I != E; ++I) {
598*0b57cec5SDimitry Andric
599*0b57cec5SDimitry Andric if (SUSchedulingCost(*I) > BestCost) {
600*0b57cec5SDimitry Andric BestCost = SUSchedulingCost(*I);
601*0b57cec5SDimitry Andric Best = I;
602*0b57cec5SDimitry Andric }
603*0b57cec5SDimitry Andric }
604*0b57cec5SDimitry Andric }
605*0b57cec5SDimitry Andric // Use default TD scheduling mechanism.
606*0b57cec5SDimitry Andric else {
607*0b57cec5SDimitry Andric for (auto I = std::next(Queue.begin()), E = Queue.end(); I != E; ++I)
608*0b57cec5SDimitry Andric if (Picker(*Best, *I))
609*0b57cec5SDimitry Andric Best = I;
610*0b57cec5SDimitry Andric }
611*0b57cec5SDimitry Andric
612*0b57cec5SDimitry Andric SUnit *V = *Best;
613*0b57cec5SDimitry Andric if (Best != std::prev(Queue.end()))
614*0b57cec5SDimitry Andric std::swap(*Best, Queue.back());
615*0b57cec5SDimitry Andric
616*0b57cec5SDimitry Andric Queue.pop_back();
617*0b57cec5SDimitry Andric
618*0b57cec5SDimitry Andric return V;
619*0b57cec5SDimitry Andric }
620*0b57cec5SDimitry Andric
621*0b57cec5SDimitry Andric
remove(SUnit * SU)622*0b57cec5SDimitry Andric void ResourcePriorityQueue::remove(SUnit *SU) {
623*0b57cec5SDimitry Andric assert(!Queue.empty() && "Queue is empty!");
624*0b57cec5SDimitry Andric std::vector<SUnit *>::iterator I = find(Queue, SU);
625*0b57cec5SDimitry Andric if (I != std::prev(Queue.end()))
626 std::swap(*I, Queue.back());
627
628 Queue.pop_back();
629 }
630