10b57cec5SDimitry Andric //=- llvm/CodeGen/DFAPacketizer.cpp - DFA Packetizer for VLIW -*- C++ -*-=====//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric // This class implements a deterministic finite automaton (DFA) based
90b57cec5SDimitry Andric // packetizing mechanism for VLIW architectures. It provides APIs to
100b57cec5SDimitry Andric // determine whether there exists a legal mapping of instructions to
110b57cec5SDimitry Andric // functional unit assignments in a packet. The DFA is auto-generated from
120b57cec5SDimitry Andric // the target's Schedule.td file.
130b57cec5SDimitry Andric //
140b57cec5SDimitry Andric // A DFA consists of 3 major elements: states, inputs, and transitions. For
150b57cec5SDimitry Andric // the packetizing mechanism, the input is the set of instruction classes for
160b57cec5SDimitry Andric // a target. The state models all possible combinations of functional unit
170b57cec5SDimitry Andric // consumption for a given set of instructions in a packet. A transition
180b57cec5SDimitry Andric // models the addition of an instruction to a packet. In the DFA constructed
190b57cec5SDimitry Andric // by this class, if an instruction can be added to a packet, then a valid
200b57cec5SDimitry Andric // transition exists from the corresponding state. Invalid transitions
210b57cec5SDimitry Andric // indicate that the instruction cannot be added to the current packet.
220b57cec5SDimitry Andric //
230b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
240b57cec5SDimitry Andric 
250b57cec5SDimitry Andric #include "llvm/CodeGen/DFAPacketizer.h"
268bcb0991SDimitry Andric #include "llvm/ADT/StringExtras.h"
278bcb0991SDimitry Andric #include "llvm/Analysis/AliasAnalysis.h"
280b57cec5SDimitry Andric #include "llvm/CodeGen/MachineFunction.h"
290b57cec5SDimitry Andric #include "llvm/CodeGen/MachineInstr.h"
300b57cec5SDimitry Andric #include "llvm/CodeGen/MachineInstrBundle.h"
310b57cec5SDimitry Andric #include "llvm/CodeGen/ScheduleDAG.h"
320b57cec5SDimitry Andric #include "llvm/CodeGen/ScheduleDAGInstrs.h"
330b57cec5SDimitry Andric #include "llvm/CodeGen/TargetInstrInfo.h"
340b57cec5SDimitry Andric #include "llvm/CodeGen/TargetSubtargetInfo.h"
350b57cec5SDimitry Andric #include "llvm/MC/MCInstrDesc.h"
360b57cec5SDimitry Andric #include "llvm/MC/MCInstrItineraries.h"
370b57cec5SDimitry Andric #include "llvm/Support/CommandLine.h"
380b57cec5SDimitry Andric #include "llvm/Support/Debug.h"
390b57cec5SDimitry Andric #include "llvm/Support/raw_ostream.h"
400b57cec5SDimitry Andric #include <algorithm>
410b57cec5SDimitry Andric #include <cassert>
420b57cec5SDimitry Andric #include <iterator>
430b57cec5SDimitry Andric #include <memory>
440b57cec5SDimitry Andric #include <vector>
450b57cec5SDimitry Andric 
460b57cec5SDimitry Andric using namespace llvm;
470b57cec5SDimitry Andric 
480b57cec5SDimitry Andric #define DEBUG_TYPE "packets"
490b57cec5SDimitry Andric 
500b57cec5SDimitry Andric static cl::opt<unsigned> InstrLimit("dfa-instr-limit", cl::Hidden,
510b57cec5SDimitry Andric   cl::init(0), cl::desc("If present, stops packetizing after N instructions"));
520b57cec5SDimitry Andric 
530b57cec5SDimitry Andric static unsigned InstrCount = 0;
540b57cec5SDimitry Andric 
550b57cec5SDimitry Andric // Check if the resources occupied by a MCInstrDesc are available in the
560b57cec5SDimitry Andric // current state.
canReserveResources(const MCInstrDesc * MID)570b57cec5SDimitry Andric bool DFAPacketizer::canReserveResources(const MCInstrDesc *MID) {
58480093f4SDimitry Andric   unsigned Action = ItinActions[MID->getSchedClass()];
59480093f4SDimitry Andric   if (MID->getSchedClass() == 0 || Action == 0)
60480093f4SDimitry Andric     return false;
61480093f4SDimitry Andric   return A.canAdd(Action);
620b57cec5SDimitry Andric }
630b57cec5SDimitry Andric 
640b57cec5SDimitry Andric // Reserve the resources occupied by a MCInstrDesc and change the current
650b57cec5SDimitry Andric // state to reflect that change.
reserveResources(const MCInstrDesc * MID)660b57cec5SDimitry Andric void DFAPacketizer::reserveResources(const MCInstrDesc *MID) {
67480093f4SDimitry Andric   unsigned Action = ItinActions[MID->getSchedClass()];
68480093f4SDimitry Andric   if (MID->getSchedClass() == 0 || Action == 0)
69480093f4SDimitry Andric     return;
70480093f4SDimitry Andric   A.add(Action);
710b57cec5SDimitry Andric }
720b57cec5SDimitry Andric 
730b57cec5SDimitry Andric // Check if the resources occupied by a machine instruction are available
740b57cec5SDimitry Andric // in the current state.
canReserveResources(MachineInstr & MI)750b57cec5SDimitry Andric bool DFAPacketizer::canReserveResources(MachineInstr &MI) {
760b57cec5SDimitry Andric   const MCInstrDesc &MID = MI.getDesc();
770b57cec5SDimitry Andric   return canReserveResources(&MID);
780b57cec5SDimitry Andric }
790b57cec5SDimitry Andric 
800b57cec5SDimitry Andric // Reserve the resources occupied by a machine instruction and change the
810b57cec5SDimitry Andric // current state to reflect that change.
reserveResources(MachineInstr & MI)820b57cec5SDimitry Andric void DFAPacketizer::reserveResources(MachineInstr &MI) {
830b57cec5SDimitry Andric   const MCInstrDesc &MID = MI.getDesc();
840b57cec5SDimitry Andric   reserveResources(&MID);
850b57cec5SDimitry Andric }
860b57cec5SDimitry Andric 
getUsedResources(unsigned InstIdx)878bcb0991SDimitry Andric unsigned DFAPacketizer::getUsedResources(unsigned InstIdx) {
888bcb0991SDimitry Andric   ArrayRef<NfaPath> NfaPaths = A.getNfaPaths();
898bcb0991SDimitry Andric   assert(!NfaPaths.empty() && "Invalid bundle!");
908bcb0991SDimitry Andric   const NfaPath &RS = NfaPaths.front();
918bcb0991SDimitry Andric 
928bcb0991SDimitry Andric   // RS stores the cumulative resources used up to and including the I'th
938bcb0991SDimitry Andric   // instruction. The 0th instruction is the base case.
948bcb0991SDimitry Andric   if (InstIdx == 0)
958bcb0991SDimitry Andric     return RS[0];
968bcb0991SDimitry Andric   // Return the difference between the cumulative resources used by InstIdx and
978bcb0991SDimitry Andric   // its predecessor.
988bcb0991SDimitry Andric   return RS[InstIdx] ^ RS[InstIdx - 1];
998bcb0991SDimitry Andric }
1008bcb0991SDimitry Andric 
1010b57cec5SDimitry Andric namespace llvm {
1020b57cec5SDimitry Andric 
1030b57cec5SDimitry Andric // This class extends ScheduleDAGInstrs and overrides the schedule method
1040b57cec5SDimitry Andric // to build the dependence graph.
1050b57cec5SDimitry Andric class DefaultVLIWScheduler : public ScheduleDAGInstrs {
1060b57cec5SDimitry Andric private:
1078bcb0991SDimitry Andric   AAResults *AA;
1080b57cec5SDimitry Andric   /// Ordered list of DAG postprocessing steps.
1090b57cec5SDimitry Andric   std::vector<std::unique_ptr<ScheduleDAGMutation>> Mutations;
1100b57cec5SDimitry Andric 
1110b57cec5SDimitry Andric public:
1120b57cec5SDimitry Andric   DefaultVLIWScheduler(MachineFunction &MF, MachineLoopInfo &MLI,
1138bcb0991SDimitry Andric                        AAResults *AA);
1140b57cec5SDimitry Andric 
1150b57cec5SDimitry Andric   // Actual scheduling work.
1160b57cec5SDimitry Andric   void schedule() override;
1170b57cec5SDimitry Andric 
1180b57cec5SDimitry Andric   /// DefaultVLIWScheduler takes ownership of the Mutation object.
addMutation(std::unique_ptr<ScheduleDAGMutation> Mutation)1190b57cec5SDimitry Andric   void addMutation(std::unique_ptr<ScheduleDAGMutation> Mutation) {
1200b57cec5SDimitry Andric     Mutations.push_back(std::move(Mutation));
1210b57cec5SDimitry Andric   }
1220b57cec5SDimitry Andric 
1230b57cec5SDimitry Andric protected:
1240b57cec5SDimitry Andric   void postprocessDAG();
1250b57cec5SDimitry Andric };
1260b57cec5SDimitry Andric 
1270b57cec5SDimitry Andric } // end namespace llvm
1280b57cec5SDimitry Andric 
DefaultVLIWScheduler(MachineFunction & MF,MachineLoopInfo & MLI,AAResults * AA)1290b57cec5SDimitry Andric DefaultVLIWScheduler::DefaultVLIWScheduler(MachineFunction &MF,
1300b57cec5SDimitry Andric                                            MachineLoopInfo &MLI,
1318bcb0991SDimitry Andric                                            AAResults *AA)
1320b57cec5SDimitry Andric     : ScheduleDAGInstrs(MF, &MLI), AA(AA) {
1330b57cec5SDimitry Andric   CanHandleTerminators = true;
1340b57cec5SDimitry Andric }
1350b57cec5SDimitry Andric 
1360b57cec5SDimitry Andric /// Apply each ScheduleDAGMutation step in order.
postprocessDAG()1370b57cec5SDimitry Andric void DefaultVLIWScheduler::postprocessDAG() {
1380b57cec5SDimitry Andric   for (auto &M : Mutations)
1390b57cec5SDimitry Andric     M->apply(this);
1400b57cec5SDimitry Andric }
1410b57cec5SDimitry Andric 
schedule()1420b57cec5SDimitry Andric void DefaultVLIWScheduler::schedule() {
1430b57cec5SDimitry Andric   // Build the scheduling graph.
1440b57cec5SDimitry Andric   buildSchedGraph(AA);
1450b57cec5SDimitry Andric   postprocessDAG();
1460b57cec5SDimitry Andric }
1470b57cec5SDimitry Andric 
VLIWPacketizerList(MachineFunction & mf,MachineLoopInfo & mli,AAResults * aa)1480b57cec5SDimitry Andric VLIWPacketizerList::VLIWPacketizerList(MachineFunction &mf,
1498bcb0991SDimitry Andric                                        MachineLoopInfo &mli, AAResults *aa)
1500b57cec5SDimitry Andric     : MF(mf), TII(mf.getSubtarget().getInstrInfo()), AA(aa) {
1510b57cec5SDimitry Andric   ResourceTracker = TII->CreateTargetScheduleState(MF.getSubtarget());
1528bcb0991SDimitry Andric   ResourceTracker->setTrackResources(true);
1530b57cec5SDimitry Andric   VLIWScheduler = new DefaultVLIWScheduler(MF, mli, AA);
1540b57cec5SDimitry Andric }
1550b57cec5SDimitry Andric 
~VLIWPacketizerList()1560b57cec5SDimitry Andric VLIWPacketizerList::~VLIWPacketizerList() {
1570b57cec5SDimitry Andric   delete VLIWScheduler;
1580b57cec5SDimitry Andric   delete ResourceTracker;
1590b57cec5SDimitry Andric }
1600b57cec5SDimitry Andric 
1610b57cec5SDimitry Andric // End the current packet, bundle packet instructions and reset DFA state.
endPacket(MachineBasicBlock * MBB,MachineBasicBlock::iterator MI)1620b57cec5SDimitry Andric void VLIWPacketizerList::endPacket(MachineBasicBlock *MBB,
1630b57cec5SDimitry Andric                                    MachineBasicBlock::iterator MI) {
1640b57cec5SDimitry Andric   LLVM_DEBUG({
1650b57cec5SDimitry Andric     if (!CurrentPacketMIs.empty()) {
1660b57cec5SDimitry Andric       dbgs() << "Finalizing packet:\n";
1678bcb0991SDimitry Andric       unsigned Idx = 0;
1688bcb0991SDimitry Andric       for (MachineInstr *MI : CurrentPacketMIs) {
1698bcb0991SDimitry Andric         unsigned R = ResourceTracker->getUsedResources(Idx++);
1708bcb0991SDimitry Andric         dbgs() << " * [res:0x" << utohexstr(R) << "] " << *MI;
1718bcb0991SDimitry Andric       }
1720b57cec5SDimitry Andric     }
1730b57cec5SDimitry Andric   });
1740b57cec5SDimitry Andric   if (CurrentPacketMIs.size() > 1) {
1750b57cec5SDimitry Andric     MachineInstr &MIFirst = *CurrentPacketMIs.front();
1760b57cec5SDimitry Andric     finalizeBundle(*MBB, MIFirst.getIterator(), MI.getInstrIterator());
1770b57cec5SDimitry Andric   }
1780b57cec5SDimitry Andric   CurrentPacketMIs.clear();
1790b57cec5SDimitry Andric   ResourceTracker->clearResources();
1800b57cec5SDimitry Andric   LLVM_DEBUG(dbgs() << "End packet\n");
1810b57cec5SDimitry Andric }
1820b57cec5SDimitry Andric 
1830b57cec5SDimitry Andric // Bundle machine instructions into packets.
PacketizeMIs(MachineBasicBlock * MBB,MachineBasicBlock::iterator BeginItr,MachineBasicBlock::iterator EndItr)1840b57cec5SDimitry Andric void VLIWPacketizerList::PacketizeMIs(MachineBasicBlock *MBB,
1850b57cec5SDimitry Andric                                       MachineBasicBlock::iterator BeginItr,
1860b57cec5SDimitry Andric                                       MachineBasicBlock::iterator EndItr) {
1870b57cec5SDimitry Andric   assert(VLIWScheduler && "VLIW Scheduler is not initialized!");
1880b57cec5SDimitry Andric   VLIWScheduler->startBlock(MBB);
1890b57cec5SDimitry Andric   VLIWScheduler->enterRegion(MBB, BeginItr, EndItr,
1900b57cec5SDimitry Andric                              std::distance(BeginItr, EndItr));
1910b57cec5SDimitry Andric   VLIWScheduler->schedule();
1920b57cec5SDimitry Andric 
1930b57cec5SDimitry Andric   LLVM_DEBUG({
1940b57cec5SDimitry Andric     dbgs() << "Scheduling DAG of the packetize region\n";
1950b57cec5SDimitry Andric     VLIWScheduler->dump();
1960b57cec5SDimitry Andric   });
1970b57cec5SDimitry Andric 
1980b57cec5SDimitry Andric   // Generate MI -> SU map.
1990b57cec5SDimitry Andric   MIToSUnit.clear();
2000b57cec5SDimitry Andric   for (SUnit &SU : VLIWScheduler->SUnits)
2010b57cec5SDimitry Andric     MIToSUnit[SU.getInstr()] = &SU;
2020b57cec5SDimitry Andric 
2030b57cec5SDimitry Andric   bool LimitPresent = InstrLimit.getPosition();
2040b57cec5SDimitry Andric 
2050b57cec5SDimitry Andric   // The main packetizer loop.
2060b57cec5SDimitry Andric   for (; BeginItr != EndItr; ++BeginItr) {
2070b57cec5SDimitry Andric     if (LimitPresent) {
2080b57cec5SDimitry Andric       if (InstrCount >= InstrLimit) {
2090b57cec5SDimitry Andric         EndItr = BeginItr;
2100b57cec5SDimitry Andric         break;
2110b57cec5SDimitry Andric       }
2120b57cec5SDimitry Andric       InstrCount++;
2130b57cec5SDimitry Andric     }
2140b57cec5SDimitry Andric     MachineInstr &MI = *BeginItr;
2150b57cec5SDimitry Andric     initPacketizerState();
2160b57cec5SDimitry Andric 
2170b57cec5SDimitry Andric     // End the current packet if needed.
2180b57cec5SDimitry Andric     if (isSoloInstruction(MI)) {
2190b57cec5SDimitry Andric       endPacket(MBB, MI);
2200b57cec5SDimitry Andric       continue;
2210b57cec5SDimitry Andric     }
2220b57cec5SDimitry Andric 
2230b57cec5SDimitry Andric     // Ignore pseudo instructions.
2240b57cec5SDimitry Andric     if (ignorePseudoInstruction(MI, MBB))
2250b57cec5SDimitry Andric       continue;
2260b57cec5SDimitry Andric 
2270b57cec5SDimitry Andric     SUnit *SUI = MIToSUnit[&MI];
2280b57cec5SDimitry Andric     assert(SUI && "Missing SUnit Info!");
2290b57cec5SDimitry Andric 
2300b57cec5SDimitry Andric     // Ask DFA if machine resource is available for MI.
2310b57cec5SDimitry Andric     LLVM_DEBUG(dbgs() << "Checking resources for adding MI to packet " << MI);
2320b57cec5SDimitry Andric 
2330b57cec5SDimitry Andric     bool ResourceAvail = ResourceTracker->canReserveResources(MI);
2340b57cec5SDimitry Andric     LLVM_DEBUG({
2350b57cec5SDimitry Andric       if (ResourceAvail)
2360b57cec5SDimitry Andric         dbgs() << "  Resources are available for adding MI to packet\n";
2370b57cec5SDimitry Andric       else
2380b57cec5SDimitry Andric         dbgs() << "  Resources NOT available\n";
2390b57cec5SDimitry Andric     });
2400b57cec5SDimitry Andric     if (ResourceAvail && shouldAddToPacket(MI)) {
2410b57cec5SDimitry Andric       // Dependency check for MI with instructions in CurrentPacketMIs.
2420b57cec5SDimitry Andric       for (auto MJ : CurrentPacketMIs) {
2430b57cec5SDimitry Andric         SUnit *SUJ = MIToSUnit[MJ];
2440b57cec5SDimitry Andric         assert(SUJ && "Missing SUnit Info!");
2450b57cec5SDimitry Andric 
2460b57cec5SDimitry Andric         LLVM_DEBUG(dbgs() << "  Checking against MJ " << *MJ);
2470b57cec5SDimitry Andric         // Is it legal to packetize SUI and SUJ together.
2480b57cec5SDimitry Andric         if (!isLegalToPacketizeTogether(SUI, SUJ)) {
2490b57cec5SDimitry Andric           LLVM_DEBUG(dbgs() << "  Not legal to add MI, try to prune\n");
2500b57cec5SDimitry Andric           // Allow packetization if dependency can be pruned.
2510b57cec5SDimitry Andric           if (!isLegalToPruneDependencies(SUI, SUJ)) {
2520b57cec5SDimitry Andric             // End the packet if dependency cannot be pruned.
2530b57cec5SDimitry Andric             LLVM_DEBUG(dbgs()
2540b57cec5SDimitry Andric                        << "  Could not prune dependencies for adding MI\n");
2550b57cec5SDimitry Andric             endPacket(MBB, MI);
2560b57cec5SDimitry Andric             break;
2570b57cec5SDimitry Andric           }
2580b57cec5SDimitry Andric           LLVM_DEBUG(dbgs() << "  Pruned dependence for adding MI\n");
2590b57cec5SDimitry Andric         }
2600b57cec5SDimitry Andric       }
2610b57cec5SDimitry Andric     } else {
2620b57cec5SDimitry Andric       LLVM_DEBUG(if (ResourceAvail) dbgs()
2630b57cec5SDimitry Andric                  << "Resources are available, but instruction should not be "
2640b57cec5SDimitry Andric                     "added to packet\n  "
2650b57cec5SDimitry Andric                  << MI);
2660b57cec5SDimitry Andric       // End the packet if resource is not available, or if the instruction
2670b57cec5SDimitry Andric       // shoud not be added to the current packet.
2680b57cec5SDimitry Andric       endPacket(MBB, MI);
2690b57cec5SDimitry Andric     }
2700b57cec5SDimitry Andric 
2710b57cec5SDimitry Andric     // Add MI to the current packet.
2720b57cec5SDimitry Andric     LLVM_DEBUG(dbgs() << "* Adding MI to packet " << MI << '\n');
2730b57cec5SDimitry Andric     BeginItr = addToPacket(MI);
2740b57cec5SDimitry Andric   } // For all instructions in the packetization range.
2750b57cec5SDimitry Andric 
2760b57cec5SDimitry Andric   // End any packet left behind.
2770b57cec5SDimitry Andric   endPacket(MBB, EndItr);
2780b57cec5SDimitry Andric   VLIWScheduler->exitRegion();
2790b57cec5SDimitry Andric   VLIWScheduler->finishBlock();
2800b57cec5SDimitry Andric }
2810b57cec5SDimitry Andric 
alias(const MachineMemOperand & Op1,const MachineMemOperand & Op2,bool UseTBAA) const2820b57cec5SDimitry Andric bool VLIWPacketizerList::alias(const MachineMemOperand &Op1,
2830b57cec5SDimitry Andric                                const MachineMemOperand &Op2,
2840b57cec5SDimitry Andric                                bool UseTBAA) const {
2850b57cec5SDimitry Andric   if (!Op1.getValue() || !Op2.getValue())
2860b57cec5SDimitry Andric     return true;
2870b57cec5SDimitry Andric 
2880b57cec5SDimitry Andric   int64_t MinOffset = std::min(Op1.getOffset(), Op2.getOffset());
2890b57cec5SDimitry Andric   int64_t Overlapa = Op1.getSize() + Op1.getOffset() - MinOffset;
2900b57cec5SDimitry Andric   int64_t Overlapb = Op2.getSize() + Op2.getOffset() - MinOffset;
2910b57cec5SDimitry Andric 
2920b57cec5SDimitry Andric   AliasResult AAResult =
2930b57cec5SDimitry Andric       AA->alias(MemoryLocation(Op1.getValue(), Overlapa,
2940b57cec5SDimitry Andric                                UseTBAA ? Op1.getAAInfo() : AAMDNodes()),
2950b57cec5SDimitry Andric                 MemoryLocation(Op2.getValue(), Overlapb,
2960b57cec5SDimitry Andric                                UseTBAA ? Op2.getAAInfo() : AAMDNodes()));
2970b57cec5SDimitry Andric 
298*5f7ddb14SDimitry Andric   return AAResult != AliasResult::NoAlias;
2990b57cec5SDimitry Andric }
3000b57cec5SDimitry Andric 
alias(const MachineInstr & MI1,const MachineInstr & MI2,bool UseTBAA) const3010b57cec5SDimitry Andric bool VLIWPacketizerList::alias(const MachineInstr &MI1,
3020b57cec5SDimitry Andric                                const MachineInstr &MI2,
3030b57cec5SDimitry Andric                                bool UseTBAA) const {
3040b57cec5SDimitry Andric   if (MI1.memoperands_empty() || MI2.memoperands_empty())
3050b57cec5SDimitry Andric     return true;
3060b57cec5SDimitry Andric 
3070b57cec5SDimitry Andric   for (const MachineMemOperand *Op1 : MI1.memoperands())
3080b57cec5SDimitry Andric     for (const MachineMemOperand *Op2 : MI2.memoperands())
3090b57cec5SDimitry Andric       if (alias(*Op1, *Op2, UseTBAA))
3100b57cec5SDimitry Andric         return true;
3110b57cec5SDimitry Andric   return false;
3120b57cec5SDimitry Andric }
3130b57cec5SDimitry Andric 
3140b57cec5SDimitry Andric // Add a DAG mutation object to the ordered list.
addMutation(std::unique_ptr<ScheduleDAGMutation> Mutation)3150b57cec5SDimitry Andric void VLIWPacketizerList::addMutation(
3160b57cec5SDimitry Andric       std::unique_ptr<ScheduleDAGMutation> Mutation) {
3170b57cec5SDimitry Andric   VLIWScheduler->addMutation(std::move(Mutation));
3180b57cec5SDimitry Andric }
319