1 //===- CodeGenSchedule.cpp - Scheduling MachineModels ---------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file defines structures to encapsulate the machine model as described in
10 // the target description.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "CodeGenSchedule.h"
15 #include "CodeGenInstruction.h"
16 #include "CodeGenTarget.h"
17 #include "llvm/ADT/MapVector.h"
18 #include "llvm/ADT/STLExtras.h"
19 #include "llvm/ADT/SmallPtrSet.h"
20 #include "llvm/ADT/SmallSet.h"
21 #include "llvm/ADT/SmallVector.h"
22 #include "llvm/Support/Casting.h"
23 #include "llvm/Support/Debug.h"
24 #include "llvm/Support/Regex.h"
25 #include "llvm/Support/raw_ostream.h"
26 #include "llvm/TableGen/Error.h"
27 #include <algorithm>
28 #include <iterator>
29 #include <utility>
30 
31 using namespace llvm;
32 
33 #define DEBUG_TYPE "subtarget-emitter"
34 
35 #ifndef NDEBUG
36 static void dumpIdxVec(ArrayRef<unsigned> V) {
37   for (unsigned Idx : V)
38     dbgs() << Idx << ", ";
39 }
40 #endif
41 
42 namespace {
43 
44 // (instrs a, b, ...) Evaluate and union all arguments. Identical to AddOp.
45 struct InstrsOp : public SetTheory::Operator {
46   void apply(SetTheory &ST, DagInit *Expr, SetTheory::RecSet &Elts,
47              ArrayRef<SMLoc> Loc) override {
48     ST.evaluate(Expr->arg_begin(), Expr->arg_end(), Elts, Loc);
49   }
50 };
51 
52 // (instregex "OpcPat",...) Find all instructions matching an opcode pattern.
53 struct InstRegexOp : public SetTheory::Operator {
54   const CodeGenTarget &Target;
55   InstRegexOp(const CodeGenTarget &t): Target(t) {}
56 
57   /// Remove any text inside of parentheses from S.
58   static std::string removeParens(llvm::StringRef S) {
59     std::string Result;
60     unsigned Paren = 0;
61     // NB: We don't care about escaped parens here.
62     for (char C : S) {
63       switch (C) {
64       case '(':
65         ++Paren;
66         break;
67       case ')':
68         --Paren;
69         break;
70       default:
71         if (Paren == 0)
72           Result += C;
73       }
74     }
75     return Result;
76   }
77 
78   void apply(SetTheory &ST, DagInit *Expr, SetTheory::RecSet &Elts,
79              ArrayRef<SMLoc> Loc) override {
80     ArrayRef<const CodeGenInstruction *> Instructions =
81         Target.getInstructionsByEnumValue();
82 
83     unsigned NumGeneric = Target.getNumFixedInstructions();
84     unsigned NumPseudos = Target.getNumPseudoInstructions();
85     auto Generics = Instructions.slice(0, NumGeneric);
86     auto Pseudos = Instructions.slice(NumGeneric, NumPseudos);
87     auto NonPseudos = Instructions.slice(NumGeneric + NumPseudos);
88 
89     for (Init *Arg : make_range(Expr->arg_begin(), Expr->arg_end())) {
90       StringInit *SI = dyn_cast<StringInit>(Arg);
91       if (!SI)
92         PrintFatalError(Loc, "instregex requires pattern string: " +
93                                  Expr->getAsString());
94       StringRef Original = SI->getValue();
95 
96       // Extract a prefix that we can binary search on.
97       static const char RegexMetachars[] = "()^$|*+?.[]\\{}";
98       auto FirstMeta = Original.find_first_of(RegexMetachars);
99 
100       // Look for top-level | or ?. We cannot optimize them to binary search.
101       if (removeParens(Original).find_first_of("|?") != std::string::npos)
102         FirstMeta = 0;
103 
104       Optional<Regex> Regexpr = None;
105       StringRef Prefix = Original.substr(0, FirstMeta);
106       StringRef PatStr = Original.substr(FirstMeta);
107       if (!PatStr.empty()) {
108         // For the rest use a python-style prefix match.
109         std::string pat = std::string(PatStr);
110         if (pat[0] != '^') {
111           pat.insert(0, "^(");
112           pat.insert(pat.end(), ')');
113         }
114         Regexpr = Regex(pat);
115       }
116 
117       int NumMatches = 0;
118 
119       // The generic opcodes are unsorted, handle them manually.
120       for (auto *Inst : Generics) {
121         StringRef InstName = Inst->TheDef->getName();
122         if (InstName.startswith(Prefix) &&
123             (!Regexpr || Regexpr->match(InstName.substr(Prefix.size())))) {
124           Elts.insert(Inst->TheDef);
125           NumMatches++;
126         }
127       }
128 
129       // Target instructions are split into two ranges: pseudo instructions
130       // first, than non-pseudos. Each range is in lexicographical order
131       // sorted by name. Find the sub-ranges that start with our prefix.
132       struct Comp {
133         bool operator()(const CodeGenInstruction *LHS, StringRef RHS) {
134           return LHS->TheDef->getName() < RHS;
135         }
136         bool operator()(StringRef LHS, const CodeGenInstruction *RHS) {
137           return LHS < RHS->TheDef->getName() &&
138                  !RHS->TheDef->getName().startswith(LHS);
139         }
140       };
141       auto Range1 =
142           std::equal_range(Pseudos.begin(), Pseudos.end(), Prefix, Comp());
143       auto Range2 = std::equal_range(NonPseudos.begin(), NonPseudos.end(),
144                                      Prefix, Comp());
145 
146       // For these ranges we know that instruction names start with the prefix.
147       // Check if there's a regex that needs to be checked.
148       const auto HandleNonGeneric = [&](const CodeGenInstruction *Inst) {
149         StringRef InstName = Inst->TheDef->getName();
150         if (!Regexpr || Regexpr->match(InstName.substr(Prefix.size()))) {
151           Elts.insert(Inst->TheDef);
152           NumMatches++;
153         }
154       };
155       std::for_each(Range1.first, Range1.second, HandleNonGeneric);
156       std::for_each(Range2.first, Range2.second, HandleNonGeneric);
157 
158       if (0 == NumMatches)
159         PrintFatalError(Loc, "instregex has no matches: " + Original);
160     }
161   }
162 };
163 
164 } // end anonymous namespace
165 
/// CodeGenModels ctor interprets machine model records and populates maps.
///
/// The collection and inference steps below are run in a fixed order; several
/// of them are documented as depending on the results of earlier ones.
CodeGenSchedModels::CodeGenSchedModels(RecordKeeper &RK,
                                       const CodeGenTarget &TGT):
  Records(RK), Target(TGT) {

  Sets.addFieldExpander("InstRW", "Instrs");

  // Allow Set evaluation to recognize the dags used in InstRW records:
  // (instrs Op1, Op1...) and (instregex "Pattern", ...)
  Sets.addOperator("instrs", std::make_unique<InstrsOp>());
  Sets.addOperator("instregex", std::make_unique<InstRegexOp>(Target));

  // Instantiate a CodeGenProcModel for each SchedMachineModel with the values
  // that are explicitly referenced in tablegen records. Resources associated
  // with each processor will be derived later. Populate ProcModelMap with the
  // CodeGenProcModel instances.
  collectProcModels();

  // Instantiate a CodeGenSchedRW for each SchedReadWrite record explicitly
  // defined, and populate SchedReads and SchedWrites vectors. Implicit
  // SchedReadWrites that represent sequences derived from expanded variant will
  // be inferred later.
  collectSchedRW();

  // Instantiate a CodeGenSchedClass for each unique SchedRW signature directly
  // required by an instruction definition, and populate SchedClassIdxMap. Set
  // NumItineraryClasses to the number of explicit itinerary classes referenced
  // by instructions. Set NumInstrSchedClasses to the number of itinerary
  // classes plus any classes implied by instructions that derive from class
  // Sched and provide SchedRW list. This does not infer any new classes from
  // SchedVariant.
  collectSchedClasses();

  // Find instruction itineraries for each processor. Sort and populate
  // CodeGenProcModel::ItinDefList. (Cycle-to-cycle itineraries). This requires
  // all itinerary classes to be discovered.
  collectProcItins();

  // Find ItinRW records for each processor and itinerary class.
  // (For per-operand resources mapped to itinerary classes).
  collectProcItinRW();

  // Find UnsupportedFeatures records for each processor.
  collectProcUnsupportedFeatures();

  // Infer new SchedClasses from SchedVariant.
  inferSchedClasses();

  // Populate each CodeGenProcModel's WriteResDefs, ReadAdvanceDefs, and
  // ProcResourceDefs.
  LLVM_DEBUG(
      dbgs() << "\n+++ RESOURCE DEFINITIONS (collectProcResources) +++\n");
  collectProcResources();

  // Collect optional processor description.
  collectOptionalProcessorInfo();

  // Check MCInstPredicate definitions.
  checkMCInstPredicates();

  // Check STIPredicate definitions.
  checkSTIPredicates();

  // Find STIPredicate definitions for each processor model, and construct
  // STIPredicateFunction objects.
  collectSTIPredicates();

  // NOTE(review): collectOptionalProcessorInfo() above already ends with a
  // call to checkCompleteness(); this second call looks redundant -- confirm
  // before removing.
  checkCompleteness();
}
236 
237 void CodeGenSchedModels::checkSTIPredicates() const {
238   DenseMap<StringRef, const Record *> Declarations;
239 
240   // There cannot be multiple declarations with the same name.
241   const RecVec Decls = Records.getAllDerivedDefinitions("STIPredicateDecl");
242   for (const Record *R : Decls) {
243     StringRef Name = R->getValueAsString("Name");
244     const auto It = Declarations.find(Name);
245     if (It == Declarations.end()) {
246       Declarations[Name] = R;
247       continue;
248     }
249 
250     PrintError(R->getLoc(), "STIPredicate " + Name + " multiply declared.");
251     PrintFatalNote(It->second->getLoc(), "Previous declaration was here.");
252   }
253 
254   // Disallow InstructionEquivalenceClasses with an empty instruction list.
255   const RecVec Defs =
256       Records.getAllDerivedDefinitions("InstructionEquivalenceClass");
257   for (const Record *R : Defs) {
258     RecVec Opcodes = R->getValueAsListOfDefs("Opcodes");
259     if (Opcodes.empty()) {
260       PrintFatalError(R->getLoc(), "Invalid InstructionEquivalenceClass "
261                                    "defined with an empty opcode list.");
262     }
263   }
264 }
265 
266 // Used by function `processSTIPredicate` to construct a mask of machine
267 // instruction operands.
268 static APInt constructOperandMask(ArrayRef<int64_t> Indices) {
269   APInt OperandMask;
270   if (Indices.empty())
271     return OperandMask;
272 
273   int64_t MaxIndex = *std::max_element(Indices.begin(), Indices.end());
274   assert(MaxIndex >= 0 && "Invalid negative indices in input!");
275   OperandMask = OperandMask.zext(MaxIndex + 1);
276   for (const int64_t Index : Indices) {
277     assert(Index >= 0 && "Invalid negative indices!");
278     OperandMask.setBit(Index);
279   }
280 
281   return OperandMask;
282 }
283 
284 static void
285 processSTIPredicate(STIPredicateFunction &Fn,
286                     const DenseMap<Record *, unsigned> &ProcModelMap) {
287   DenseMap<const Record *, unsigned> Opcode2Index;
288   using OpcodeMapPair = std::pair<const Record *, OpcodeInfo>;
289   std::vector<OpcodeMapPair> OpcodeMappings;
290   std::vector<std::pair<APInt, APInt>> OpcodeMasks;
291 
292   DenseMap<const Record *, unsigned> Predicate2Index;
293   unsigned NumUniquePredicates = 0;
294 
295   // Number unique predicates and opcodes used by InstructionEquivalenceClass
296   // definitions. Each unique opcode will be associated with an OpcodeInfo
297   // object.
298   for (const Record *Def : Fn.getDefinitions()) {
299     RecVec Classes = Def->getValueAsListOfDefs("Classes");
300     for (const Record *EC : Classes) {
301       const Record *Pred = EC->getValueAsDef("Predicate");
302       if (Predicate2Index.find(Pred) == Predicate2Index.end())
303         Predicate2Index[Pred] = NumUniquePredicates++;
304 
305       RecVec Opcodes = EC->getValueAsListOfDefs("Opcodes");
306       for (const Record *Opcode : Opcodes) {
307         if (Opcode2Index.find(Opcode) == Opcode2Index.end()) {
308           Opcode2Index[Opcode] = OpcodeMappings.size();
309           OpcodeMappings.emplace_back(Opcode, OpcodeInfo());
310         }
311       }
312     }
313   }
314 
315   // Initialize vector `OpcodeMasks` with default values.  We want to keep track
316   // of which processors "use" which opcodes.  We also want to be able to
317   // identify predicates that are used by different processors for a same
318   // opcode.
319   // This information is used later on by this algorithm to sort OpcodeMapping
320   // elements based on their processor and predicate sets.
321   OpcodeMasks.resize(OpcodeMappings.size());
322   APInt DefaultProcMask(ProcModelMap.size(), 0);
323   APInt DefaultPredMask(NumUniquePredicates, 0);
324   for (std::pair<APInt, APInt> &MaskPair : OpcodeMasks)
325     MaskPair = std::make_pair(DefaultProcMask, DefaultPredMask);
326 
327   // Construct a OpcodeInfo object for every unique opcode declared by an
328   // InstructionEquivalenceClass definition.
329   for (const Record *Def : Fn.getDefinitions()) {
330     RecVec Classes = Def->getValueAsListOfDefs("Classes");
331     const Record *SchedModel = Def->getValueAsDef("SchedModel");
332     unsigned ProcIndex = ProcModelMap.find(SchedModel)->second;
333     APInt ProcMask(ProcModelMap.size(), 0);
334     ProcMask.setBit(ProcIndex);
335 
336     for (const Record *EC : Classes) {
337       RecVec Opcodes = EC->getValueAsListOfDefs("Opcodes");
338 
339       std::vector<int64_t> OpIndices =
340           EC->getValueAsListOfInts("OperandIndices");
341       APInt OperandMask = constructOperandMask(OpIndices);
342 
343       const Record *Pred = EC->getValueAsDef("Predicate");
344       APInt PredMask(NumUniquePredicates, 0);
345       PredMask.setBit(Predicate2Index[Pred]);
346 
347       for (const Record *Opcode : Opcodes) {
348         unsigned OpcodeIdx = Opcode2Index[Opcode];
349         if (OpcodeMasks[OpcodeIdx].first[ProcIndex]) {
350           std::string Message =
351               "Opcode " + Opcode->getName().str() +
352               " used by multiple InstructionEquivalenceClass definitions.";
353           PrintFatalError(EC->getLoc(), Message);
354         }
355         OpcodeMasks[OpcodeIdx].first |= ProcMask;
356         OpcodeMasks[OpcodeIdx].second |= PredMask;
357         OpcodeInfo &OI = OpcodeMappings[OpcodeIdx].second;
358 
359         OI.addPredicateForProcModel(ProcMask, OperandMask, Pred);
360       }
361     }
362   }
363 
364   // Sort OpcodeMappings elements based on their CPU and predicate masks.
365   // As a last resort, order elements by opcode identifier.
366   llvm::sort(OpcodeMappings,
367              [&](const OpcodeMapPair &Lhs, const OpcodeMapPair &Rhs) {
368                unsigned LhsIdx = Opcode2Index[Lhs.first];
369                unsigned RhsIdx = Opcode2Index[Rhs.first];
370                const std::pair<APInt, APInt> &LhsMasks = OpcodeMasks[LhsIdx];
371                const std::pair<APInt, APInt> &RhsMasks = OpcodeMasks[RhsIdx];
372 
373                auto LessThan = [](const APInt &Lhs, const APInt &Rhs) {
374                  unsigned LhsCountPopulation = Lhs.countPopulation();
375                  unsigned RhsCountPopulation = Rhs.countPopulation();
376                  return ((LhsCountPopulation < RhsCountPopulation) ||
377                          ((LhsCountPopulation == RhsCountPopulation) &&
378                           (Lhs.countLeadingZeros() > Rhs.countLeadingZeros())));
379                };
380 
381                if (LhsMasks.first != RhsMasks.first)
382                  return LessThan(LhsMasks.first, RhsMasks.first);
383 
384                if (LhsMasks.second != RhsMasks.second)
385                  return LessThan(LhsMasks.second, RhsMasks.second);
386 
387                return LhsIdx < RhsIdx;
388              });
389 
390   // Now construct opcode groups. Groups are used by the SubtargetEmitter when
391   // expanding the body of a STIPredicate function. In particular, each opcode
392   // group is expanded into a sequence of labels in a switch statement.
393   // It identifies opcodes for which different processors define same predicates
394   // and same opcode masks.
395   for (OpcodeMapPair &Info : OpcodeMappings)
396     Fn.addOpcode(Info.first, std::move(Info.second));
397 }
398 
399 void CodeGenSchedModels::collectSTIPredicates() {
400   // Map STIPredicateDecl records to elements of vector
401   // CodeGenSchedModels::STIPredicates.
402   DenseMap<const Record *, unsigned> Decl2Index;
403 
404   RecVec RV = Records.getAllDerivedDefinitions("STIPredicate");
405   for (const Record *R : RV) {
406     const Record *Decl = R->getValueAsDef("Declaration");
407 
408     const auto It = Decl2Index.find(Decl);
409     if (It == Decl2Index.end()) {
410       Decl2Index[Decl] = STIPredicates.size();
411       STIPredicateFunction Predicate(Decl);
412       Predicate.addDefinition(R);
413       STIPredicates.emplace_back(std::move(Predicate));
414       continue;
415     }
416 
417     STIPredicateFunction &PreviousDef = STIPredicates[It->second];
418     PreviousDef.addDefinition(R);
419   }
420 
421   for (STIPredicateFunction &Fn : STIPredicates)
422     processSTIPredicate(Fn, ProcModelMap);
423 }
424 
425 void OpcodeInfo::addPredicateForProcModel(const llvm::APInt &CpuMask,
426                                           const llvm::APInt &OperandMask,
427                                           const Record *Predicate) {
428   auto It = llvm::find_if(
429       Predicates, [&OperandMask, &Predicate](const PredicateInfo &P) {
430         return P.Predicate == Predicate && P.OperandMask == OperandMask;
431       });
432   if (It == Predicates.end()) {
433     Predicates.emplace_back(CpuMask, OperandMask, Predicate);
434     return;
435   }
436   It->ProcModelMask |= CpuMask;
437 }
438 
439 void CodeGenSchedModels::checkMCInstPredicates() const {
440   RecVec MCPredicates = Records.getAllDerivedDefinitions("TIIPredicate");
441   if (MCPredicates.empty())
442     return;
443 
444   // A target cannot have multiple TIIPredicate definitions with a same name.
445   llvm::StringMap<const Record *> TIIPredicates(MCPredicates.size());
446   for (const Record *TIIPred : MCPredicates) {
447     StringRef Name = TIIPred->getValueAsString("FunctionName");
448     StringMap<const Record *>::const_iterator It = TIIPredicates.find(Name);
449     if (It == TIIPredicates.end()) {
450       TIIPredicates[Name] = TIIPred;
451       continue;
452     }
453 
454     PrintError(TIIPred->getLoc(),
455                "TIIPredicate " + Name + " is multiply defined.");
456     PrintFatalNote(It->second->getLoc(),
457                    " Previous definition of " + Name + " was here.");
458   }
459 }
460 
461 void CodeGenSchedModels::collectRetireControlUnits() {
462   RecVec Units = Records.getAllDerivedDefinitions("RetireControlUnit");
463 
464   for (Record *RCU : Units) {
465     CodeGenProcModel &PM = getProcModel(RCU->getValueAsDef("SchedModel"));
466     if (PM.RetireControlUnit) {
467       PrintError(RCU->getLoc(),
468                  "Expected a single RetireControlUnit definition");
469       PrintNote(PM.RetireControlUnit->getLoc(),
470                 "Previous definition of RetireControlUnit was here");
471     }
472     PM.RetireControlUnit = RCU;
473   }
474 }
475 
476 void CodeGenSchedModels::collectLoadStoreQueueInfo() {
477   RecVec Queues = Records.getAllDerivedDefinitions("MemoryQueue");
478 
479   for (Record *Queue : Queues) {
480     CodeGenProcModel &PM = getProcModel(Queue->getValueAsDef("SchedModel"));
481     if (Queue->isSubClassOf("LoadQueue")) {
482       if (PM.LoadQueue) {
483         PrintError(Queue->getLoc(),
484                    "Expected a single LoadQueue definition");
485         PrintNote(PM.LoadQueue->getLoc(),
486                   "Previous definition of LoadQueue was here");
487       }
488 
489       PM.LoadQueue = Queue;
490     }
491 
492     if (Queue->isSubClassOf("StoreQueue")) {
493       if (PM.StoreQueue) {
494         PrintError(Queue->getLoc(),
495                    "Expected a single StoreQueue definition");
496         PrintNote(PM.LoadQueue->getLoc(),
497                   "Previous definition of StoreQueue was here");
498       }
499 
500       PM.StoreQueue = Queue;
501     }
502   }
503 }
504 
/// Collect optional processor information: register files, retire control
/// units and load/store queues, then run the completeness check.
void CodeGenSchedModels::collectOptionalProcessorInfo() {
  // Find register file definitions for each processor.
  collectRegisterFiles();

  // Collect processor RetireControlUnit descriptors if available.
  collectRetireControlUnits();

  // Collect information about load/store queues.
  collectLoadStoreQueueInfo();

  // NOTE(review): the constructor also calls checkCompleteness() after this
  // function returns -- confirm whether both calls are needed.
  checkCompleteness();
}
518 
519 /// Gather all processor models.
520 void CodeGenSchedModels::collectProcModels() {
521   RecVec ProcRecords = Records.getAllDerivedDefinitions("Processor");
522   llvm::sort(ProcRecords, LessRecordFieldName());
523 
524   // Reserve space because we can. Reallocation would be ok.
525   ProcModels.reserve(ProcRecords.size()+1);
526 
527   // Use idx=0 for NoModel/NoItineraries.
528   Record *NoModelDef = Records.getDef("NoSchedModel");
529   Record *NoItinsDef = Records.getDef("NoItineraries");
530   ProcModels.emplace_back(0, "NoSchedModel", NoModelDef, NoItinsDef);
531   ProcModelMap[NoModelDef] = 0;
532 
533   // For each processor, find a unique machine model.
534   LLVM_DEBUG(dbgs() << "+++ PROCESSOR MODELs (addProcModel) +++\n");
535   for (Record *ProcRecord : ProcRecords)
536     addProcModel(ProcRecord);
537 }
538 
539 /// Get a unique processor model based on the defined MachineModel and
540 /// ProcessorItineraries.
541 void CodeGenSchedModels::addProcModel(Record *ProcDef) {
542   Record *ModelKey = getModelOrItinDef(ProcDef);
543   if (!ProcModelMap.insert(std::make_pair(ModelKey, ProcModels.size())).second)
544     return;
545 
546   std::string Name = std::string(ModelKey->getName());
547   if (ModelKey->isSubClassOf("SchedMachineModel")) {
548     Record *ItinsDef = ModelKey->getValueAsDef("Itineraries");
549     ProcModels.emplace_back(ProcModels.size(), Name, ModelKey, ItinsDef);
550   }
551   else {
552     // An itinerary is defined without a machine model. Infer a new model.
553     if (!ModelKey->getValueAsListOfDefs("IID").empty())
554       Name = Name + "Model";
555     ProcModels.emplace_back(ProcModels.size(), Name,
556                             ProcDef->getValueAsDef("SchedModel"), ModelKey);
557   }
558   LLVM_DEBUG(ProcModels.back().dump());
559 }
560 
561 // Recursively find all reachable SchedReadWrite records.
562 static void scanSchedRW(Record *RWDef, RecVec &RWDefs,
563                         SmallPtrSet<Record*, 16> &RWSet) {
564   if (!RWSet.insert(RWDef).second)
565     return;
566   RWDefs.push_back(RWDef);
567   // Reads don't currently have sequence records, but it can be added later.
568   if (RWDef->isSubClassOf("WriteSequence")) {
569     RecVec Seq = RWDef->getValueAsListOfDefs("Writes");
570     for (Record *WSRec : Seq)
571       scanSchedRW(WSRec, RWDefs, RWSet);
572   }
573   else if (RWDef->isSubClassOf("SchedVariant")) {
574     // Visit each variant (guarded by a different predicate).
575     RecVec Vars = RWDef->getValueAsListOfDefs("Variants");
576     for (Record *Variant : Vars) {
577       // Visit each RW in the sequence selected by the current variant.
578       RecVec Selected = Variant->getValueAsListOfDefs("Selected");
579       for (Record *SelDef : Selected)
580         scanSchedRW(SelDef, RWDefs, RWSet);
581     }
582   }
583 }
584 
585 // Collect and sort all SchedReadWrites reachable via tablegen records.
586 // More may be inferred later when inferring new SchedClasses from variants.
587 void CodeGenSchedModels::collectSchedRW() {
588   // Reserve idx=0 for invalid writes/reads.
589   SchedWrites.resize(1);
590   SchedReads.resize(1);
591 
592   SmallPtrSet<Record*, 16> RWSet;
593 
594   // Find all SchedReadWrites referenced by instruction defs.
595   RecVec SWDefs, SRDefs;
596   for (const CodeGenInstruction *Inst : Target.getInstructionsByEnumValue()) {
597     Record *SchedDef = Inst->TheDef;
598     if (SchedDef->isValueUnset("SchedRW"))
599       continue;
600     RecVec RWs = SchedDef->getValueAsListOfDefs("SchedRW");
601     for (Record *RW : RWs) {
602       if (RW->isSubClassOf("SchedWrite"))
603         scanSchedRW(RW, SWDefs, RWSet);
604       else {
605         assert(RW->isSubClassOf("SchedRead") && "Unknown SchedReadWrite");
606         scanSchedRW(RW, SRDefs, RWSet);
607       }
608     }
609   }
610   // Find all ReadWrites referenced by InstRW.
611   RecVec InstRWDefs = Records.getAllDerivedDefinitions("InstRW");
612   for (Record *InstRWDef : InstRWDefs) {
613     // For all OperandReadWrites.
614     RecVec RWDefs = InstRWDef->getValueAsListOfDefs("OperandReadWrites");
615     for (Record *RWDef : RWDefs) {
616       if (RWDef->isSubClassOf("SchedWrite"))
617         scanSchedRW(RWDef, SWDefs, RWSet);
618       else {
619         assert(RWDef->isSubClassOf("SchedRead") && "Unknown SchedReadWrite");
620         scanSchedRW(RWDef, SRDefs, RWSet);
621       }
622     }
623   }
624   // Find all ReadWrites referenced by ItinRW.
625   RecVec ItinRWDefs = Records.getAllDerivedDefinitions("ItinRW");
626   for (Record *ItinRWDef : ItinRWDefs) {
627     // For all OperandReadWrites.
628     RecVec RWDefs = ItinRWDef->getValueAsListOfDefs("OperandReadWrites");
629     for (Record *RWDef : RWDefs) {
630       if (RWDef->isSubClassOf("SchedWrite"))
631         scanSchedRW(RWDef, SWDefs, RWSet);
632       else {
633         assert(RWDef->isSubClassOf("SchedRead") && "Unknown SchedReadWrite");
634         scanSchedRW(RWDef, SRDefs, RWSet);
635       }
636     }
637   }
638   // Find all ReadWrites referenced by SchedAlias. AliasDefs needs to be sorted
639   // for the loop below that initializes Alias vectors.
640   RecVec AliasDefs = Records.getAllDerivedDefinitions("SchedAlias");
641   llvm::sort(AliasDefs, LessRecord());
642   for (Record *ADef : AliasDefs) {
643     Record *MatchDef = ADef->getValueAsDef("MatchRW");
644     Record *AliasDef = ADef->getValueAsDef("AliasRW");
645     if (MatchDef->isSubClassOf("SchedWrite")) {
646       if (!AliasDef->isSubClassOf("SchedWrite"))
647         PrintFatalError(ADef->getLoc(), "SchedWrite Alias must be SchedWrite");
648       scanSchedRW(AliasDef, SWDefs, RWSet);
649     }
650     else {
651       assert(MatchDef->isSubClassOf("SchedRead") && "Unknown SchedReadWrite");
652       if (!AliasDef->isSubClassOf("SchedRead"))
653         PrintFatalError(ADef->getLoc(), "SchedRead Alias must be SchedRead");
654       scanSchedRW(AliasDef, SRDefs, RWSet);
655     }
656   }
657   // Sort and add the SchedReadWrites directly referenced by instructions or
658   // itinerary resources. Index reads and writes in separate domains.
659   llvm::sort(SWDefs, LessRecord());
660   for (Record *SWDef : SWDefs) {
661     assert(!getSchedRWIdx(SWDef, /*IsRead=*/false) && "duplicate SchedWrite");
662     SchedWrites.emplace_back(SchedWrites.size(), SWDef);
663   }
664   llvm::sort(SRDefs, LessRecord());
665   for (Record *SRDef : SRDefs) {
666     assert(!getSchedRWIdx(SRDef, /*IsRead-*/true) && "duplicate SchedWrite");
667     SchedReads.emplace_back(SchedReads.size(), SRDef);
668   }
669   // Initialize WriteSequence vectors.
670   for (CodeGenSchedRW &CGRW : SchedWrites) {
671     if (!CGRW.IsSequence)
672       continue;
673     findRWs(CGRW.TheDef->getValueAsListOfDefs("Writes"), CGRW.Sequence,
674             /*IsRead=*/false);
675   }
676   // Initialize Aliases vectors.
677   for (Record *ADef : AliasDefs) {
678     Record *AliasDef = ADef->getValueAsDef("AliasRW");
679     getSchedRW(AliasDef).IsAlias = true;
680     Record *MatchDef = ADef->getValueAsDef("MatchRW");
681     CodeGenSchedRW &RW = getSchedRW(MatchDef);
682     if (RW.IsAlias)
683       PrintFatalError(ADef->getLoc(), "Cannot Alias an Alias");
684     RW.Aliases.push_back(ADef);
685   }
686   LLVM_DEBUG(
687       dbgs() << "\n+++ SCHED READS and WRITES (collectSchedRW) +++\n";
688       for (unsigned WIdx = 0, WEnd = SchedWrites.size(); WIdx != WEnd; ++WIdx) {
689         dbgs() << WIdx << ": ";
690         SchedWrites[WIdx].dump();
691         dbgs() << '\n';
692       } for (unsigned RIdx = 0, REnd = SchedReads.size(); RIdx != REnd;
693              ++RIdx) {
694         dbgs() << RIdx << ": ";
695         SchedReads[RIdx].dump();
696         dbgs() << '\n';
697       } RecVec RWDefs = Records.getAllDerivedDefinitions("SchedReadWrite");
698       for (Record *RWDef
699            : RWDefs) {
700         if (!getSchedRWIdx(RWDef, RWDef->isSubClassOf("SchedRead"))) {
701           StringRef Name = RWDef->getName();
702           if (Name != "NoWrite" && Name != "ReadDefault")
703             dbgs() << "Unused SchedReadWrite " << Name << '\n';
704         }
705       });
706 }
707 
708 /// Compute a SchedWrite name from a sequence of writes.
709 std::string CodeGenSchedModels::genRWName(ArrayRef<unsigned> Seq, bool IsRead) {
710   std::string Name("(");
711   for (auto I = Seq.begin(), E = Seq.end(); I != E; ++I) {
712     if (I != Seq.begin())
713       Name += '_';
714     Name += getSchedRW(*I, IsRead).Name;
715   }
716   Name += ')';
717   return Name;
718 }
719 
720 unsigned CodeGenSchedModels::getSchedRWIdx(const Record *Def,
721                                            bool IsRead) const {
722   const std::vector<CodeGenSchedRW> &RWVec = IsRead ? SchedReads : SchedWrites;
723   const auto I = find_if(
724       RWVec, [Def](const CodeGenSchedRW &RW) { return RW.TheDef == Def; });
725   return I == RWVec.end() ? 0 : std::distance(RWVec.begin(), I);
726 }
727 
728 bool CodeGenSchedModels::hasReadOfWrite(Record *WriteDef) const {
729   for (const CodeGenSchedRW &Read : SchedReads) {
730     Record *ReadDef = Read.TheDef;
731     if (!ReadDef || !ReadDef->isSubClassOf("ProcReadAdvance"))
732       continue;
733 
734     RecVec ValidWrites = ReadDef->getValueAsListOfDefs("ValidWrites");
735     if (is_contained(ValidWrites, WriteDef)) {
736       return true;
737     }
738   }
739   return false;
740 }
741 
742 static void splitSchedReadWrites(const RecVec &RWDefs,
743                                  RecVec &WriteDefs, RecVec &ReadDefs) {
744   for (Record *RWDef : RWDefs) {
745     if (RWDef->isSubClassOf("SchedWrite"))
746       WriteDefs.push_back(RWDef);
747     else {
748       assert(RWDef->isSubClassOf("SchedRead") && "unknown SchedReadWrite");
749       ReadDefs.push_back(RWDef);
750     }
751   }
752 }
753 
754 // Split the SchedReadWrites defs and call findRWs for each list.
755 void CodeGenSchedModels::findRWs(const RecVec &RWDefs,
756                                  IdxVec &Writes, IdxVec &Reads) const {
757   RecVec WriteDefs;
758   RecVec ReadDefs;
759   splitSchedReadWrites(RWDefs, WriteDefs, ReadDefs);
760   findRWs(WriteDefs, Writes, false);
761   findRWs(ReadDefs, Reads, true);
762 }
763 
764 // Call getSchedRWIdx for all elements in a sequence of SchedRW defs.
765 void CodeGenSchedModels::findRWs(const RecVec &RWDefs, IdxVec &RWs,
766                                  bool IsRead) const {
767   for (Record *RWDef : RWDefs) {
768     unsigned Idx = getSchedRWIdx(RWDef, IsRead);
769     assert(Idx && "failed to collect SchedReadWrite");
770     RWs.push_back(Idx);
771   }
772 }
773 
774 void CodeGenSchedModels::expandRWSequence(unsigned RWIdx, IdxVec &RWSeq,
775                                           bool IsRead) const {
776   const CodeGenSchedRW &SchedRW = getSchedRW(RWIdx, IsRead);
777   if (!SchedRW.IsSequence) {
778     RWSeq.push_back(RWIdx);
779     return;
780   }
781   int Repeat =
782     SchedRW.TheDef ? SchedRW.TheDef->getValueAsInt("Repeat") : 1;
783   for (int i = 0; i < Repeat; ++i) {
784     for (unsigned I : SchedRW.Sequence) {
785       expandRWSequence(I, RWSeq, IsRead);
786     }
787   }
788 }
789 
790 // Expand a SchedWrite as a sequence following any aliases that coincide with
791 // the given processor model.
792 void CodeGenSchedModels::expandRWSeqForProc(
793   unsigned RWIdx, IdxVec &RWSeq, bool IsRead,
794   const CodeGenProcModel &ProcModel) const {
795 
796   const CodeGenSchedRW &SchedWrite = getSchedRW(RWIdx, IsRead);
797   Record *AliasDef = nullptr;
798   for (const Record *Rec : SchedWrite.Aliases) {
799     const CodeGenSchedRW &AliasRW = getSchedRW(Rec->getValueAsDef("AliasRW"));
800     if (Rec->getValueInit("SchedModel")->isComplete()) {
801       Record *ModelDef = Rec->getValueAsDef("SchedModel");
802       if (&getProcModel(ModelDef) != &ProcModel)
803         continue;
804     }
805     if (AliasDef)
806       PrintFatalError(AliasRW.TheDef->getLoc(), "Multiple aliases "
807                       "defined for processor " + ProcModel.ModelName +
808                       " Ensure only one SchedAlias exists per RW.");
809     AliasDef = AliasRW.TheDef;
810   }
811   if (AliasDef) {
812     expandRWSeqForProc(getSchedRWIdx(AliasDef, IsRead),
813                        RWSeq, IsRead,ProcModel);
814     return;
815   }
816   if (!SchedWrite.IsSequence) {
817     RWSeq.push_back(RWIdx);
818     return;
819   }
820   int Repeat =
821     SchedWrite.TheDef ? SchedWrite.TheDef->getValueAsInt("Repeat") : 1;
822   for (int I = 0, E = Repeat; I < E; ++I) {
823     for (unsigned Idx : SchedWrite.Sequence) {
824       expandRWSeqForProc(Idx, RWSeq, IsRead, ProcModel);
825     }
826   }
827 }
828 
829 // Find the existing SchedWrite that models this sequence of writes.
830 unsigned CodeGenSchedModels::findRWForSequence(ArrayRef<unsigned> Seq,
831                                                bool IsRead) {
832   std::vector<CodeGenSchedRW> &RWVec = IsRead ? SchedReads : SchedWrites;
833 
834   auto I = find_if(RWVec, [Seq](CodeGenSchedRW &RW) {
835     return makeArrayRef(RW.Sequence) == Seq;
836   });
837   // Index zero reserved for invalid RW.
838   return I == RWVec.end() ? 0 : std::distance(RWVec.begin(), I);
839 }
840 
841 /// Add this ReadWrite if it doesn't already exist.
842 unsigned CodeGenSchedModels::findOrInsertRW(ArrayRef<unsigned> Seq,
843                                             bool IsRead) {
844   assert(!Seq.empty() && "cannot insert empty sequence");
845   if (Seq.size() == 1)
846     return Seq.back();
847 
848   unsigned Idx = findRWForSequence(Seq, IsRead);
849   if (Idx)
850     return Idx;
851 
852   std::vector<CodeGenSchedRW> &RWVec = IsRead ? SchedReads : SchedWrites;
853   unsigned RWIdx = RWVec.size();
854   CodeGenSchedRW SchedRW(RWIdx, IsRead, Seq, genRWName(Seq, IsRead));
855   RWVec.push_back(SchedRW);
856   return RWIdx;
857 }
858 
/// Visit all the instruction definitions for this target to gather and
/// enumerate the itinerary classes. These are the explicitly specified
/// SchedClasses. More SchedClasses may be inferred.
///
/// Steps performed here:
///  1. Create class 0 ("NoInstrModel") from the NoItinerary record.
///  2. Map every instruction to a class keyed by its Itinerary and SchedRW
///     list (via addSchedClass) and record the mapping in InstrClassMap.
///  3. Feed every InstRW record, in LessRecord order, to createInstRWClass.
///  4. Record the resulting class count in NumInstrSchedClasses.
/// Everything after that only produces debug output and is skipped unless
/// LLVM_DEBUG is active for this DEBUG_TYPE.
void CodeGenSchedModels::collectSchedClasses() {

  // NoItinerary is always the first class at Idx=0
  assert(SchedClasses.empty() && "Expected empty sched class");
  SchedClasses.emplace_back(0, "NoInstrModel",
                            Records.getDef("NoItinerary"));
  SchedClasses.back().ProcIndices.push_back(0);

  // Create a SchedClass for each unique combination of itinerary class and
  // SchedRW list.
  for (const CodeGenInstruction *Inst : Target.getInstructionsByEnumValue()) {
    Record *ItinDef = Inst->TheDef->getValueAsDef("Itinerary");
    // Writes/Reads stay empty when the instruction leaves SchedRW unset.
    IdxVec Writes, Reads;
    if (!Inst->TheDef->isValueUnset("SchedRW"))
      findRWs(Inst->TheDef->getValueAsListOfDefs("SchedRW"), Writes, Reads);

    // ProcIdx == 0 indicates the class applies to all processors.
    unsigned SCIdx = addSchedClass(ItinDef, Writes, Reads, /*ProcIndices*/{0});
    InstrClassMap[Inst->TheDef] = SCIdx;
  }
  // Create classes for InstRW defs.
  RecVec InstRWDefs = Records.getAllDerivedDefinitions("InstRW");
  llvm::sort(InstRWDefs, LessRecord());
  LLVM_DEBUG(dbgs() << "\n+++ SCHED CLASSES (createInstRWClass) +++\n");
  for (Record *RWDef : InstRWDefs)
    createInstRWClass(RWDef);

  // Remember how many classes exist at this point.
  NumInstrSchedClasses = SchedClasses.size();

  // EnableDump only becomes true if the LLVM_DEBUG statement below executes;
  // otherwise the diagnostic walk that follows is skipped entirely.
  bool EnableDump = false;
  LLVM_DEBUG(EnableDump = true);
  if (!EnableDump)
    return;

  LLVM_DEBUG(
      dbgs()
      << "\n+++ ITINERARIES and/or MACHINE MODELS (collectSchedClasses) +++\n");
  for (const CodeGenInstruction *Inst : Target.getInstructionsByEnumValue()) {
    StringRef InstName = Inst->TheDef->getName();
    unsigned SCIdx = getSchedClassIdx(*Inst);
    // Class index zero means the instruction has no machine model.
    if (!SCIdx) {
      LLVM_DEBUG({
        if (!Inst->hasNoSchedulingInfo)
          dbgs() << "No machine model for " << Inst->TheDef->getName() << '\n';
      });
      continue;
    }
    CodeGenSchedClass &SC = getSchedClass(SCIdx);
    if (SC.ProcIndices[0] != 0)
      PrintFatalError(Inst->TheDef->getLoc(), "Instruction's sched class "
                      "must not be subtarget specific.");

    // Processor indices for which some model of this instruction was found;
    // only consumed by the "No machine model" report at the end of the loop.
    IdxVec ProcIndices;
    if (SC.ItinClassDef->getName() != "NoItinerary") {
      ProcIndices.push_back(0);
      // Not wrapped in LLVM_DEBUG; this point is only reached when EnableDump
      // was set above.
      dbgs() << "Itinerary for " << InstName << ": "
             << SC.ItinClassDef->getName() << '\n';
    }
    if (!SC.Writes.empty()) {
      ProcIndices.push_back(0);
      LLVM_DEBUG({
        dbgs() << "SchedRW machine model for " << InstName;
        for (IdxIter WI = SC.Writes.begin(), WE = SC.Writes.end(); WI != WE;
             ++WI)
          dbgs() << " " << SchedWrites[*WI].Name;
        for (IdxIter RI = SC.Reads.begin(), RE = SC.Reads.end(); RI != RE; ++RI)
          dbgs() << " " << SchedReads[*RI].Name;
        dbgs() << '\n';
      });
    }
    // Report each per-processor InstRW attached to the class.
    const RecVec &RWDefs = SchedClasses[SCIdx].InstRWs;
    for (Record *RWDef : RWDefs) {
      const CodeGenProcModel &ProcModel =
          getProcModel(RWDef->getValueAsDef("SchedModel"));
      ProcIndices.push_back(ProcModel.Index);
      LLVM_DEBUG(dbgs() << "InstRW on " << ProcModel.ModelName << " for "
                        << InstName);
      IdxVec Writes;
      IdxVec Reads;
      findRWs(RWDef->getValueAsListOfDefs("OperandReadWrites"),
              Writes, Reads);
      LLVM_DEBUG({
        for (unsigned WIdx : Writes)
          dbgs() << " " << SchedWrites[WIdx].Name;
        for (unsigned RIdx : Reads)
          dbgs() << " " << SchedReads[RIdx].Name;
        dbgs() << '\n';
      });
    }
    // If ProcIndices contains zero, the class applies to all processors.
    LLVM_DEBUG({
      if (!std::count(ProcIndices.begin(), ProcIndices.end(), 0)) {
        for (const CodeGenProcModel &PM : ProcModels) {
          if (!std::count(ProcIndices.begin(), ProcIndices.end(), PM.Index))
            dbgs() << "No machine model for " << Inst->TheDef->getName()
                   << " on processor " << PM.ModelName << '\n';
        }
      }
    });
  }
}
963 
964 // Get the SchedClass index for an instruction.
965 unsigned
966 CodeGenSchedModels::getSchedClassIdx(const CodeGenInstruction &Inst) const {
967   return InstrClassMap.lookup(Inst.TheDef);
968 }
969 
970 std::string
971 CodeGenSchedModels::createSchedClassName(Record *ItinClassDef,
972                                          ArrayRef<unsigned> OperWrites,
973                                          ArrayRef<unsigned> OperReads) {
974 
975   std::string Name;
976   if (ItinClassDef && ItinClassDef->getName() != "NoItinerary")
977     Name = std::string(ItinClassDef->getName());
978   for (unsigned Idx : OperWrites) {
979     if (!Name.empty())
980       Name += '_';
981     Name += SchedWrites[Idx].Name;
982   }
983   for (unsigned Idx : OperReads) {
984     Name += '_';
985     Name += SchedReads[Idx].Name;
986   }
987   return Name;
988 }
989 
990 std::string CodeGenSchedModels::createSchedClassName(const RecVec &InstDefs) {
991 
992   std::string Name;
993   for (RecIter I = InstDefs.begin(), E = InstDefs.end(); I != E; ++I) {
994     if (I != InstDefs.begin())
995       Name += '_';
996     Name += (*I)->getName();
997   }
998   return Name;
999 }
1000 
1001 /// Add an inferred sched class from an itinerary class and per-operand list of
1002 /// SchedWrites and SchedReads. ProcIndices contains the set of IDs of
1003 /// processors that may utilize this class.
1004 unsigned CodeGenSchedModels::addSchedClass(Record *ItinClassDef,
1005                                            ArrayRef<unsigned> OperWrites,
1006                                            ArrayRef<unsigned> OperReads,
1007                                            ArrayRef<unsigned> ProcIndices) {
1008   assert(!ProcIndices.empty() && "expect at least one ProcIdx");
1009 
1010   auto IsKeyEqual = [=](const CodeGenSchedClass &SC) {
1011                      return SC.isKeyEqual(ItinClassDef, OperWrites, OperReads);
1012                    };
1013 
1014   auto I = find_if(make_range(schedClassBegin(), schedClassEnd()), IsKeyEqual);
1015   unsigned Idx = I == schedClassEnd() ? 0 : std::distance(schedClassBegin(), I);
1016   if (Idx || SchedClasses[0].isKeyEqual(ItinClassDef, OperWrites, OperReads)) {
1017     IdxVec PI;
1018     std::set_union(SchedClasses[Idx].ProcIndices.begin(),
1019                    SchedClasses[Idx].ProcIndices.end(),
1020                    ProcIndices.begin(), ProcIndices.end(),
1021                    std::back_inserter(PI));
1022     SchedClasses[Idx].ProcIndices = std::move(PI);
1023     return Idx;
1024   }
1025   Idx = SchedClasses.size();
1026   SchedClasses.emplace_back(Idx,
1027                             createSchedClassName(ItinClassDef, OperWrites,
1028                                                  OperReads),
1029                             ItinClassDef);
1030   CodeGenSchedClass &SC = SchedClasses.back();
1031   SC.Writes = OperWrites;
1032   SC.Reads = OperReads;
1033   SC.ProcIndices = ProcIndices;
1034 
1035   return Idx;
1036 }
1037 
// Create classes for each set of opcodes that are in the same InstReadWrite
// definition across all processors.
//
// The instructions named by InstRWDef are grouped by the class they currently
// map to. For each group, either the existing class is reused (when the group
// covers every instruction still mapped to that class through its first
// InstRW) or a new class is created, the group's instructions are remapped to
// it, and the old class's InstRWs are carried over. An InstRW that overlaps a
// previous one for the same SchedModel is reported as a fatal error.
void CodeGenSchedModels::createInstRWClass(Record *InstRWDef) {
  // ClassInstrs will hold an entry for each subset of Instrs in InstRWDef that
  // intersects with an existing class via a previous InstRWDef. Instrs that do
  // not intersect with an existing class refer back to their former class as
  // determined from ItinDef or SchedRW.
  SmallMapVector<unsigned, SmallVector<Record *, 8>, 4> ClassInstrs;
  // Sort Instrs into sets.
  const RecVec *InstDefs = Sets.expand(InstRWDef);
  if (InstDefs->empty())
    PrintFatalError(InstRWDef->getLoc(), "No matching instruction opcodes");

  // Group the instructions by their current class index.
  for (Record *InstDef : *InstDefs) {
    InstClassMapTy::const_iterator Pos = InstrClassMap.find(InstDef);
    if (Pos == InstrClassMap.end())
      PrintFatalError(InstDef->getLoc(), "No sched class for instruction.");
    unsigned SCIdx = Pos->second;
    ClassInstrs[SCIdx].push_back(InstDef);
  }
  // For each set of Instrs, create a new class if necessary, and map or remap
  // the Instrs to it.
  for (auto &Entry : ClassInstrs) {
    unsigned OldSCIdx = Entry.first;
    // Note: this shadows the function-level InstDefs with just this group.
    ArrayRef<Record*> InstDefs = Entry.second;
    // If all the instrs in the current class are accounted for, then leave
    // them mapped to their old class.
    if (OldSCIdx) {
      const RecVec &RWDefs = SchedClasses[OldSCIdx].InstRWs;
      if (!RWDefs.empty()) {
        // Count how many instructions of the class's first InstRW are still
        // mapped to the old class.
        const RecVec *OrigInstDefs = Sets.expand(RWDefs[0]);
        unsigned OrigNumInstrs =
          count_if(*OrigInstDefs, [&](Record *OIDef) {
                     return InstrClassMap[OIDef] == OldSCIdx;
                   });
        if (OrigNumInstrs == InstDefs.size()) {
          assert(SchedClasses[OldSCIdx].ProcIndices[0] == 0 &&
                 "expected a generic SchedClass");
          Record *RWModelDef = InstRWDef->getValueAsDef("SchedModel");
          // Make sure we didn't already have a InstRW containing this
          // instruction on this model.
          for (Record *RWD : RWDefs) {
            if (RWD->getValueAsDef("SchedModel") == RWModelDef &&
                RWModelDef->getValueAsBit("FullInstRWOverlapCheck")) {
              assert(!InstDefs.empty()); // Checked at function start.
              PrintError(
                  InstRWDef->getLoc(),
                  "Overlapping InstRW definition for \"" +
                      InstDefs.front()->getName() +
                      "\" also matches previous \"" +
                      RWD->getValue("Instrs")->getValue()->getAsString() +
                      "\".");
              PrintFatalNote(RWD->getLoc(), "Previous match was here.");
            }
          }
          LLVM_DEBUG(dbgs() << "InstRW: Reuse SC " << OldSCIdx << ":"
                            << SchedClasses[OldSCIdx].Name << " on "
                            << RWModelDef->getName() << "\n");
          SchedClasses[OldSCIdx].InstRWs.push_back(InstRWDef);
          continue;
        }
      }
    }
    // Otherwise split this group off into a brand new class.
    unsigned SCIdx = SchedClasses.size();
    SchedClasses.emplace_back(SCIdx, createSchedClassName(InstDefs), nullptr);
    CodeGenSchedClass &SC = SchedClasses.back();
    LLVM_DEBUG(dbgs() << "InstRW: New SC " << SCIdx << ":" << SC.Name << " on "
                      << InstRWDef->getValueAsDef("SchedModel")->getName()
                      << "\n");

    // Preserve ItinDef and Writes/Reads for processors without an InstRW entry.
    SC.ItinClassDef = SchedClasses[OldSCIdx].ItinClassDef;
    SC.Writes = SchedClasses[OldSCIdx].Writes;
    SC.Reads = SchedClasses[OldSCIdx].Reads;
    SC.ProcIndices.push_back(0);
    // If we had an old class, copy its InstRWs to this new class.
    if (OldSCIdx) {
      Record *RWModelDef = InstRWDef->getValueAsDef("SchedModel");
      for (Record *OldRWDef : SchedClasses[OldSCIdx].InstRWs) {
        // Here the overlap is reported regardless of FullInstRWOverlapCheck.
        if (OldRWDef->getValueAsDef("SchedModel") == RWModelDef) {
          assert(!InstDefs.empty()); // Checked at function start.
          PrintError(
              InstRWDef->getLoc(),
              "Overlapping InstRW definition for \"" +
                  InstDefs.front()->getName() + "\" also matches previous \"" +
                  OldRWDef->getValue("Instrs")->getValue()->getAsString() +
                  "\".");
          PrintFatalNote(OldRWDef->getLoc(), "Previous match was here.");
        }
        assert(OldRWDef != InstRWDef &&
               "SchedClass has duplicate InstRW def");
        SC.InstRWs.push_back(OldRWDef);
      }
    }
    // Map each Instr to this new class.
    for (Record *InstDef : InstDefs)
      InstrClassMap[InstDef] = SCIdx;
    SC.InstRWs.push_back(InstRWDef);
  }
}
1138 
1139 // True if collectProcItins found anything.
1140 bool CodeGenSchedModels::hasItineraries() const {
1141   for (const CodeGenProcModel &PM : make_range(procModelBegin(),procModelEnd()))
1142     if (PM.hasItineraries())
1143       return true;
1144   return false;
1145 }
1146 
1147 // Gather the processor itineraries.
1148 void CodeGenSchedModels::collectProcItins() {
1149   LLVM_DEBUG(dbgs() << "\n+++ PROBLEM ITINERARIES (collectProcItins) +++\n");
1150   for (CodeGenProcModel &ProcModel : ProcModels) {
1151     if (!ProcModel.hasItineraries())
1152       continue;
1153 
1154     RecVec ItinRecords = ProcModel.ItinsDef->getValueAsListOfDefs("IID");
1155     assert(!ItinRecords.empty() && "ProcModel.hasItineraries is incorrect");
1156 
1157     // Populate ItinDefList with Itinerary records.
1158     ProcModel.ItinDefList.resize(NumInstrSchedClasses);
1159 
1160     // Insert each itinerary data record in the correct position within
1161     // the processor model's ItinDefList.
1162     for (Record *ItinData : ItinRecords) {
1163       const Record *ItinDef = ItinData->getValueAsDef("TheClass");
1164       bool FoundClass = false;
1165 
1166       for (const CodeGenSchedClass &SC :
1167            make_range(schedClassBegin(), schedClassEnd())) {
1168         // Multiple SchedClasses may share an itinerary. Update all of them.
1169         if (SC.ItinClassDef == ItinDef) {
1170           ProcModel.ItinDefList[SC.Index] = ItinData;
1171           FoundClass = true;
1172         }
1173       }
1174       if (!FoundClass) {
1175         LLVM_DEBUG(dbgs() << ProcModel.ItinsDef->getName()
1176                           << " missing class for itinerary "
1177                           << ItinDef->getName() << '\n');
1178       }
1179     }
1180     // Check for missing itinerary entries.
1181     assert(!ProcModel.ItinDefList[0] && "NoItinerary class can't have rec");
1182     LLVM_DEBUG(
1183         for (unsigned i = 1, N = ProcModel.ItinDefList.size(); i < N; ++i) {
1184           if (!ProcModel.ItinDefList[i])
1185             dbgs() << ProcModel.ItinsDef->getName()
1186                    << " missing itinerary for class " << SchedClasses[i].Name
1187                    << '\n';
1188         });
1189   }
1190 }
1191 
1192 // Gather the read/write types for each itinerary class.
1193 void CodeGenSchedModels::collectProcItinRW() {
1194   RecVec ItinRWDefs = Records.getAllDerivedDefinitions("ItinRW");
1195   llvm::sort(ItinRWDefs, LessRecord());
1196   for (Record *RWDef  : ItinRWDefs) {
1197     if (!RWDef->getValueInit("SchedModel")->isComplete())
1198       PrintFatalError(RWDef->getLoc(), "SchedModel is undefined");
1199     Record *ModelDef = RWDef->getValueAsDef("SchedModel");
1200     ProcModelMapTy::const_iterator I = ProcModelMap.find(ModelDef);
1201     if (I == ProcModelMap.end()) {
1202       PrintFatalError(RWDef->getLoc(), "Undefined SchedMachineModel "
1203                     + ModelDef->getName());
1204     }
1205     ProcModels[I->second].ItinRWDefs.push_back(RWDef);
1206   }
1207 }
1208 
1209 // Gather the unsupported features for processor models.
1210 void CodeGenSchedModels::collectProcUnsupportedFeatures() {
1211   for (CodeGenProcModel &ProcModel : ProcModels) {
1212     for (Record *Pred : ProcModel.ModelDef->getValueAsListOfDefs("UnsupportedFeatures")) {
1213        ProcModel.UnsupportedFeaturesDefs.push_back(Pred);
1214     }
1215   }
1216 }
1217 
/// Infer new classes from existing classes. In the process, this may create new
/// SchedWrites from sequences of existing SchedWrites.
///
/// Each class is examined for up to three sources of inference: its itinerary
/// class, its InstRW records, and its own Writes/Reads.
void CodeGenSchedModels::inferSchedClasses() {
  LLVM_DEBUG(
      dbgs() << "\n+++ INFERRING SCHED CLASSES (inferSchedClasses) +++\n");
  LLVM_DEBUG(dbgs() << NumInstrSchedClasses << " instr sched classes.\n");

  // Visit all existing classes and newly created classes.
  // SchedClasses.size() is re-read on every iteration and each class is
  // addressed through SchedClasses[Idx] rather than a cached reference, so
  // classes appended while inferring are visited as well.
  for (unsigned Idx = 0; Idx != SchedClasses.size(); ++Idx) {
    assert(SchedClasses[Idx].Index == Idx && "bad SCIdx");

    if (SchedClasses[Idx].ItinClassDef)
      inferFromItinClass(SchedClasses[Idx].ItinClassDef, Idx);
    if (!SchedClasses[Idx].InstRWs.empty())
      inferFromInstRWs(Idx);
    if (!SchedClasses[Idx].Writes.empty()) {
      inferFromRW(SchedClasses[Idx].Writes, SchedClasses[Idx].Reads,
                  Idx, SchedClasses[Idx].ProcIndices);
    }
    // Sanity bound on growth relative to the number of instruction classes.
    assert(SchedClasses.size() < (NumInstrSchedClasses*6) &&
           "too many SchedVariants");
  }
}
1241 
1242 /// Infer classes from per-processor itinerary resources.
1243 void CodeGenSchedModels::inferFromItinClass(Record *ItinClassDef,
1244                                             unsigned FromClassIdx) {
1245   for (unsigned PIdx = 0, PEnd = ProcModels.size(); PIdx != PEnd; ++PIdx) {
1246     const CodeGenProcModel &PM = ProcModels[PIdx];
1247     // For all ItinRW entries.
1248     bool HasMatch = false;
1249     for (const Record *Rec : PM.ItinRWDefs) {
1250       RecVec Matched = Rec->getValueAsListOfDefs("MatchedItinClasses");
1251       if (!std::count(Matched.begin(), Matched.end(), ItinClassDef))
1252         continue;
1253       if (HasMatch)
1254         PrintFatalError(Rec->getLoc(), "Duplicate itinerary class "
1255                       + ItinClassDef->getName()
1256                       + " in ItinResources for " + PM.ModelName);
1257       HasMatch = true;
1258       IdxVec Writes, Reads;
1259       findRWs(Rec->getValueAsListOfDefs("OperandReadWrites"), Writes, Reads);
1260       inferFromRW(Writes, Reads, FromClassIdx, PIdx);
1261     }
1262   }
1263 }
1264 
1265 /// Infer classes from per-processor InstReadWrite definitions.
1266 void CodeGenSchedModels::inferFromInstRWs(unsigned SCIdx) {
1267   for (unsigned I = 0, E = SchedClasses[SCIdx].InstRWs.size(); I != E; ++I) {
1268     assert(SchedClasses[SCIdx].InstRWs.size() == E && "InstrRWs was mutated!");
1269     Record *Rec = SchedClasses[SCIdx].InstRWs[I];
1270     const RecVec *InstDefs = Sets.expand(Rec);
1271     RecIter II = InstDefs->begin(), IE = InstDefs->end();
1272     for (; II != IE; ++II) {
1273       if (InstrClassMap[*II] == SCIdx)
1274         break;
1275     }
1276     // If this class no longer has any instructions mapped to it, it has become
1277     // irrelevant.
1278     if (II == IE)
1279       continue;
1280     IdxVec Writes, Reads;
1281     findRWs(Rec->getValueAsListOfDefs("OperandReadWrites"), Writes, Reads);
1282     unsigned PIdx = getProcModel(Rec->getValueAsDef("SchedModel")).Index;
1283     inferFromRW(Writes, Reads, SCIdx, PIdx); // May mutate SchedClasses.
1284     SchedClasses[SCIdx].InstRWProcIndices.insert(PIdx);
1285   }
1286 }
1287 
1288 namespace {
1289 
1290 // Helper for substituteVariantOperand.
1291 struct TransVariant {
1292   Record *VarOrSeqDef;  // Variant or sequence.
1293   unsigned RWIdx;       // Index of this variant or sequence's matched type.
1294   unsigned ProcIdx;     // Processor model index or zero for any.
1295   unsigned TransVecIdx; // Index into PredTransitions::TransVec.
1296 
1297   TransVariant(Record *def, unsigned rwi, unsigned pi, unsigned ti):
1298     VarOrSeqDef(def), RWIdx(rwi), ProcIdx(pi), TransVecIdx(ti) {}
1299 };
1300 
1301 // Associate a predicate with the SchedReadWrite that it guards.
1302 // RWIdx is the index of the read/write variant.
1303 struct PredCheck {
1304   bool IsRead;
1305   unsigned RWIdx;
1306   Record *Predicate;
1307 
1308   PredCheck(bool r, unsigned w, Record *p): IsRead(r), RWIdx(w), Predicate(p) {}
1309 };
1310 
1311 // A Predicate transition is a list of RW sequences guarded by a PredTerm.
1312 struct PredTransition {
1313   // A predicate term is a conjunction of PredChecks.
1314   SmallVector<PredCheck, 4> PredTerm;
1315   SmallVector<SmallVector<unsigned,4>, 16> WriteSequences;
1316   SmallVector<SmallVector<unsigned,4>, 16> ReadSequences;
1317   SmallVector<unsigned, 4> ProcIndices;
1318 
1319   PredTransition() = default;
1320   PredTransition(ArrayRef<PredCheck> PT) {
1321     PredTerm.assign(PT.begin(), PT.end());
1322     ProcIndices.assign(1, 0);
1323   }
1324   PredTransition(ArrayRef<PredCheck> PT, ArrayRef<unsigned> PIds) {
1325     PredTerm.assign(PT.begin(), PT.end());
1326     ProcIndices.assign(PIds.begin(), PIds.end());
1327   }
1328 };
1329 
// Encapsulate a set of partially constructed transitions.
// The results are built by repeated calls to substituteVariants.
class PredTransitions {
  // The scheduling models that SchedRW and processor-model lookups go through.
  CodeGenSchedModels &SchedModels;

public:
  // The transitions built so far. getIntersectingVariants appends copies of
  // existing entries to this vector.
  std::vector<PredTransition> TransVec;

  PredTransitions(CodeGenSchedModels &sm): SchedModels(sm) {}

  // NOTE(review): defined outside this view; presumably substitutes the
  // variants found in RWSeq into the transitions starting at StartIdx -
  // confirm against the definition.
  bool substituteVariantOperand(const SmallVectorImpl<unsigned> &RWSeq,
                                bool IsRead, bool IsForAnyCPU,
                                unsigned StartIdx);

  // NOTE(review): defined outside this view; see the class comment above.
  bool substituteVariants(const PredTransition &Trans);

#ifndef NDEBUG
  void dump() const;
#endif

private:
  // Return true if PredDef is mutually exclusive with the conjunction Term.
  bool mutuallyExclusive(Record *PredDef, ArrayRef<Record *> Preds,
                         ArrayRef<PredCheck> Term);
  // Collect the variants or aliased sequences of SchedRW that are compatible
  // with the transition at TransIdx.
  void getIntersectingVariants(
    const CodeGenSchedRW &SchedRW, unsigned TransIdx,
    std::vector<TransVariant> &IntersectingVariants);
  // Push the Reads/Writes selected by VInfo onto the transition it refers to.
  void pushVariant(const TransVariant &VInfo, bool IsRead);
};
1358 
1359 } // end anonymous namespace
1360 
1361 // Return true if this predicate is mutually exclusive with a PredTerm. This
1362 // degenerates into checking if the predicate is mutually exclusive with any
1363 // predicate in the Term's conjunction.
1364 //
1365 // All predicates associated with a given SchedRW are considered mutually
1366 // exclusive. This should work even if the conditions expressed by the
1367 // predicates are not exclusive because the predicates for a given SchedWrite
1368 // are always checked in the order they are defined in the .td file. Later
1369 // conditions implicitly negate any prior condition.
1370 bool PredTransitions::mutuallyExclusive(Record *PredDef,
1371                                         ArrayRef<Record *> Preds,
1372                                         ArrayRef<PredCheck> Term) {
1373   for (const PredCheck &PC: Term) {
1374     if (PC.Predicate == PredDef)
1375       return false;
1376 
1377     const CodeGenSchedRW &SchedRW = SchedModels.getSchedRW(PC.RWIdx, PC.IsRead);
1378     assert(SchedRW.HasVariants && "PredCheck must refer to a SchedVariant");
1379     RecVec Variants = SchedRW.TheDef->getValueAsListOfDefs("Variants");
1380     if (any_of(Variants, [PredDef](const Record *R) {
1381           return R->getValueAsDef("Predicate") == PredDef;
1382         })) {
1383       // To check if PredDef is mutually exclusive with PC we also need to
1384       // check that PC.Predicate is exclusive with all predicates from variant
1385       // we're expanding. Consider following RW sequence with two variants
1386       // (1 & 2), where A, B and C are predicates from corresponding SchedVars:
1387       //
1388       // 1:A/B - 2:C/B
1389       //
1390       // Here C is not mutually exclusive with variant (1), because A doesn't
1391       // exist in variant (2). This means we have possible transitions from A
1392       // to C and from A to B, and fully expanded sequence would look like:
1393       //
1394       // if (A & C) return ...;
1395       // if (A & B) return ...;
1396       // if (B) return ...;
1397       //
1398       // Now let's consider another sequence:
1399       //
1400       // 1:A/B - 2:A/B
1401       //
1402       // Here A in variant (2) is mutually exclusive with variant (1), because
1403       // A also exists in (2). This means A->B transition is impossible and
1404       // expanded sequence would look like:
1405       //
1406       // if (A) return ...;
1407       // if (B) return ...;
1408       if (!count(Preds, PC.Predicate))
1409         continue;
1410       return true;
1411     }
1412   }
1413   return false;
1414 }
1415 
1416 static bool hasAliasedVariants(const CodeGenSchedRW &RW,
1417                                CodeGenSchedModels &SchedModels) {
1418   if (RW.HasVariants)
1419     return true;
1420 
1421   for (Record *Alias : RW.Aliases) {
1422     const CodeGenSchedRW &AliasRW =
1423         SchedModels.getSchedRW(Alias->getValueAsDef("AliasRW"));
1424     if (AliasRW.HasVariants)
1425       return true;
1426     if (AliasRW.IsSequence) {
1427       IdxVec ExpandedRWs;
1428       SchedModels.expandRWSequence(AliasRW.Index, ExpandedRWs, AliasRW.IsRead);
1429       for (unsigned SI : ExpandedRWs) {
1430         if (hasAliasedVariants(SchedModels.getSchedRW(SI, AliasRW.IsRead),
1431                                SchedModels))
1432           return true;
1433       }
1434     }
1435   }
1436   return false;
1437 }
1438 
1439 static std::vector<Record *> getAllPredicates(ArrayRef<TransVariant> Variants,
1440                                               ArrayRef<unsigned> ProcIndices) {
1441   std::vector<Record *> Preds;
1442   for (auto &Variant : Variants) {
1443     if (!Variant.VarOrSeqDef->isSubClassOf("SchedVar"))
1444       continue;
1445 
1446     if (ProcIndices[0] && Variant.ProcIdx)
1447       if (!llvm::count(ProcIndices, Variant.ProcIdx))
1448         continue;
1449 
1450     Preds.push_back(Variant.VarOrSeqDef->getValueAsDef("Predicate"));
1451   }
1452   return Preds;
1453 }
1454 
// Populate IntersectingVariants with any variants or aliased sequences of the
// given SchedRW whose processor indices and predicates are not mutually
// exclusive with the given transition.
//
// The first surviving variant reuses the transition at TransIdx; every
// further one gets a fresh copy of that transition appended to TransVec. It
// is a fatal error if the RW (or one of its aliases) is not tied to a
// processor model and yet no variant survives.
void PredTransitions::getIntersectingVariants(
  const CodeGenSchedRW &SchedRW, unsigned TransIdx,
  std::vector<TransVariant> &IntersectingVariants) {

  // Set when the RW's own variants, or any alias, are not bound to a
  // specific processor model.
  bool GenericRW = false;

  // Step 1: gather candidate variants from the RW itself.
  std::vector<TransVariant> Variants;
  if (SchedRW.HasVariants) {
    unsigned VarProcIdx = 0;
    if (SchedRW.TheDef->getValueInit("SchedModel")->isComplete()) {
      Record *ModelDef = SchedRW.TheDef->getValueAsDef("SchedModel");
      VarProcIdx = SchedModels.getProcModel(ModelDef).Index;
    }
    // Push each variant. Assign TransVecIdx later.
    const RecVec VarDefs = SchedRW.TheDef->getValueAsListOfDefs("Variants");
    for (Record *VarDef : VarDefs)
      Variants.emplace_back(VarDef, SchedRW.Index, VarProcIdx, 0);
    if (VarProcIdx == 0)
      GenericRW = true;
  }
  // Step 2: gather candidates reachable through the RW's aliases.
  for (RecIter AI = SchedRW.Aliases.begin(), AE = SchedRW.Aliases.end();
       AI != AE; ++AI) {
    // If either the SchedAlias itself or the SchedReadWrite that it aliases
    // to is defined within a processor model, constrain all variants to
    // that processor.
    unsigned AliasProcIdx = 0;
    if ((*AI)->getValueInit("SchedModel")->isComplete()) {
      Record *ModelDef = (*AI)->getValueAsDef("SchedModel");
      AliasProcIdx = SchedModels.getProcModel(ModelDef).Index;
    }
    const CodeGenSchedRW &AliasRW =
      SchedModels.getSchedRW((*AI)->getValueAsDef("AliasRW"));

    if (AliasRW.HasVariants) {
      const RecVec VarDefs = AliasRW.TheDef->getValueAsListOfDefs("Variants");
      for (Record *VD : VarDefs)
        Variants.emplace_back(VD, AliasRW.Index, AliasProcIdx, 0);
    }
    // An aliased sequence is recorded as a single candidate. Note that it is
    // tagged with SchedRW.Index, not AliasRW.Index.
    if (AliasRW.IsSequence)
      Variants.emplace_back(AliasRW.TheDef, SchedRW.Index, AliasProcIdx, 0);
    if (AliasProcIdx == 0)
      GenericRW = true;
  }
  // Step 3: filter the candidates against the transition at TransIdx.
  std::vector<Record *> AllPreds =
      getAllPredicates(Variants, TransVec[TransIdx].ProcIndices);
  for (TransVariant &Variant : Variants) {
    // Don't expand variants if the processor models don't intersect.
    // A zero processor index means any processor.
    // NOTE: TransVec can grow at the bottom of this loop; this reference is
    // taken afresh on every iteration rather than hoisted out of the loop.
    SmallVectorImpl<unsigned> &ProcIndices = TransVec[TransIdx].ProcIndices;
    if (ProcIndices[0] && Variant.ProcIdx) {
      unsigned Cnt = std::count(ProcIndices.begin(), ProcIndices.end(),
                                Variant.ProcIdx);
      if (!Cnt)
        continue;
      if (Cnt > 1) {
        const CodeGenProcModel &PM =
          *(SchedModels.procModelBegin() + Variant.ProcIdx);
        PrintFatalError(Variant.VarOrSeqDef->getLoc(),
                        "Multiple variants defined for processor " +
                        PM.ModelName +
                        " Ensure only one SchedAlias exists per RW.");
      }
    }
    // Only SchedVar candidates carry a predicate to test; aliased sequences
    // skip this check.
    if (Variant.VarOrSeqDef->isSubClassOf("SchedVar")) {
      Record *PredDef = Variant.VarOrSeqDef->getValueAsDef("Predicate");
      if (mutuallyExclusive(PredDef, AllPreds, TransVec[TransIdx].PredTerm))
        continue;
    }

    if (IntersectingVariants.empty()) {
      // The first variant builds on the existing transition.
      Variant.TransVecIdx = TransIdx;
      IntersectingVariants.push_back(Variant);
    }
    else {
      // Push another copy of the current transition for more variants.
      Variant.TransVecIdx = TransVec.size();
      IntersectingVariants.push_back(Variant);
      TransVec.push_back(TransVec[TransIdx]);
    }
  }
  if (GenericRW && IntersectingVariants.empty()) {
    PrintFatalError(SchedRW.TheDef->getLoc(), "No variant of this type has "
                    "a matching predicate on any processor");
  }
}
1544 
1545 // Push the Reads/Writes selected by this variant onto the PredTransition
1546 // specified by VInfo.
1547 void PredTransitions::
1548 pushVariant(const TransVariant &VInfo, bool IsRead) {
1549   PredTransition &Trans = TransVec[VInfo.TransVecIdx];
1550 
1551   // If this operand transition is reached through a processor-specific alias,
1552   // then the whole transition is specific to this processor.
1553   if (VInfo.ProcIdx != 0)
1554     Trans.ProcIndices.assign(1, VInfo.ProcIdx);
1555 
1556   IdxVec SelectedRWs;
1557   if (VInfo.VarOrSeqDef->isSubClassOf("SchedVar")) {
1558     Record *PredDef = VInfo.VarOrSeqDef->getValueAsDef("Predicate");
1559     Trans.PredTerm.emplace_back(IsRead, VInfo.RWIdx,PredDef);
1560     RecVec SelectedDefs = VInfo.VarOrSeqDef->getValueAsListOfDefs("Selected");
1561     SchedModels.findRWs(SelectedDefs, SelectedRWs, IsRead);
1562   }
1563   else {
1564     assert(VInfo.VarOrSeqDef->isSubClassOf("WriteSequence") &&
1565            "variant must be a SchedVariant or aliased WriteSequence");
1566     SelectedRWs.push_back(SchedModels.getSchedRWIdx(VInfo.VarOrSeqDef, IsRead));
1567   }
1568 
1569   const CodeGenSchedRW &SchedRW = SchedModels.getSchedRW(VInfo.RWIdx, IsRead);
1570 
1571   SmallVectorImpl<SmallVector<unsigned,4>> &RWSequences = IsRead
1572     ? Trans.ReadSequences : Trans.WriteSequences;
1573   if (SchedRW.IsVariadic) {
1574     unsigned OperIdx = RWSequences.size()-1;
1575     // Make N-1 copies of this transition's last sequence.
1576     RWSequences.reserve(RWSequences.size() + SelectedRWs.size() - 1);
1577     RWSequences.insert(RWSequences.end(), SelectedRWs.size() - 1,
1578                        RWSequences[OperIdx]);
1579     // Push each of the N elements of the SelectedRWs onto a copy of the last
1580     // sequence (split the current operand into N operands).
1581     // Note that write sequences should be expanded within this loop--the entire
1582     // sequence belongs to a single operand.
1583     for (IdxIter RWI = SelectedRWs.begin(), RWE = SelectedRWs.end();
1584          RWI != RWE; ++RWI, ++OperIdx) {
1585       IdxVec ExpandedRWs;
1586       if (IsRead)
1587         ExpandedRWs.push_back(*RWI);
1588       else
1589         SchedModels.expandRWSequence(*RWI, ExpandedRWs, IsRead);
1590       RWSequences[OperIdx].insert(RWSequences[OperIdx].end(),
1591                                   ExpandedRWs.begin(), ExpandedRWs.end());
1592     }
1593     assert(OperIdx == RWSequences.size() && "missed a sequence");
1594   }
1595   else {
1596     // Push this transition's expanded sequence onto this transition's last
1597     // sequence (add to the current operand's sequence).
1598     SmallVectorImpl<unsigned> &Seq = RWSequences.back();
1599     IdxVec ExpandedRWs;
1600     for (IdxIter RWI = SelectedRWs.begin(), RWE = SelectedRWs.end();
1601          RWI != RWE; ++RWI) {
1602       if (IsRead)
1603         ExpandedRWs.push_back(*RWI);
1604       else
1605         SchedModels.expandRWSequence(*RWI, ExpandedRWs, IsRead);
1606     }
1607     Seq.insert(Seq.end(), ExpandedRWs.begin(), ExpandedRWs.end());
1608   }
1609 }
1610 
1611 // RWSeq is a sequence of all Reads or all Writes for the next read or write
1612 // operand. StartIdx is an index into TransVec where partial results
1613 // starts. RWSeq must be applied to all transitions between StartIdx and the end
1614 // of TransVec.
1615 bool PredTransitions::substituteVariantOperand(
1616     const SmallVectorImpl<unsigned> &RWSeq, bool IsRead, bool IsForAnyCPU,
1617     unsigned StartIdx) {
1618 
1619   auto CollectAndAddVariants = [&](unsigned TransIdx,
1620                                    const CodeGenSchedRW &SchedRW) {
1621     // Distribute this partial PredTransition across intersecting variants.
1622     // This will push a copies of TransVec[TransIdx] on the back of TransVec.
1623     std::vector<TransVariant> IntersectingVariants;
1624     getIntersectingVariants(SchedRW, TransIdx, IntersectingVariants);
1625     // Now expand each variant on top of its copy of the transition.
1626     for (const TransVariant &IV : IntersectingVariants)
1627       pushVariant(IV, IsRead);
1628     return !IntersectingVariants.empty();
1629   };
1630 
1631   bool Subst = false;
1632   // Visit each original RW within the current sequence.
1633   for (SmallVectorImpl<unsigned>::const_iterator
1634          RWI = RWSeq.begin(), RWE = RWSeq.end(); RWI != RWE; ++RWI) {
1635     const CodeGenSchedRW &SchedRW = SchedModels.getSchedRW(*RWI, IsRead);
1636     // Push this RW on all partial PredTransitions or distribute variants.
1637     // New PredTransitions may be pushed within this loop which should not be
1638     // revisited (TransEnd must be loop invariant).
1639     bool HasAliases = false, WasPushed = false;
1640     for (unsigned TransIdx = StartIdx, TransEnd = TransVec.size();
1641          TransIdx != TransEnd; ++TransIdx) {
1642       // In the common case, push RW onto the current operand's sequence.
1643       if (!hasAliasedVariants(SchedRW, SchedModels)) {
1644         if (IsRead)
1645           TransVec[TransIdx].ReadSequences.back().push_back(*RWI);
1646         else
1647           TransVec[TransIdx].WriteSequences.back().push_back(*RWI);
1648         continue;
1649       }
1650       HasAliases = true;
1651       WasPushed |= CollectAndAddVariants(TransIdx, SchedRW);
1652       Subst |= WasPushed;
1653     }
1654     if (IsRead && IsForAnyCPU && HasAliases && !WasPushed) {
1655       // If we're here this means that in some sched class:
1656       // a) We have read variant for CPU A
1657       // b) We have write variant for CPU B
1658       // b) We don't have write variant for CPU A
1659       // d) We must expand all read/write variants (IsForAnyCPU is true)
1660       // e) We couldn't expand SchedRW because TransVec doesn't have
1661       //    any transition with compatible CPU ID.
1662       // In such case we create new empty transition with zero (AnyCPU)
1663       // index.
1664       TransVec.reserve(TransVec.size() + 1);
1665       TransVec.emplace_back(TransVec[StartIdx].PredTerm);
1666       TransVec.back().ReadSequences.emplace_back();
1667       Subst |= CollectAndAddVariants(TransVec.size() - 1, SchedRW);
1668     }
1669   }
1670   return Subst;
1671 }
1672 
1673 // For each variant of a Read/Write in Trans, substitute the sequence of
1674 // Read/Writes guarded by the variant. This is exponential in the number of
1675 // variant Read/Writes, but in practice detection of mutually exclusive
1676 // predicates should result in linear growth in the total number variants.
1677 //
1678 // This is one step in a breadth-first search of nested variants.
1679 bool PredTransitions::substituteVariants(const PredTransition &Trans) {
1680   // Build up a set of partial results starting at the back of
1681   // PredTransitions. Remember the first new transition.
1682   unsigned StartIdx = TransVec.size();
1683   bool Subst = false;
1684   TransVec.emplace_back(Trans.PredTerm, Trans.ProcIndices);
1685 
1686   bool IsForAnyCPU = llvm::count(Trans.ProcIndices, 0);
1687   // Visit each original write sequence.
1688   for (SmallVectorImpl<SmallVector<unsigned,4>>::const_iterator
1689          WSI = Trans.WriteSequences.begin(), WSE = Trans.WriteSequences.end();
1690        WSI != WSE; ++WSI) {
1691     // Push a new (empty) write sequence onto all partial Transitions.
1692     for (std::vector<PredTransition>::iterator I =
1693            TransVec.begin() + StartIdx, E = TransVec.end(); I != E; ++I) {
1694       I->WriteSequences.emplace_back();
1695     }
1696     Subst |=
1697         substituteVariantOperand(*WSI, /*IsRead=*/false, IsForAnyCPU, StartIdx);
1698   }
1699   // Visit each original read sequence.
1700   for (SmallVectorImpl<SmallVector<unsigned,4>>::const_iterator
1701          RSI = Trans.ReadSequences.begin(), RSE = Trans.ReadSequences.end();
1702        RSI != RSE; ++RSI) {
1703     // Push a new (empty) read sequence onto all partial Transitions.
1704     for (std::vector<PredTransition>::iterator I =
1705            TransVec.begin() + StartIdx, E = TransVec.end(); I != E; ++I) {
1706       I->ReadSequences.emplace_back();
1707     }
1708     Subst |=
1709         substituteVariantOperand(*RSI, /*IsRead=*/true, IsForAnyCPU, StartIdx);
1710   }
1711   return Subst;
1712 }
1713 
1714 static void addSequences(CodeGenSchedModels &SchedModels,
1715                          const SmallVectorImpl<SmallVector<unsigned, 4>> &Seqs,
1716                          IdxVec &Result, bool IsRead) {
1717   for (const auto &S : Seqs)
1718     if (!S.empty())
1719       Result.push_back(SchedModels.findOrInsertRW(S, IsRead));
1720 }
1721 
1722 #ifndef NDEBUG
1723 static void dumpRecVec(const RecVec &RV) {
1724   for (const Record *R : RV)
1725     dbgs() << R->getName() << ", ";
1726 }
1727 #endif
1728 
1729 static void dumpTransition(const CodeGenSchedModels &SchedModels,
1730                            const CodeGenSchedClass &FromSC,
1731                            const CodeGenSchedTransition &SCTrans,
1732                            const RecVec &Preds) {
1733   LLVM_DEBUG(dbgs() << "Adding transition from " << FromSC.Name << "("
1734                     << FromSC.Index << ") to "
1735                     << SchedModels.getSchedClass(SCTrans.ToClassIdx).Name << "("
1736                     << SCTrans.ToClassIdx << ") on pred term: (";
1737              dumpRecVec(Preds); dbgs() << ") on processor indices: (";
1738              dumpIdxVec(SCTrans.ProcIndices); dbgs() << ")\n");
1739 }
1740 // Create a new SchedClass for each variant found by inferFromRW. Pass
1741 static void inferFromTransitions(ArrayRef<PredTransition> LastTransitions,
1742                                  unsigned FromClassIdx,
1743                                  CodeGenSchedModels &SchedModels) {
1744   // For each PredTransition, create a new CodeGenSchedTransition, which usually
1745   // requires creating a new SchedClass.
1746   for (ArrayRef<PredTransition>::iterator
1747          I = LastTransitions.begin(), E = LastTransitions.end(); I != E; ++I) {
1748     IdxVec OperWritesVariant, OperReadsVariant;
1749     addSequences(SchedModels, I->WriteSequences, OperWritesVariant, false);
1750     addSequences(SchedModels, I->ReadSequences, OperReadsVariant, true);
1751     CodeGenSchedTransition SCTrans;
1752 
1753     // Transition should not contain processor indices already assigned to
1754     // InstRWs in this scheduling class.
1755     const CodeGenSchedClass &FromSC = SchedModels.getSchedClass(FromClassIdx);
1756     llvm::copy_if(I->ProcIndices, std::back_inserter(SCTrans.ProcIndices),
1757                   [&FromSC](unsigned PIdx) {
1758                     return !FromSC.InstRWProcIndices.count(PIdx);
1759                   });
1760     if (SCTrans.ProcIndices.empty())
1761       continue;
1762     SCTrans.ToClassIdx =
1763         SchedModels.addSchedClass(/*ItinClassDef=*/nullptr, OperWritesVariant,
1764                                   OperReadsVariant, I->ProcIndices);
1765 
1766     // The final PredTerm is unique set of predicates guarding the transition.
1767     RecVec Preds;
1768     transform(I->PredTerm, std::back_inserter(Preds),
1769               [](const PredCheck &P) {
1770                 return P.Predicate;
1771               });
1772     Preds.erase(std::unique(Preds.begin(), Preds.end()), Preds.end());
1773     dumpTransition(SchedModels, FromSC, SCTrans, Preds);
1774     SCTrans.PredTerm = std::move(Preds);
1775     SchedModels.getSchedClass(FromClassIdx)
1776         .Transitions.push_back(std::move(SCTrans));
1777   }
1778 }
1779 
1780 // Create new SchedClasses for the given ReadWrite list. If any of the
1781 // ReadWrites refers to a SchedVariant, create a new SchedClass for each variant
1782 // of the ReadWrite list, following Aliases if necessary.
1783 void CodeGenSchedModels::inferFromRW(ArrayRef<unsigned> OperWrites,
1784                                      ArrayRef<unsigned> OperReads,
1785                                      unsigned FromClassIdx,
1786                                      ArrayRef<unsigned> ProcIndices) {
1787   LLVM_DEBUG(dbgs() << "INFER RW proc("; dumpIdxVec(ProcIndices);
1788              dbgs() << ") ");
1789   // Create a seed transition with an empty PredTerm and the expanded sequences
1790   // of SchedWrites for the current SchedClass.
1791   std::vector<PredTransition> LastTransitions;
1792   LastTransitions.emplace_back();
1793   LastTransitions.back().ProcIndices.append(ProcIndices.begin(),
1794                                             ProcIndices.end());
1795 
1796   for (unsigned WriteIdx : OperWrites) {
1797     IdxVec WriteSeq;
1798     expandRWSequence(WriteIdx, WriteSeq, /*IsRead=*/false);
1799     LastTransitions[0].WriteSequences.emplace_back();
1800     SmallVectorImpl<unsigned> &Seq = LastTransitions[0].WriteSequences.back();
1801     Seq.append(WriteSeq.begin(), WriteSeq.end());
1802     LLVM_DEBUG(dbgs() << "("; dumpIdxVec(Seq); dbgs() << ") ");
1803   }
1804   LLVM_DEBUG(dbgs() << " Reads: ");
1805   for (unsigned ReadIdx : OperReads) {
1806     IdxVec ReadSeq;
1807     expandRWSequence(ReadIdx, ReadSeq, /*IsRead=*/true);
1808     LastTransitions[0].ReadSequences.emplace_back();
1809     SmallVectorImpl<unsigned> &Seq = LastTransitions[0].ReadSequences.back();
1810     Seq.append(ReadSeq.begin(), ReadSeq.end());
1811     LLVM_DEBUG(dbgs() << "("; dumpIdxVec(Seq); dbgs() << ") ");
1812   }
1813   LLVM_DEBUG(dbgs() << '\n');
1814 
1815   // Collect all PredTransitions for individual operands.
1816   // Iterate until no variant writes remain.
1817   bool SubstitutedAny;
1818   do {
1819     SubstitutedAny = false;
1820     PredTransitions Transitions(*this);
1821     for (const PredTransition &Trans : LastTransitions)
1822       SubstitutedAny |= Transitions.substituteVariants(Trans);
1823     LLVM_DEBUG(Transitions.dump());
1824     LastTransitions.swap(Transitions.TransVec);
1825   } while (SubstitutedAny);
1826   // If the first transition has no variants, nothing to do.
1827   if (LastTransitions[0].PredTerm.empty())
1828     return;
1829 
1830   // WARNING: We are about to mutate the SchedClasses vector. Do not refer to
1831   // OperWrites, OperReads, or ProcIndices after calling inferFromTransitions.
1832   inferFromTransitions(LastTransitions, FromClassIdx, *this);
1833 }
1834 
1835 // Check if any processor resource group contains all resource records in
1836 // SubUnits.
1837 bool CodeGenSchedModels::hasSuperGroup(RecVec &SubUnits, CodeGenProcModel &PM) {
1838   for (unsigned i = 0, e = PM.ProcResourceDefs.size(); i < e; ++i) {
1839     if (!PM.ProcResourceDefs[i]->isSubClassOf("ProcResGroup"))
1840       continue;
1841     RecVec SuperUnits =
1842       PM.ProcResourceDefs[i]->getValueAsListOfDefs("Resources");
1843     RecIter RI = SubUnits.begin(), RE = SubUnits.end();
1844     for ( ; RI != RE; ++RI) {
1845       if (!is_contained(SuperUnits, *RI)) {
1846         break;
1847       }
1848     }
1849     if (RI == RE)
1850       return true;
1851   }
1852   return false;
1853 }
1854 
1855 // Verify that overlapping groups have a common supergroup.
1856 void CodeGenSchedModels::verifyProcResourceGroups(CodeGenProcModel &PM) {
1857   for (unsigned i = 0, e = PM.ProcResourceDefs.size(); i < e; ++i) {
1858     if (!PM.ProcResourceDefs[i]->isSubClassOf("ProcResGroup"))
1859       continue;
1860     RecVec CheckUnits =
1861       PM.ProcResourceDefs[i]->getValueAsListOfDefs("Resources");
1862     for (unsigned j = i+1; j < e; ++j) {
1863       if (!PM.ProcResourceDefs[j]->isSubClassOf("ProcResGroup"))
1864         continue;
1865       RecVec OtherUnits =
1866         PM.ProcResourceDefs[j]->getValueAsListOfDefs("Resources");
1867       if (std::find_first_of(CheckUnits.begin(), CheckUnits.end(),
1868                              OtherUnits.begin(), OtherUnits.end())
1869           != CheckUnits.end()) {
1870         // CheckUnits and OtherUnits overlap
1871         OtherUnits.insert(OtherUnits.end(), CheckUnits.begin(),
1872                           CheckUnits.end());
1873         if (!hasSuperGroup(OtherUnits, PM)) {
1874           PrintFatalError((PM.ProcResourceDefs[i])->getLoc(),
1875                           "proc resource group overlaps with "
1876                           + PM.ProcResourceDefs[j]->getName()
1877                           + " but no supergroup contains both.");
1878         }
1879       }
1880     }
1881   }
1882 }
1883 
1884 // Collect all the RegisterFile definitions available in this target.
1885 void CodeGenSchedModels::collectRegisterFiles() {
1886   RecVec RegisterFileDefs = Records.getAllDerivedDefinitions("RegisterFile");
1887 
1888   // RegisterFiles is the vector of CodeGenRegisterFile.
1889   for (Record *RF : RegisterFileDefs) {
1890     // For each register file definition, construct a CodeGenRegisterFile object
1891     // and add it to the appropriate scheduling model.
1892     CodeGenProcModel &PM = getProcModel(RF->getValueAsDef("SchedModel"));
1893     PM.RegisterFiles.emplace_back(CodeGenRegisterFile(RF->getName(),RF));
1894     CodeGenRegisterFile &CGRF = PM.RegisterFiles.back();
1895     CGRF.MaxMovesEliminatedPerCycle =
1896         RF->getValueAsInt("MaxMovesEliminatedPerCycle");
1897     CGRF.AllowZeroMoveEliminationOnly =
1898         RF->getValueAsBit("AllowZeroMoveEliminationOnly");
1899 
1900     // Now set the number of physical registers as well as the cost of registers
1901     // in each register class.
1902     CGRF.NumPhysRegs = RF->getValueAsInt("NumPhysRegs");
1903     if (!CGRF.NumPhysRegs) {
1904       PrintFatalError(RF->getLoc(),
1905                       "Invalid RegisterFile with zero physical registers");
1906     }
1907 
1908     RecVec RegisterClasses = RF->getValueAsListOfDefs("RegClasses");
1909     std::vector<int64_t> RegisterCosts = RF->getValueAsListOfInts("RegCosts");
1910     ListInit *MoveElimInfo = RF->getValueAsListInit("AllowMoveElimination");
1911     for (unsigned I = 0, E = RegisterClasses.size(); I < E; ++I) {
1912       int Cost = RegisterCosts.size() > I ? RegisterCosts[I] : 1;
1913 
1914       bool AllowMoveElim = false;
1915       if (MoveElimInfo->size() > I) {
1916         BitInit *Val = cast<BitInit>(MoveElimInfo->getElement(I));
1917         AllowMoveElim = Val->getValue();
1918       }
1919 
1920       CGRF.Costs.emplace_back(RegisterClasses[I], Cost, AllowMoveElim);
1921     }
1922   }
1923 }
1924 
1925 // Collect and sort WriteRes, ReadAdvance, and ProcResources.
1926 void CodeGenSchedModels::collectProcResources() {
1927   ProcResourceDefs = Records.getAllDerivedDefinitions("ProcResourceUnits");
1928   ProcResGroups = Records.getAllDerivedDefinitions("ProcResGroup");
1929 
1930   // Add any subtarget-specific SchedReadWrites that are directly associated
1931   // with processor resources. Refer to the parent SchedClass's ProcIndices to
1932   // determine which processors they apply to.
1933   for (const CodeGenSchedClass &SC :
1934        make_range(schedClassBegin(), schedClassEnd())) {
1935     if (SC.ItinClassDef) {
1936       collectItinProcResources(SC.ItinClassDef);
1937       continue;
1938     }
1939 
1940     // This class may have a default ReadWrite list which can be overriden by
1941     // InstRW definitions.
1942     for (Record *RW : SC.InstRWs) {
1943       Record *RWModelDef = RW->getValueAsDef("SchedModel");
1944       unsigned PIdx = getProcModel(RWModelDef).Index;
1945       IdxVec Writes, Reads;
1946       findRWs(RW->getValueAsListOfDefs("OperandReadWrites"), Writes, Reads);
1947       collectRWResources(Writes, Reads, PIdx);
1948     }
1949 
1950     collectRWResources(SC.Writes, SC.Reads, SC.ProcIndices);
1951   }
1952   // Add resources separately defined by each subtarget.
1953   RecVec WRDefs = Records.getAllDerivedDefinitions("WriteRes");
1954   for (Record *WR : WRDefs) {
1955     Record *ModelDef = WR->getValueAsDef("SchedModel");
1956     addWriteRes(WR, getProcModel(ModelDef).Index);
1957   }
1958   RecVec SWRDefs = Records.getAllDerivedDefinitions("SchedWriteRes");
1959   for (Record *SWR : SWRDefs) {
1960     Record *ModelDef = SWR->getValueAsDef("SchedModel");
1961     addWriteRes(SWR, getProcModel(ModelDef).Index);
1962   }
1963   RecVec RADefs = Records.getAllDerivedDefinitions("ReadAdvance");
1964   for (Record *RA : RADefs) {
1965     Record *ModelDef = RA->getValueAsDef("SchedModel");
1966     addReadAdvance(RA, getProcModel(ModelDef).Index);
1967   }
1968   RecVec SRADefs = Records.getAllDerivedDefinitions("SchedReadAdvance");
1969   for (Record *SRA : SRADefs) {
1970     if (SRA->getValueInit("SchedModel")->isComplete()) {
1971       Record *ModelDef = SRA->getValueAsDef("SchedModel");
1972       addReadAdvance(SRA, getProcModel(ModelDef).Index);
1973     }
1974   }
1975   // Add ProcResGroups that are defined within this processor model, which may
1976   // not be directly referenced but may directly specify a buffer size.
1977   RecVec ProcResGroups = Records.getAllDerivedDefinitions("ProcResGroup");
1978   for (Record *PRG : ProcResGroups) {
1979     if (!PRG->getValueInit("SchedModel")->isComplete())
1980       continue;
1981     CodeGenProcModel &PM = getProcModel(PRG->getValueAsDef("SchedModel"));
1982     if (!is_contained(PM.ProcResourceDefs, PRG))
1983       PM.ProcResourceDefs.push_back(PRG);
1984   }
1985   // Add ProcResourceUnits unconditionally.
1986   for (Record *PRU : Records.getAllDerivedDefinitions("ProcResourceUnits")) {
1987     if (!PRU->getValueInit("SchedModel")->isComplete())
1988       continue;
1989     CodeGenProcModel &PM = getProcModel(PRU->getValueAsDef("SchedModel"));
1990     if (!is_contained(PM.ProcResourceDefs, PRU))
1991       PM.ProcResourceDefs.push_back(PRU);
1992   }
1993   // Finalize each ProcModel by sorting the record arrays.
1994   for (CodeGenProcModel &PM : ProcModels) {
1995     llvm::sort(PM.WriteResDefs, LessRecord());
1996     llvm::sort(PM.ReadAdvanceDefs, LessRecord());
1997     llvm::sort(PM.ProcResourceDefs, LessRecord());
1998     LLVM_DEBUG(
1999         PM.dump();
2000         dbgs() << "WriteResDefs: "; for (RecIter RI = PM.WriteResDefs.begin(),
2001                                          RE = PM.WriteResDefs.end();
2002                                          RI != RE; ++RI) {
2003           if ((*RI)->isSubClassOf("WriteRes"))
2004             dbgs() << (*RI)->getValueAsDef("WriteType")->getName() << " ";
2005           else
2006             dbgs() << (*RI)->getName() << " ";
2007         } dbgs() << "\nReadAdvanceDefs: ";
2008         for (RecIter RI = PM.ReadAdvanceDefs.begin(),
2009              RE = PM.ReadAdvanceDefs.end();
2010              RI != RE; ++RI) {
2011           if ((*RI)->isSubClassOf("ReadAdvance"))
2012             dbgs() << (*RI)->getValueAsDef("ReadType")->getName() << " ";
2013           else
2014             dbgs() << (*RI)->getName() << " ";
2015         } dbgs()
2016         << "\nProcResourceDefs: ";
2017         for (RecIter RI = PM.ProcResourceDefs.begin(),
2018              RE = PM.ProcResourceDefs.end();
2019              RI != RE; ++RI) { dbgs() << (*RI)->getName() << " "; } dbgs()
2020         << '\n');
2021     verifyProcResourceGroups(PM);
2022   }
2023 
2024   ProcResourceDefs.clear();
2025   ProcResGroups.clear();
2026 }
2027 
2028 void CodeGenSchedModels::checkCompleteness() {
2029   bool Complete = true;
2030   bool HadCompleteModel = false;
2031   for (const CodeGenProcModel &ProcModel : procModels()) {
2032     const bool HasItineraries = ProcModel.hasItineraries();
2033     if (!ProcModel.ModelDef->getValueAsBit("CompleteModel"))
2034       continue;
2035     for (const CodeGenInstruction *Inst : Target.getInstructionsByEnumValue()) {
2036       if (Inst->hasNoSchedulingInfo)
2037         continue;
2038       if (ProcModel.isUnsupported(*Inst))
2039         continue;
2040       unsigned SCIdx = getSchedClassIdx(*Inst);
2041       if (!SCIdx) {
2042         if (Inst->TheDef->isValueUnset("SchedRW") && !HadCompleteModel) {
2043           PrintError(Inst->TheDef->getLoc(),
2044                      "No schedule information for instruction '" +
2045                          Inst->TheDef->getName() + "' in SchedMachineModel '" +
2046                      ProcModel.ModelDef->getName() + "'");
2047           Complete = false;
2048         }
2049         continue;
2050       }
2051 
2052       const CodeGenSchedClass &SC = getSchedClass(SCIdx);
2053       if (!SC.Writes.empty())
2054         continue;
2055       if (HasItineraries && SC.ItinClassDef != nullptr &&
2056           SC.ItinClassDef->getName() != "NoItinerary")
2057         continue;
2058 
2059       const RecVec &InstRWs = SC.InstRWs;
2060       auto I = find_if(InstRWs, [&ProcModel](const Record *R) {
2061         return R->getValueAsDef("SchedModel") == ProcModel.ModelDef;
2062       });
2063       if (I == InstRWs.end()) {
2064         PrintError(Inst->TheDef->getLoc(), "'" + ProcModel.ModelName +
2065                                                "' lacks information for '" +
2066                                                Inst->TheDef->getName() + "'");
2067         Complete = false;
2068       }
2069     }
2070     HadCompleteModel = true;
2071   }
2072   if (!Complete) {
2073     errs() << "\n\nIncomplete schedule models found.\n"
2074       << "- Consider setting 'CompleteModel = 0' while developing new models.\n"
2075       << "- Pseudo instructions can be marked with 'hasNoSchedulingInfo = 1'.\n"
2076       << "- Instructions should usually have Sched<[...]> as a superclass, "
2077          "you may temporarily use an empty list.\n"
2078       << "- Instructions related to unsupported features can be excluded with "
2079          "list<Predicate> UnsupportedFeatures = [HasA,..,HasY]; in the "
2080          "processor model.\n\n";
2081     PrintFatalError("Incomplete schedule model");
2082   }
2083 }
2084 
2085 // Collect itinerary class resources for each processor.
2086 void CodeGenSchedModels::collectItinProcResources(Record *ItinClassDef) {
2087   for (unsigned PIdx = 0, PEnd = ProcModels.size(); PIdx != PEnd; ++PIdx) {
2088     const CodeGenProcModel &PM = ProcModels[PIdx];
2089     // For all ItinRW entries.
2090     bool HasMatch = false;
2091     for (RecIter II = PM.ItinRWDefs.begin(), IE = PM.ItinRWDefs.end();
2092          II != IE; ++II) {
2093       RecVec Matched = (*II)->getValueAsListOfDefs("MatchedItinClasses");
2094       if (!std::count(Matched.begin(), Matched.end(), ItinClassDef))
2095         continue;
2096       if (HasMatch)
2097         PrintFatalError((*II)->getLoc(), "Duplicate itinerary class "
2098                         + ItinClassDef->getName()
2099                         + " in ItinResources for " + PM.ModelName);
2100       HasMatch = true;
2101       IdxVec Writes, Reads;
2102       findRWs((*II)->getValueAsListOfDefs("OperandReadWrites"), Writes, Reads);
2103       collectRWResources(Writes, Reads, PIdx);
2104     }
2105   }
2106 }
2107 
2108 void CodeGenSchedModels::collectRWResources(unsigned RWIdx, bool IsRead,
2109                                             ArrayRef<unsigned> ProcIndices) {
2110   const CodeGenSchedRW &SchedRW = getSchedRW(RWIdx, IsRead);
2111   if (SchedRW.TheDef) {
2112     if (!IsRead && SchedRW.TheDef->isSubClassOf("SchedWriteRes")) {
2113       for (unsigned Idx : ProcIndices)
2114         addWriteRes(SchedRW.TheDef, Idx);
2115     }
2116     else if (IsRead && SchedRW.TheDef->isSubClassOf("SchedReadAdvance")) {
2117       for (unsigned Idx : ProcIndices)
2118         addReadAdvance(SchedRW.TheDef, Idx);
2119     }
2120   }
2121   for (RecIter AI = SchedRW.Aliases.begin(), AE = SchedRW.Aliases.end();
2122        AI != AE; ++AI) {
2123     IdxVec AliasProcIndices;
2124     if ((*AI)->getValueInit("SchedModel")->isComplete()) {
2125       AliasProcIndices.push_back(
2126         getProcModel((*AI)->getValueAsDef("SchedModel")).Index);
2127     }
2128     else
2129       AliasProcIndices = ProcIndices;
2130     const CodeGenSchedRW &AliasRW = getSchedRW((*AI)->getValueAsDef("AliasRW"));
2131     assert(AliasRW.IsRead == IsRead && "cannot alias reads to writes");
2132 
2133     IdxVec ExpandedRWs;
2134     expandRWSequence(AliasRW.Index, ExpandedRWs, IsRead);
2135     for (IdxIter SI = ExpandedRWs.begin(), SE = ExpandedRWs.end();
2136          SI != SE; ++SI) {
2137       collectRWResources(*SI, IsRead, AliasProcIndices);
2138     }
2139   }
2140 }
2141 
2142 // Collect resources for a set of read/write types and processor indices.
2143 void CodeGenSchedModels::collectRWResources(ArrayRef<unsigned> Writes,
2144                                             ArrayRef<unsigned> Reads,
2145                                             ArrayRef<unsigned> ProcIndices) {
2146   for (unsigned Idx : Writes)
2147     collectRWResources(Idx, /*IsRead=*/false, ProcIndices);
2148 
2149   for (unsigned Idx : Reads)
2150     collectRWResources(Idx, /*IsRead=*/true, ProcIndices);
2151 }
2152 
2153 // Find the processor's resource units for this kind of resource.
2154 Record *CodeGenSchedModels::findProcResUnits(Record *ProcResKind,
2155                                              const CodeGenProcModel &PM,
2156                                              ArrayRef<SMLoc> Loc) const {
2157   if (ProcResKind->isSubClassOf("ProcResourceUnits"))
2158     return ProcResKind;
2159 
2160   Record *ProcUnitDef = nullptr;
2161   assert(!ProcResourceDefs.empty());
2162   assert(!ProcResGroups.empty());
2163 
2164   for (Record *ProcResDef : ProcResourceDefs) {
2165     if (ProcResDef->getValueAsDef("Kind") == ProcResKind
2166         && ProcResDef->getValueAsDef("SchedModel") == PM.ModelDef) {
2167       if (ProcUnitDef) {
2168         PrintFatalError(Loc,
2169                         "Multiple ProcessorResourceUnits associated with "
2170                         + ProcResKind->getName());
2171       }
2172       ProcUnitDef = ProcResDef;
2173     }
2174   }
2175   for (Record *ProcResGroup : ProcResGroups) {
2176     if (ProcResGroup == ProcResKind
2177         && ProcResGroup->getValueAsDef("SchedModel") == PM.ModelDef) {
2178       if (ProcUnitDef) {
2179         PrintFatalError(Loc,
2180                         "Multiple ProcessorResourceUnits associated with "
2181                         + ProcResKind->getName());
2182       }
2183       ProcUnitDef = ProcResGroup;
2184     }
2185   }
2186   if (!ProcUnitDef) {
2187     PrintFatalError(Loc,
2188                     "No ProcessorResources associated with "
2189                     + ProcResKind->getName());
2190   }
2191   return ProcUnitDef;
2192 }
2193 
2194 // Iteratively add a resource and its super resources.
2195 void CodeGenSchedModels::addProcResource(Record *ProcResKind,
2196                                          CodeGenProcModel &PM,
2197                                          ArrayRef<SMLoc> Loc) {
2198   while (true) {
2199     Record *ProcResUnits = findProcResUnits(ProcResKind, PM, Loc);
2200 
2201     // See if this ProcResource is already associated with this processor.
2202     if (is_contained(PM.ProcResourceDefs, ProcResUnits))
2203       return;
2204 
2205     PM.ProcResourceDefs.push_back(ProcResUnits);
2206     if (ProcResUnits->isSubClassOf("ProcResGroup"))
2207       return;
2208 
2209     if (!ProcResUnits->getValueInit("Super")->isComplete())
2210       return;
2211 
2212     ProcResKind = ProcResUnits->getValueAsDef("Super");
2213   }
2214 }
2215 
2216 // Add resources for a SchedWrite to this processor if they don't exist.
2217 void CodeGenSchedModels::addWriteRes(Record *ProcWriteResDef, unsigned PIdx) {
2218   assert(PIdx && "don't add resources to an invalid Processor model");
2219 
2220   RecVec &WRDefs = ProcModels[PIdx].WriteResDefs;
2221   if (is_contained(WRDefs, ProcWriteResDef))
2222     return;
2223   WRDefs.push_back(ProcWriteResDef);
2224 
2225   // Visit ProcResourceKinds referenced by the newly discovered WriteRes.
2226   RecVec ProcResDefs = ProcWriteResDef->getValueAsListOfDefs("ProcResources");
2227   for (RecIter WritePRI = ProcResDefs.begin(), WritePRE = ProcResDefs.end();
2228        WritePRI != WritePRE; ++WritePRI) {
2229     addProcResource(*WritePRI, ProcModels[PIdx], ProcWriteResDef->getLoc());
2230   }
2231 }
2232 
2233 // Add resources for a ReadAdvance to this processor if they don't exist.
2234 void CodeGenSchedModels::addReadAdvance(Record *ProcReadAdvanceDef,
2235                                         unsigned PIdx) {
2236   RecVec &RADefs = ProcModels[PIdx].ReadAdvanceDefs;
2237   if (is_contained(RADefs, ProcReadAdvanceDef))
2238     return;
2239   RADefs.push_back(ProcReadAdvanceDef);
2240 }
2241 
2242 unsigned CodeGenProcModel::getProcResourceIdx(Record *PRDef) const {
2243   RecIter PRPos = find(ProcResourceDefs, PRDef);
2244   if (PRPos == ProcResourceDefs.end())
2245     PrintFatalError(PRDef->getLoc(), "ProcResource def is not included in "
2246                     "the ProcResources list for " + ModelName);
2247   // Idx=0 is reserved for invalid.
2248   return 1 + (PRPos - ProcResourceDefs.begin());
2249 }
2250 
2251 bool CodeGenProcModel::isUnsupported(const CodeGenInstruction &Inst) const {
2252   for (const Record *TheDef : UnsupportedFeaturesDefs) {
2253     for (const Record *PredDef : Inst.TheDef->getValueAsListOfDefs("Predicates")) {
2254       if (TheDef->getName() == PredDef->getName())
2255         return true;
2256     }
2257   }
2258   return false;
2259 }
2260 
2261 #ifndef NDEBUG
2262 void CodeGenProcModel::dump() const {
2263   dbgs() << Index << ": " << ModelName << " "
2264          << (ModelDef ? ModelDef->getName() : "inferred") << " "
2265          << (ItinsDef ? ItinsDef->getName() : "no itinerary") << '\n';
2266 }
2267 
2268 void CodeGenSchedRW::dump() const {
2269   dbgs() << Name << (IsVariadic ? " (V) " : " ");
2270   if (IsSequence) {
2271     dbgs() << "(";
2272     dumpIdxVec(Sequence);
2273     dbgs() << ")";
2274   }
2275 }
2276 
2277 void CodeGenSchedClass::dump(const CodeGenSchedModels* SchedModels) const {
2278   dbgs() << "SCHEDCLASS " << Index << ":" << Name << '\n'
2279          << "  Writes: ";
2280   for (unsigned i = 0, N = Writes.size(); i < N; ++i) {
2281     SchedModels->getSchedWrite(Writes[i]).dump();
2282     if (i < N-1) {
2283       dbgs() << '\n';
2284       dbgs().indent(10);
2285     }
2286   }
2287   dbgs() << "\n  Reads: ";
2288   for (unsigned i = 0, N = Reads.size(); i < N; ++i) {
2289     SchedModels->getSchedRead(Reads[i]).dump();
2290     if (i < N-1) {
2291       dbgs() << '\n';
2292       dbgs().indent(10);
2293     }
2294   }
2295   dbgs() << "\n  ProcIdx: "; dumpIdxVec(ProcIndices);
2296   if (!Transitions.empty()) {
2297     dbgs() << "\n Transitions for Proc ";
2298     for (const CodeGenSchedTransition &Transition : Transitions) {
2299       dumpIdxVec(Transition.ProcIndices);
2300     }
2301   }
2302   dbgs() << '\n';
2303 }
2304 
2305 void PredTransitions::dump() const {
2306   dbgs() << "Expanded Variants:\n";
2307   for (std::vector<PredTransition>::const_iterator
2308          TI = TransVec.begin(), TE = TransVec.end(); TI != TE; ++TI) {
2309     dbgs() << "{";
2310     for (SmallVectorImpl<PredCheck>::const_iterator
2311            PCI = TI->PredTerm.begin(), PCE = TI->PredTerm.end();
2312          PCI != PCE; ++PCI) {
2313       if (PCI != TI->PredTerm.begin())
2314         dbgs() << ", ";
2315       dbgs() << SchedModels.getSchedRW(PCI->RWIdx, PCI->IsRead).Name
2316              << ":" << PCI->Predicate->getName();
2317     }
2318     dbgs() << "},\n  => {";
2319     for (SmallVectorImpl<SmallVector<unsigned,4>>::const_iterator
2320            WSI = TI->WriteSequences.begin(), WSE = TI->WriteSequences.end();
2321          WSI != WSE; ++WSI) {
2322       dbgs() << "(";
2323       for (SmallVectorImpl<unsigned>::const_iterator
2324              WI = WSI->begin(), WE = WSI->end(); WI != WE; ++WI) {
2325         if (WI != WSI->begin())
2326           dbgs() << ", ";
2327         dbgs() << SchedModels.getSchedWrite(*WI).Name;
2328       }
2329       dbgs() << "),";
2330     }
2331     dbgs() << "}\n";
2332   }
2333 }
2334 #endif // NDEBUG
2335