Path: blob/main/contrib/llvm-project/llvm/utils/TableGen/Common/CodeGenSchedule.cpp
35290 views
//===- CodeGenSchedule.cpp - Scheduling MachineModels ---------------------===//1//2// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.3// See https://llvm.org/LICENSE.txt for license information.4// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception5//6//===----------------------------------------------------------------------===//7//8// This file defines structures to encapsulate the machine model as described in9// the target description.10//11//===----------------------------------------------------------------------===//1213#include "CodeGenSchedule.h"14#include "CodeGenInstruction.h"15#include "CodeGenTarget.h"16#include "llvm/ADT/MapVector.h"17#include "llvm/ADT/STLExtras.h"18#include "llvm/ADT/SmallPtrSet.h"19#include "llvm/ADT/SmallVector.h"20#include "llvm/Support/Casting.h"21#include "llvm/Support/Debug.h"22#include "llvm/Support/Regex.h"23#include "llvm/Support/raw_ostream.h"24#include "llvm/TableGen/Error.h"25#include <algorithm>26#include <iterator>27#include <utility>2829using namespace llvm;3031#define DEBUG_TYPE "subtarget-emitter"3233#ifndef NDEBUG34static void dumpIdxVec(ArrayRef<unsigned> V) {35for (unsigned Idx : V)36dbgs() << Idx << ", ";37}38#endif3940namespace {4142// (instrs a, b, ...) Evaluate and union all arguments. Identical to AddOp.43struct InstrsOp : public SetTheory::Operator {44void apply(SetTheory &ST, DagInit *Expr, SetTheory::RecSet &Elts,45ArrayRef<SMLoc> Loc) override {46ST.evaluate(Expr->arg_begin(), Expr->arg_end(), Elts, Loc);47}48};4950// (instregex "OpcPat",...) Find all instructions matching an opcode pattern.51struct InstRegexOp : public SetTheory::Operator {52const CodeGenTarget &Target;53InstRegexOp(const CodeGenTarget &t) : Target(t) {}5455/// Remove any text inside of parentheses from S.56static std::string removeParens(llvm::StringRef S) {57std::string Result;58unsigned Paren = 0;59// NB: We don't care about escaped parens here.60for (char C : S) {61switch (C) {62case '(':63++Paren;64break;65case ')':66--Paren;67break;68default:69if (Paren == 0)70Result += C;71}72}73return Result;74}7576void apply(SetTheory &ST, DagInit *Expr, SetTheory::RecSet &Elts,77ArrayRef<SMLoc> Loc) override {78ArrayRef<const CodeGenInstruction *> Instructions =79Target.getInstructionsByEnumValue();8081unsigned NumGeneric = Target.getNumFixedInstructions();82unsigned NumPseudos = Target.getNumPseudoInstructions();83auto Generics = Instructions.slice(0, NumGeneric);84auto Pseudos = Instructions.slice(NumGeneric, NumPseudos);85auto NonPseudos = Instructions.slice(NumGeneric + NumPseudos);8687for (Init *Arg : Expr->getArgs()) {88StringInit *SI = dyn_cast<StringInit>(Arg);89if (!SI)90PrintFatalError(Loc, "instregex requires pattern string: " +91Expr->getAsString());92StringRef Original = SI->getValue();93// Drop an explicit ^ anchor to not interfere with prefix search.94bool HadAnchor = Original.consume_front("^");9596// Extract a prefix that we can binary search on.97static const char RegexMetachars[] = "()^$|*+?.[]\\{}";98auto FirstMeta = Original.find_first_of(RegexMetachars);99if (FirstMeta != StringRef::npos && FirstMeta > 0) {100// If we have a regex like ABC* we can only use AB as the prefix, as101// the * acts on C.102switch (Original[FirstMeta]) {103case '+':104case '*':105case '?':106--FirstMeta;107break;108default:109break;110}111}112113// Look for top-level | or ?. We cannot optimize them to binary search.114if (removeParens(Original).find_first_of("|?") != std::string::npos)115FirstMeta = 0;116117std::optional<Regex> Regexpr;118StringRef Prefix = Original.substr(0, FirstMeta);119StringRef PatStr = Original.substr(FirstMeta);120if (!PatStr.empty()) {121// For the rest use a python-style prefix match.122std::string pat = std::string(PatStr);123// Add ^ anchor. If we had one originally, don't need the group.124if (HadAnchor) {125pat.insert(0, "^");126} else {127pat.insert(0, "^(");128pat.insert(pat.end(), ')');129}130Regexpr = Regex(pat);131}132133int NumMatches = 0;134135// The generic opcodes are unsorted, handle them manually.136for (auto *Inst : Generics) {137StringRef InstName = Inst->TheDef->getName();138if (InstName.starts_with(Prefix) &&139(!Regexpr || Regexpr->match(InstName.substr(Prefix.size())))) {140Elts.insert(Inst->TheDef);141NumMatches++;142}143}144145// Target instructions are split into two ranges: pseudo instructions146// first, than non-pseudos. Each range is in lexicographical order147// sorted by name. Find the sub-ranges that start with our prefix.148struct Comp {149bool operator()(const CodeGenInstruction *LHS, StringRef RHS) {150return LHS->TheDef->getName() < RHS;151}152bool operator()(StringRef LHS, const CodeGenInstruction *RHS) {153return LHS < RHS->TheDef->getName() &&154!RHS->TheDef->getName().starts_with(LHS);155}156};157auto Range1 =158std::equal_range(Pseudos.begin(), Pseudos.end(), Prefix, Comp());159auto Range2 = std::equal_range(NonPseudos.begin(), NonPseudos.end(),160Prefix, Comp());161162// For these ranges we know that instruction names start with the prefix.163// Check if there's a regex that needs to be checked.164const auto HandleNonGeneric = [&](const CodeGenInstruction *Inst) {165StringRef InstName = Inst->TheDef->getName();166if (!Regexpr || Regexpr->match(InstName.substr(Prefix.size()))) {167Elts.insert(Inst->TheDef);168NumMatches++;169}170};171std::for_each(Range1.first, Range1.second, HandleNonGeneric);172std::for_each(Range2.first, Range2.second, HandleNonGeneric);173174if (0 == NumMatches)175PrintFatalError(Loc, "instregex has no matches: " + Original);176}177}178};179180} // end anonymous namespace181182/// CodeGenModels ctor interprets machine model records and populates maps.183CodeGenSchedModels::CodeGenSchedModels(RecordKeeper &RK,184const CodeGenTarget &TGT)185: Records(RK), Target(TGT) {186187Sets.addFieldExpander("InstRW", "Instrs");188189// Allow Set evaluation to recognize the dags used in InstRW records:190// (instrs Op1, Op1...)191Sets.addOperator("instrs", std::make_unique<InstrsOp>());192Sets.addOperator("instregex", std::make_unique<InstRegexOp>(Target));193194// Instantiate a CodeGenProcModel for each SchedMachineModel with the values195// that are explicitly referenced in tablegen records. Resources associated196// with each processor will be derived later. Populate ProcModelMap with the197// CodeGenProcModel instances.198collectProcModels();199200// Instantiate a CodeGenSchedRW for each SchedReadWrite record explicitly201// defined, and populate SchedReads and SchedWrites vectors. Implicit202// SchedReadWrites that represent sequences derived from expanded variant will203// be inferred later.204collectSchedRW();205206// Instantiate a CodeGenSchedClass for each unique SchedRW signature directly207// required by an instruction definition, and populate SchedClassIdxMap. Set208// NumItineraryClasses to the number of explicit itinerary classes referenced209// by instructions. Set NumInstrSchedClasses to the number of itinerary210// classes plus any classes implied by instructions that derive from class211// Sched and provide SchedRW list. This does not infer any new classes from212// SchedVariant.213collectSchedClasses();214215// Find instruction itineraries for each processor. Sort and populate216// CodeGenProcModel::ItinDefList. (Cycle-to-cycle itineraries). This requires217// all itinerary classes to be discovered.218collectProcItins();219220// Find ItinRW records for each processor and itinerary class.221// (For per-operand resources mapped to itinerary classes).222collectProcItinRW();223224// Find UnsupportedFeatures records for each processor.225// (For per-operand resources mapped to itinerary classes).226collectProcUnsupportedFeatures();227228// Infer new SchedClasses from SchedVariant.229inferSchedClasses();230231// Populate each CodeGenProcModel's WriteResDefs, ReadAdvanceDefs, and232// ProcResourceDefs.233LLVM_DEBUG(234dbgs() << "\n+++ RESOURCE DEFINITIONS (collectProcResources) +++\n");235collectProcResources();236237// Collect optional processor description.238collectOptionalProcessorInfo();239240// Check MCInstPredicate definitions.241checkMCInstPredicates();242243// Check STIPredicate definitions.244checkSTIPredicates();245246// Find STIPredicate definitions for each processor model, and construct247// STIPredicateFunction objects.248collectSTIPredicates();249250checkCompleteness();251}252253void CodeGenSchedModels::checkSTIPredicates() const {254DenseMap<StringRef, const Record *> Declarations;255256// There cannot be multiple declarations with the same name.257const RecVec Decls = Records.getAllDerivedDefinitions("STIPredicateDecl");258for (const Record *R : Decls) {259StringRef Name = R->getValueAsString("Name");260const auto It = Declarations.find(Name);261if (It == Declarations.end()) {262Declarations[Name] = R;263continue;264}265266PrintError(R->getLoc(), "STIPredicate " + Name + " multiply declared.");267PrintFatalNote(It->second->getLoc(), "Previous declaration was here.");268}269270// Disallow InstructionEquivalenceClasses with an empty instruction list.271const RecVec Defs =272Records.getAllDerivedDefinitions("InstructionEquivalenceClass");273for (const Record *R : Defs) {274RecVec Opcodes = R->getValueAsListOfDefs("Opcodes");275if (Opcodes.empty()) {276PrintFatalError(R->getLoc(), "Invalid InstructionEquivalenceClass "277"defined with an empty opcode list.");278}279}280}281282// Used by function `processSTIPredicate` to construct a mask of machine283// instruction operands.284static APInt constructOperandMask(ArrayRef<int64_t> Indices) {285APInt OperandMask;286if (Indices.empty())287return OperandMask;288289int64_t MaxIndex = *llvm::max_element(Indices);290assert(MaxIndex >= 0 && "Invalid negative indices in input!");291OperandMask = OperandMask.zext(MaxIndex + 1);292for (const int64_t Index : Indices) {293assert(Index >= 0 && "Invalid negative indices!");294OperandMask.setBit(Index);295}296297return OperandMask;298}299300static void processSTIPredicate(STIPredicateFunction &Fn,301const ProcModelMapTy &ProcModelMap) {302DenseMap<const Record *, unsigned> Opcode2Index;303using OpcodeMapPair = std::pair<const Record *, OpcodeInfo>;304std::vector<OpcodeMapPair> OpcodeMappings;305std::vector<std::pair<APInt, APInt>> OpcodeMasks;306307DenseMap<const Record *, unsigned> Predicate2Index;308unsigned NumUniquePredicates = 0;309310// Number unique predicates and opcodes used by InstructionEquivalenceClass311// definitions. Each unique opcode will be associated with an OpcodeInfo312// object.313for (const Record *Def : Fn.getDefinitions()) {314RecVec Classes = Def->getValueAsListOfDefs("Classes");315for (const Record *EC : Classes) {316const Record *Pred = EC->getValueAsDef("Predicate");317if (!Predicate2Index.contains(Pred))318Predicate2Index[Pred] = NumUniquePredicates++;319320RecVec Opcodes = EC->getValueAsListOfDefs("Opcodes");321for (const Record *Opcode : Opcodes) {322if (!Opcode2Index.contains(Opcode)) {323Opcode2Index[Opcode] = OpcodeMappings.size();324OpcodeMappings.emplace_back(Opcode, OpcodeInfo());325}326}327}328}329330// Initialize vector `OpcodeMasks` with default values. We want to keep track331// of which processors "use" which opcodes. We also want to be able to332// identify predicates that are used by different processors for a same333// opcode.334// This information is used later on by this algorithm to sort OpcodeMapping335// elements based on their processor and predicate sets.336OpcodeMasks.resize(OpcodeMappings.size());337APInt DefaultProcMask(ProcModelMap.size(), 0);338APInt DefaultPredMask(NumUniquePredicates, 0);339for (std::pair<APInt, APInt> &MaskPair : OpcodeMasks)340MaskPair = std::pair(DefaultProcMask, DefaultPredMask);341342// Construct a OpcodeInfo object for every unique opcode declared by an343// InstructionEquivalenceClass definition.344for (const Record *Def : Fn.getDefinitions()) {345RecVec Classes = Def->getValueAsListOfDefs("Classes");346const Record *SchedModel = Def->getValueAsDef("SchedModel");347unsigned ProcIndex = ProcModelMap.find(SchedModel)->second;348APInt ProcMask(ProcModelMap.size(), 0);349ProcMask.setBit(ProcIndex);350351for (const Record *EC : Classes) {352RecVec Opcodes = EC->getValueAsListOfDefs("Opcodes");353354std::vector<int64_t> OpIndices =355EC->getValueAsListOfInts("OperandIndices");356APInt OperandMask = constructOperandMask(OpIndices);357358const Record *Pred = EC->getValueAsDef("Predicate");359APInt PredMask(NumUniquePredicates, 0);360PredMask.setBit(Predicate2Index[Pred]);361362for (const Record *Opcode : Opcodes) {363unsigned OpcodeIdx = Opcode2Index[Opcode];364if (OpcodeMasks[OpcodeIdx].first[ProcIndex]) {365std::string Message =366"Opcode " + Opcode->getName().str() +367" used by multiple InstructionEquivalenceClass definitions.";368PrintFatalError(EC->getLoc(), Message);369}370OpcodeMasks[OpcodeIdx].first |= ProcMask;371OpcodeMasks[OpcodeIdx].second |= PredMask;372OpcodeInfo &OI = OpcodeMappings[OpcodeIdx].second;373374OI.addPredicateForProcModel(ProcMask, OperandMask, Pred);375}376}377}378379// Sort OpcodeMappings elements based on their CPU and predicate masks.380// As a last resort, order elements by opcode identifier.381llvm::sort(382OpcodeMappings, [&](const OpcodeMapPair &Lhs, const OpcodeMapPair &Rhs) {383unsigned LhsIdx = Opcode2Index[Lhs.first];384unsigned RhsIdx = Opcode2Index[Rhs.first];385const std::pair<APInt, APInt> &LhsMasks = OpcodeMasks[LhsIdx];386const std::pair<APInt, APInt> &RhsMasks = OpcodeMasks[RhsIdx];387388auto PopulationCountAndLeftBit =389[](const APInt &Other) -> std::pair<int, int> {390return std::pair<int, int>(Other.popcount(), -Other.countl_zero());391};392auto lhsmask_first = PopulationCountAndLeftBit(LhsMasks.first);393auto rhsmask_first = PopulationCountAndLeftBit(RhsMasks.first);394if (lhsmask_first != rhsmask_first)395return lhsmask_first < rhsmask_first;396397auto lhsmask_second = PopulationCountAndLeftBit(LhsMasks.second);398auto rhsmask_second = PopulationCountAndLeftBit(RhsMasks.second);399if (lhsmask_second != rhsmask_second)400return lhsmask_second < rhsmask_second;401402return LhsIdx < RhsIdx;403});404405// Now construct opcode groups. Groups are used by the SubtargetEmitter when406// expanding the body of a STIPredicate function. In particular, each opcode407// group is expanded into a sequence of labels in a switch statement.408// It identifies opcodes for which different processors define same predicates409// and same opcode masks.410for (OpcodeMapPair &Info : OpcodeMappings)411Fn.addOpcode(Info.first, std::move(Info.second));412}413414void CodeGenSchedModels::collectSTIPredicates() {415// Map STIPredicateDecl records to elements of vector416// CodeGenSchedModels::STIPredicates.417DenseMap<const Record *, unsigned> Decl2Index;418419RecVec RV = Records.getAllDerivedDefinitions("STIPredicate");420for (const Record *R : RV) {421const Record *Decl = R->getValueAsDef("Declaration");422423const auto It = Decl2Index.find(Decl);424if (It == Decl2Index.end()) {425Decl2Index[Decl] = STIPredicates.size();426STIPredicateFunction Predicate(Decl);427Predicate.addDefinition(R);428STIPredicates.emplace_back(std::move(Predicate));429continue;430}431432STIPredicateFunction &PreviousDef = STIPredicates[It->second];433PreviousDef.addDefinition(R);434}435436for (STIPredicateFunction &Fn : STIPredicates)437processSTIPredicate(Fn, ProcModelMap);438}439440void OpcodeInfo::addPredicateForProcModel(const llvm::APInt &CpuMask,441const llvm::APInt &OperandMask,442const Record *Predicate) {443auto It = llvm::find_if(444Predicates, [&OperandMask, &Predicate](const PredicateInfo &P) {445return P.Predicate == Predicate && P.OperandMask == OperandMask;446});447if (It == Predicates.end()) {448Predicates.emplace_back(CpuMask, OperandMask, Predicate);449return;450}451It->ProcModelMask |= CpuMask;452}453454void CodeGenSchedModels::checkMCInstPredicates() const {455RecVec MCPredicates = Records.getAllDerivedDefinitions("TIIPredicate");456if (MCPredicates.empty())457return;458459// A target cannot have multiple TIIPredicate definitions with a same name.460llvm::StringMap<const Record *> TIIPredicates(MCPredicates.size());461for (const Record *TIIPred : MCPredicates) {462StringRef Name = TIIPred->getValueAsString("FunctionName");463StringMap<const Record *>::const_iterator It = TIIPredicates.find(Name);464if (It == TIIPredicates.end()) {465TIIPredicates[Name] = TIIPred;466continue;467}468469PrintError(TIIPred->getLoc(),470"TIIPredicate " + Name + " is multiply defined.");471PrintFatalNote(It->second->getLoc(),472" Previous definition of " + Name + " was here.");473}474}475476void CodeGenSchedModels::collectRetireControlUnits() {477RecVec Units = Records.getAllDerivedDefinitions("RetireControlUnit");478479for (Record *RCU : Units) {480CodeGenProcModel &PM = getProcModel(RCU->getValueAsDef("SchedModel"));481if (PM.RetireControlUnit) {482PrintError(RCU->getLoc(),483"Expected a single RetireControlUnit definition");484PrintNote(PM.RetireControlUnit->getLoc(),485"Previous definition of RetireControlUnit was here");486}487PM.RetireControlUnit = RCU;488}489}490491void CodeGenSchedModels::collectLoadStoreQueueInfo() {492RecVec Queues = Records.getAllDerivedDefinitions("MemoryQueue");493494for (Record *Queue : Queues) {495CodeGenProcModel &PM = getProcModel(Queue->getValueAsDef("SchedModel"));496if (Queue->isSubClassOf("LoadQueue")) {497if (PM.LoadQueue) {498PrintError(Queue->getLoc(), "Expected a single LoadQueue definition");499PrintNote(PM.LoadQueue->getLoc(),500"Previous definition of LoadQueue was here");501}502503PM.LoadQueue = Queue;504}505506if (Queue->isSubClassOf("StoreQueue")) {507if (PM.StoreQueue) {508PrintError(Queue->getLoc(), "Expected a single StoreQueue definition");509PrintNote(PM.StoreQueue->getLoc(),510"Previous definition of StoreQueue was here");511}512513PM.StoreQueue = Queue;514}515}516}517518/// Collect optional processor information.519void CodeGenSchedModels::collectOptionalProcessorInfo() {520// Find register file definitions for each processor.521collectRegisterFiles();522523// Collect processor RetireControlUnit descriptors if available.524collectRetireControlUnits();525526// Collect information about load/store queues.527collectLoadStoreQueueInfo();528529checkCompleteness();530}531532/// Gather all processor models.533void CodeGenSchedModels::collectProcModels() {534RecVec ProcRecords = Records.getAllDerivedDefinitions("Processor");535llvm::sort(ProcRecords, LessRecordFieldName());536537// Check for duplicated names.538auto I = std::adjacent_find(ProcRecords.begin(), ProcRecords.end(),539[](const Record *Rec1, const Record *Rec2) {540return Rec1->getValueAsString("Name") ==541Rec2->getValueAsString("Name");542});543if (I != ProcRecords.end())544PrintFatalError((*I)->getLoc(), "Duplicate processor name " +545(*I)->getValueAsString("Name"));546547// Reserve space because we can. Reallocation would be ok.548ProcModels.reserve(ProcRecords.size() + 1);549550// Use idx=0 for NoModel/NoItineraries.551Record *NoModelDef = Records.getDef("NoSchedModel");552Record *NoItinsDef = Records.getDef("NoItineraries");553ProcModels.emplace_back(0, "NoSchedModel", NoModelDef, NoItinsDef);554ProcModelMap[NoModelDef] = 0;555556// For each processor, find a unique machine model.557LLVM_DEBUG(dbgs() << "+++ PROCESSOR MODELs (addProcModel) +++\n");558for (Record *ProcRecord : ProcRecords)559addProcModel(ProcRecord);560}561562/// Get a unique processor model based on the defined MachineModel and563/// ProcessorItineraries.564void CodeGenSchedModels::addProcModel(Record *ProcDef) {565Record *ModelKey = getModelOrItinDef(ProcDef);566if (!ProcModelMap.insert(std::pair(ModelKey, ProcModels.size())).second)567return;568569std::string Name = std::string(ModelKey->getName());570if (ModelKey->isSubClassOf("SchedMachineModel")) {571Record *ItinsDef = ModelKey->getValueAsDef("Itineraries");572ProcModels.emplace_back(ProcModels.size(), Name, ModelKey, ItinsDef);573} else {574// An itinerary is defined without a machine model. Infer a new model.575if (!ModelKey->getValueAsListOfDefs("IID").empty())576Name = Name + "Model";577ProcModels.emplace_back(ProcModels.size(), Name,578ProcDef->getValueAsDef("SchedModel"), ModelKey);579}580LLVM_DEBUG(ProcModels.back().dump());581}582583// Recursively find all reachable SchedReadWrite records.584static void scanSchedRW(Record *RWDef, RecVec &RWDefs,585SmallPtrSet<Record *, 16> &RWSet) {586if (!RWSet.insert(RWDef).second)587return;588RWDefs.push_back(RWDef);589// Reads don't currently have sequence records, but it can be added later.590if (RWDef->isSubClassOf("WriteSequence")) {591RecVec Seq = RWDef->getValueAsListOfDefs("Writes");592for (Record *WSRec : Seq)593scanSchedRW(WSRec, RWDefs, RWSet);594} else if (RWDef->isSubClassOf("SchedVariant")) {595// Visit each variant (guarded by a different predicate).596RecVec Vars = RWDef->getValueAsListOfDefs("Variants");597for (Record *Variant : Vars) {598// Visit each RW in the sequence selected by the current variant.599RecVec Selected = Variant->getValueAsListOfDefs("Selected");600for (Record *SelDef : Selected)601scanSchedRW(SelDef, RWDefs, RWSet);602}603}604}605606// Collect and sort all SchedReadWrites reachable via tablegen records.607// More may be inferred later when inferring new SchedClasses from variants.608void CodeGenSchedModels::collectSchedRW() {609// Reserve idx=0 for invalid writes/reads.610SchedWrites.resize(1);611SchedReads.resize(1);612613SmallPtrSet<Record *, 16> RWSet;614615// Find all SchedReadWrites referenced by instruction defs.616RecVec SWDefs, SRDefs;617for (const CodeGenInstruction *Inst : Target.getInstructionsByEnumValue()) {618Record *SchedDef = Inst->TheDef;619if (SchedDef->isValueUnset("SchedRW"))620continue;621RecVec RWs = SchedDef->getValueAsListOfDefs("SchedRW");622for (Record *RW : RWs) {623if (RW->isSubClassOf("SchedWrite"))624scanSchedRW(RW, SWDefs, RWSet);625else {626assert(RW->isSubClassOf("SchedRead") && "Unknown SchedReadWrite");627scanSchedRW(RW, SRDefs, RWSet);628}629}630}631// Find all ReadWrites referenced by InstRW.632RecVec InstRWDefs = Records.getAllDerivedDefinitions("InstRW");633for (Record *InstRWDef : InstRWDefs) {634// For all OperandReadWrites.635RecVec RWDefs = InstRWDef->getValueAsListOfDefs("OperandReadWrites");636for (Record *RWDef : RWDefs) {637if (RWDef->isSubClassOf("SchedWrite"))638scanSchedRW(RWDef, SWDefs, RWSet);639else {640assert(RWDef->isSubClassOf("SchedRead") && "Unknown SchedReadWrite");641scanSchedRW(RWDef, SRDefs, RWSet);642}643}644}645// Find all ReadWrites referenced by ItinRW.646RecVec ItinRWDefs = Records.getAllDerivedDefinitions("ItinRW");647for (Record *ItinRWDef : ItinRWDefs) {648// For all OperandReadWrites.649RecVec RWDefs = ItinRWDef->getValueAsListOfDefs("OperandReadWrites");650for (Record *RWDef : RWDefs) {651if (RWDef->isSubClassOf("SchedWrite"))652scanSchedRW(RWDef, SWDefs, RWSet);653else {654assert(RWDef->isSubClassOf("SchedRead") && "Unknown SchedReadWrite");655scanSchedRW(RWDef, SRDefs, RWSet);656}657}658}659// Find all ReadWrites referenced by SchedAlias. AliasDefs needs to be sorted660// for the loop below that initializes Alias vectors.661RecVec AliasDefs = Records.getAllDerivedDefinitions("SchedAlias");662llvm::sort(AliasDefs, LessRecord());663for (Record *ADef : AliasDefs) {664Record *MatchDef = ADef->getValueAsDef("MatchRW");665Record *AliasDef = ADef->getValueAsDef("AliasRW");666if (MatchDef->isSubClassOf("SchedWrite")) {667if (!AliasDef->isSubClassOf("SchedWrite"))668PrintFatalError(ADef->getLoc(), "SchedWrite Alias must be SchedWrite");669scanSchedRW(AliasDef, SWDefs, RWSet);670} else {671assert(MatchDef->isSubClassOf("SchedRead") && "Unknown SchedReadWrite");672if (!AliasDef->isSubClassOf("SchedRead"))673PrintFatalError(ADef->getLoc(), "SchedRead Alias must be SchedRead");674scanSchedRW(AliasDef, SRDefs, RWSet);675}676}677// Sort and add the SchedReadWrites directly referenced by instructions or678// itinerary resources. Index reads and writes in separate domains.679llvm::sort(SWDefs, LessRecord());680for (Record *SWDef : SWDefs) {681assert(!getSchedRWIdx(SWDef, /*IsRead=*/false) && "duplicate SchedWrite");682SchedWrites.emplace_back(SchedWrites.size(), SWDef);683}684llvm::sort(SRDefs, LessRecord());685for (Record *SRDef : SRDefs) {686assert(!getSchedRWIdx(SRDef, /*IsRead-*/ true) && "duplicate SchedWrite");687SchedReads.emplace_back(SchedReads.size(), SRDef);688}689// Initialize WriteSequence vectors.690for (CodeGenSchedRW &CGRW : SchedWrites) {691if (!CGRW.IsSequence)692continue;693findRWs(CGRW.TheDef->getValueAsListOfDefs("Writes"), CGRW.Sequence,694/*IsRead=*/false);695}696// Initialize Aliases vectors.697for (Record *ADef : AliasDefs) {698Record *AliasDef = ADef->getValueAsDef("AliasRW");699getSchedRW(AliasDef).IsAlias = true;700Record *MatchDef = ADef->getValueAsDef("MatchRW");701CodeGenSchedRW &RW = getSchedRW(MatchDef);702if (RW.IsAlias)703PrintFatalError(ADef->getLoc(), "Cannot Alias an Alias");704RW.Aliases.push_back(ADef);705}706LLVM_DEBUG(707dbgs() << "\n+++ SCHED READS and WRITES (collectSchedRW) +++\n";708for (unsigned WIdx = 0, WEnd = SchedWrites.size(); WIdx != WEnd; ++WIdx) {709dbgs() << WIdx << ": ";710SchedWrites[WIdx].dump();711dbgs() << '\n';712} for (unsigned RIdx = 0, REnd = SchedReads.size(); RIdx != REnd;713++RIdx) {714dbgs() << RIdx << ": ";715SchedReads[RIdx].dump();716dbgs() << '\n';717} RecVec RWDefs = Records.getAllDerivedDefinitions("SchedReadWrite");718for (Record *RWDef719: RWDefs) {720if (!getSchedRWIdx(RWDef, RWDef->isSubClassOf("SchedRead"))) {721StringRef Name = RWDef->getName();722if (Name != "NoWrite" && Name != "ReadDefault")723dbgs() << "Unused SchedReadWrite " << Name << '\n';724}725});726}727728/// Compute a SchedWrite name from a sequence of writes.729std::string CodeGenSchedModels::genRWName(ArrayRef<unsigned> Seq, bool IsRead) {730std::string Name("(");731ListSeparator LS("_");732for (unsigned I : Seq) {733Name += LS;734Name += getSchedRW(I, IsRead).Name;735}736Name += ')';737return Name;738}739740unsigned CodeGenSchedModels::getSchedRWIdx(const Record *Def,741bool IsRead) const {742const std::vector<CodeGenSchedRW> &RWVec = IsRead ? SchedReads : SchedWrites;743const auto I = find_if(744RWVec, [Def](const CodeGenSchedRW &RW) { return RW.TheDef == Def; });745return I == RWVec.end() ? 0 : std::distance(RWVec.begin(), I);746}747748static void splitSchedReadWrites(const RecVec &RWDefs, RecVec &WriteDefs,749RecVec &ReadDefs) {750for (Record *RWDef : RWDefs) {751if (RWDef->isSubClassOf("SchedWrite"))752WriteDefs.push_back(RWDef);753else {754assert(RWDef->isSubClassOf("SchedRead") && "unknown SchedReadWrite");755ReadDefs.push_back(RWDef);756}757}758}759760// Split the SchedReadWrites defs and call findRWs for each list.761void CodeGenSchedModels::findRWs(const RecVec &RWDefs, IdxVec &Writes,762IdxVec &Reads) const {763RecVec WriteDefs;764RecVec ReadDefs;765splitSchedReadWrites(RWDefs, WriteDefs, ReadDefs);766findRWs(WriteDefs, Writes, false);767findRWs(ReadDefs, Reads, true);768}769770// Call getSchedRWIdx for all elements in a sequence of SchedRW defs.771void CodeGenSchedModels::findRWs(const RecVec &RWDefs, IdxVec &RWs,772bool IsRead) const {773for (Record *RWDef : RWDefs) {774unsigned Idx = getSchedRWIdx(RWDef, IsRead);775assert(Idx && "failed to collect SchedReadWrite");776RWs.push_back(Idx);777}778}779780void CodeGenSchedModels::expandRWSequence(unsigned RWIdx, IdxVec &RWSeq,781bool IsRead) const {782const CodeGenSchedRW &SchedRW = getSchedRW(RWIdx, IsRead);783if (!SchedRW.IsSequence) {784RWSeq.push_back(RWIdx);785return;786}787int Repeat = SchedRW.TheDef ? SchedRW.TheDef->getValueAsInt("Repeat") : 1;788for (int i = 0; i < Repeat; ++i) {789for (unsigned I : SchedRW.Sequence) {790expandRWSequence(I, RWSeq, IsRead);791}792}793}794795// Expand a SchedWrite as a sequence following any aliases that coincide with796// the given processor model.797void CodeGenSchedModels::expandRWSeqForProc(798unsigned RWIdx, IdxVec &RWSeq, bool IsRead,799const CodeGenProcModel &ProcModel) const {800801const CodeGenSchedRW &SchedWrite = getSchedRW(RWIdx, IsRead);802Record *AliasDef = nullptr;803for (const Record *Rec : SchedWrite.Aliases) {804const CodeGenSchedRW &AliasRW = getSchedRW(Rec->getValueAsDef("AliasRW"));805if (Rec->getValueInit("SchedModel")->isComplete()) {806Record *ModelDef = Rec->getValueAsDef("SchedModel");807if (&getProcModel(ModelDef) != &ProcModel)808continue;809}810if (AliasDef)811PrintFatalError(AliasRW.TheDef->getLoc(),812"Multiple aliases "813"defined for processor " +814ProcModel.ModelName +815" Ensure only one SchedAlias exists per RW.");816AliasDef = AliasRW.TheDef;817}818if (AliasDef) {819expandRWSeqForProc(getSchedRWIdx(AliasDef, IsRead), RWSeq, IsRead,820ProcModel);821return;822}823if (!SchedWrite.IsSequence) {824RWSeq.push_back(RWIdx);825return;826}827int Repeat =828SchedWrite.TheDef ? SchedWrite.TheDef->getValueAsInt("Repeat") : 1;829for (int I = 0, E = Repeat; I < E; ++I) {830for (unsigned Idx : SchedWrite.Sequence) {831expandRWSeqForProc(Idx, RWSeq, IsRead, ProcModel);832}833}834}835836// Find the existing SchedWrite that models this sequence of writes.837unsigned CodeGenSchedModels::findRWForSequence(ArrayRef<unsigned> Seq,838bool IsRead) {839std::vector<CodeGenSchedRW> &RWVec = IsRead ? SchedReads : SchedWrites;840841auto I = find_if(RWVec, [Seq](CodeGenSchedRW &RW) {842return ArrayRef(RW.Sequence) == Seq;843});844// Index zero reserved for invalid RW.845return I == RWVec.end() ? 0 : std::distance(RWVec.begin(), I);846}847848/// Add this ReadWrite if it doesn't already exist.849unsigned CodeGenSchedModels::findOrInsertRW(ArrayRef<unsigned> Seq,850bool IsRead) {851assert(!Seq.empty() && "cannot insert empty sequence");852if (Seq.size() == 1)853return Seq.back();854855unsigned Idx = findRWForSequence(Seq, IsRead);856if (Idx)857return Idx;858859std::vector<CodeGenSchedRW> &RWVec = IsRead ? SchedReads : SchedWrites;860unsigned RWIdx = RWVec.size();861CodeGenSchedRW SchedRW(RWIdx, IsRead, Seq, genRWName(Seq, IsRead));862RWVec.push_back(SchedRW);863return RWIdx;864}865866/// Visit all the instruction definitions for this target to gather and867/// enumerate the itinerary classes. These are the explicitly specified868/// SchedClasses. More SchedClasses may be inferred.869void CodeGenSchedModels::collectSchedClasses() {870871// NoItinerary is always the first class at Idx=0872assert(SchedClasses.empty() && "Expected empty sched class");873SchedClasses.emplace_back(0, "NoInstrModel", Records.getDef("NoItinerary"));874SchedClasses.back().ProcIndices.push_back(0);875876// Create a SchedClass for each unique combination of itinerary class and877// SchedRW list.878for (const CodeGenInstruction *Inst : Target.getInstructionsByEnumValue()) {879Record *ItinDef = Inst->TheDef->getValueAsDef("Itinerary");880IdxVec Writes, Reads;881if (!Inst->TheDef->isValueUnset("SchedRW"))882findRWs(Inst->TheDef->getValueAsListOfDefs("SchedRW"), Writes, Reads);883884// ProcIdx == 0 indicates the class applies to all processors.885unsigned SCIdx = addSchedClass(ItinDef, Writes, Reads, /*ProcIndices*/ {0});886InstrClassMap[Inst->TheDef] = SCIdx;887}888// Create classes for InstRW defs.889RecVec InstRWDefs = Records.getAllDerivedDefinitions("InstRW");890llvm::sort(InstRWDefs, LessRecord());891LLVM_DEBUG(dbgs() << "\n+++ SCHED CLASSES (createInstRWClass) +++\n");892for (Record *RWDef : InstRWDefs)893createInstRWClass(RWDef);894895NumInstrSchedClasses = SchedClasses.size();896897bool EnableDump = false;898LLVM_DEBUG(EnableDump = true);899if (!EnableDump)900return;901902LLVM_DEBUG(903dbgs()904<< "\n+++ ITINERARIES and/or MACHINE MODELS (collectSchedClasses) +++\n");905for (const CodeGenInstruction *Inst : Target.getInstructionsByEnumValue()) {906StringRef InstName = Inst->TheDef->getName();907unsigned SCIdx = getSchedClassIdx(*Inst);908if (!SCIdx) {909LLVM_DEBUG({910if (!Inst->hasNoSchedulingInfo)911dbgs() << "No machine model for " << Inst->TheDef->getName() << '\n';912});913continue;914}915CodeGenSchedClass &SC = getSchedClass(SCIdx);916if (SC.ProcIndices[0] != 0)917PrintFatalError(Inst->TheDef->getLoc(),918"Instruction's sched class "919"must not be subtarget specific.");920921IdxVec ProcIndices;922if (SC.ItinClassDef->getName() != "NoItinerary") {923ProcIndices.push_back(0);924dbgs() << "Itinerary for " << InstName << ": "925<< SC.ItinClassDef->getName() << '\n';926}927if (!SC.Writes.empty()) {928ProcIndices.push_back(0);929LLVM_DEBUG({930dbgs() << "SchedRW machine model for " << InstName;931for (unsigned int Write : SC.Writes)932dbgs() << " " << SchedWrites[Write].Name;933for (unsigned int Read : SC.Reads)934dbgs() << " " << SchedReads[Read].Name;935dbgs() << '\n';936});937}938const RecVec &RWDefs = SchedClasses[SCIdx].InstRWs;939for (Record *RWDef : RWDefs) {940const CodeGenProcModel &ProcModel =941getProcModel(RWDef->getValueAsDef("SchedModel"));942ProcIndices.push_back(ProcModel.Index);943LLVM_DEBUG(dbgs() << "InstRW on " << ProcModel.ModelName << " for "944<< InstName);945IdxVec Writes;946IdxVec Reads;947findRWs(RWDef->getValueAsListOfDefs("OperandReadWrites"), Writes, Reads);948LLVM_DEBUG({949for (unsigned WIdx : Writes)950dbgs() << " " << SchedWrites[WIdx].Name;951for (unsigned RIdx : Reads)952dbgs() << " " << SchedReads[RIdx].Name;953dbgs() << '\n';954});955}956// If ProcIndices contains zero, the class applies to all processors.957LLVM_DEBUG({958if (!llvm::is_contained(ProcIndices, 0)) {959for (const CodeGenProcModel &PM : ProcModels) {960if (!llvm::is_contained(ProcIndices, PM.Index))961dbgs() << "No machine model for " << Inst->TheDef->getName()962<< " on processor " << PM.ModelName << '\n';963}964}965});966}967}968969// Get the SchedClass index for an instruction.970unsigned971CodeGenSchedModels::getSchedClassIdx(const CodeGenInstruction &Inst) const {972return InstrClassMap.lookup(Inst.TheDef);973}974975std::string976CodeGenSchedModels::createSchedClassName(Record *ItinClassDef,977ArrayRef<unsigned> OperWrites,978ArrayRef<unsigned> OperReads) {979980std::string Name;981if (ItinClassDef && ItinClassDef->getName() != "NoItinerary")982Name = std::string(ItinClassDef->getName());983for (unsigned Idx : OperWrites) {984if (!Name.empty())985Name += '_';986Name += SchedWrites[Idx].Name;987}988for (unsigned Idx : OperReads) {989Name += '_';990Name += SchedReads[Idx].Name;991}992return Name;993}994995std::string CodeGenSchedModels::createSchedClassName(const RecVec &InstDefs) {996997std::string Name;998ListSeparator LS("_");999for (const Record *InstDef : InstDefs) {1000Name += LS;1001Name += InstDef->getName();1002}1003return Name;1004}10051006/// Add an inferred sched class from an itinerary class and per-operand list of1007/// SchedWrites and SchedReads. ProcIndices contains the set of IDs of1008/// processors that may utilize this class.1009unsigned CodeGenSchedModels::addSchedClass(Record *ItinClassDef,1010ArrayRef<unsigned> OperWrites,1011ArrayRef<unsigned> OperReads,1012ArrayRef<unsigned> ProcIndices) {1013assert(!ProcIndices.empty() && "expect at least one ProcIdx");10141015auto IsKeyEqual = [=](const CodeGenSchedClass &SC) {1016return SC.isKeyEqual(ItinClassDef, OperWrites, OperReads);1017};10181019auto I = find_if(make_range(schedClassBegin(), schedClassEnd()), IsKeyEqual);1020unsigned Idx = I == schedClassEnd() ? 0 : std::distance(schedClassBegin(), I);1021if (Idx || SchedClasses[0].isKeyEqual(ItinClassDef, OperWrites, OperReads)) {1022IdxVec PI;1023std::set_union(SchedClasses[Idx].ProcIndices.begin(),1024SchedClasses[Idx].ProcIndices.end(), ProcIndices.begin(),1025ProcIndices.end(), std::back_inserter(PI));1026SchedClasses[Idx].ProcIndices = std::move(PI);1027return Idx;1028}1029Idx = SchedClasses.size();1030SchedClasses.emplace_back(1031Idx, createSchedClassName(ItinClassDef, OperWrites, OperReads),1032ItinClassDef);1033CodeGenSchedClass &SC = SchedClasses.back();1034SC.Writes = OperWrites;1035SC.Reads = OperReads;1036SC.ProcIndices = ProcIndices;10371038return Idx;1039}10401041// Create classes for each set of opcodes that are in the same InstReadWrite1042// definition across all processors.1043void CodeGenSchedModels::createInstRWClass(Record *InstRWDef) {1044// ClassInstrs will hold an entry for each subset of Instrs in InstRWDef that1045// intersects with an existing class via a previous InstRWDef. Instrs that do1046// not intersect with an existing class refer back to their former class as1047// determined from ItinDef or SchedRW.1048SmallMapVector<unsigned, SmallVector<Record *, 8>, 4> ClassInstrs;1049// Sort Instrs into sets.1050const RecVec *InstDefs = Sets.expand(InstRWDef);1051if (InstDefs->empty())1052PrintFatalError(InstRWDef->getLoc(), "No matching instruction opcodes");10531054for (Record *InstDef : *InstDefs) {1055InstClassMapTy::const_iterator Pos = InstrClassMap.find(InstDef);1056if (Pos == InstrClassMap.end())1057PrintFatalError(InstDef->getLoc(), "No sched class for instruction.");1058unsigned SCIdx = Pos->second;1059ClassInstrs[SCIdx].push_back(InstDef);1060}1061// For each set of Instrs, create a new class if necessary, and map or remap1062// the Instrs to it.1063for (auto &Entry : ClassInstrs) {1064unsigned OldSCIdx = Entry.first;1065ArrayRef<Record *> InstDefs = Entry.second;1066// If the all instrs in the current class are accounted for, then leave1067// them mapped to their old class.1068if (OldSCIdx) {1069const RecVec &RWDefs = SchedClasses[OldSCIdx].InstRWs;1070if (!RWDefs.empty()) {1071const RecVec *OrigInstDefs = Sets.expand(RWDefs[0]);1072unsigned OrigNumInstrs = count_if(*OrigInstDefs, [&](Record *OIDef) {1073return InstrClassMap[OIDef] == OldSCIdx;1074});1075if (OrigNumInstrs == InstDefs.size()) {1076assert(SchedClasses[OldSCIdx].ProcIndices[0] == 0 &&1077"expected a generic SchedClass");1078Record *RWModelDef = InstRWDef->getValueAsDef("SchedModel");1079// Make sure we didn't already have a InstRW containing this1080// instruction on this model.1081for (Record *RWD : RWDefs) {1082if (RWD->getValueAsDef("SchedModel") == RWModelDef &&1083RWModelDef->getValueAsBit("FullInstRWOverlapCheck")) {1084assert(!InstDefs.empty()); // Checked at function start.1085PrintError(1086InstRWDef->getLoc(),1087"Overlapping InstRW definition for \"" +1088InstDefs.front()->getName() +1089"\" also matches previous \"" +1090RWD->getValue("Instrs")->getValue()->getAsString() +1091"\".");1092PrintFatalNote(RWD->getLoc(), "Previous match was here.");1093}1094}1095LLVM_DEBUG(dbgs() << "InstRW: Reuse SC " << OldSCIdx << ":"1096<< SchedClasses[OldSCIdx].Name << " on "1097<< RWModelDef->getName() << "\n");1098SchedClasses[OldSCIdx].InstRWs.push_back(InstRWDef);1099continue;1100}1101}1102}1103unsigned SCIdx = SchedClasses.size();1104SchedClasses.emplace_back(SCIdx, createSchedClassName(InstDefs), nullptr);1105CodeGenSchedClass &SC = SchedClasses.back();1106LLVM_DEBUG(dbgs() << "InstRW: New SC " << SCIdx << ":" << SC.Name << " on "1107<< InstRWDef->getValueAsDef("SchedModel")->getName()1108<< "\n");11091110// Preserve ItinDef and Writes/Reads for processors without an InstRW entry.1111SC.ItinClassDef = SchedClasses[OldSCIdx].ItinClassDef;1112SC.Writes = SchedClasses[OldSCIdx].Writes;1113SC.Reads = SchedClasses[OldSCIdx].Reads;1114SC.ProcIndices.push_back(0);1115// If we had an old class, copy it's InstRWs to this new class.1116if (OldSCIdx) {1117Record *RWModelDef = InstRWDef->getValueAsDef("SchedModel");1118for (Record *OldRWDef : SchedClasses[OldSCIdx].InstRWs) {1119if (OldRWDef->getValueAsDef("SchedModel") == RWModelDef) {1120assert(!InstDefs.empty()); // Checked at function start.1121PrintError(1122InstRWDef->getLoc(),1123"Overlapping InstRW definition for \"" +1124InstDefs.front()->getName() + "\" also matches previous \"" +1125OldRWDef->getValue("Instrs")->getValue()->getAsString() +1126"\".");1127PrintFatalNote(OldRWDef->getLoc(), "Previous match was here.");1128}1129assert(OldRWDef != InstRWDef && "SchedClass has duplicate InstRW def");1130SC.InstRWs.push_back(OldRWDef);1131}1132}1133// Map each Instr to this new class.1134for (Record *InstDef : InstDefs)1135InstrClassMap[InstDef] = SCIdx;1136SC.InstRWs.push_back(InstRWDef);1137}1138}11391140// True if collectProcItins found anything.1141bool CodeGenSchedModels::hasItineraries() const {1142for (const CodeGenProcModel &PM :1143make_range(procModelBegin(), procModelEnd()))1144if (PM.hasItineraries())1145return true;1146return false;1147}11481149// Gather the processor itineraries.1150void CodeGenSchedModels::collectProcItins() {1151LLVM_DEBUG(dbgs() << "\n+++ PROBLEM ITINERARIES (collectProcItins) +++\n");1152for (CodeGenProcModel &ProcModel : ProcModels) {1153if (!ProcModel.hasItineraries())1154continue;11551156RecVec ItinRecords = ProcModel.ItinsDef->getValueAsListOfDefs("IID");1157assert(!ItinRecords.empty() && "ProcModel.hasItineraries is incorrect");11581159// Populate ItinDefList with Itinerary records.1160ProcModel.ItinDefList.resize(NumInstrSchedClasses);11611162// Insert each itinerary data record in the correct position within1163// the processor model's ItinDefList.1164for (Record *ItinData : ItinRecords) {1165const Record *ItinDef = ItinData->getValueAsDef("TheClass");1166bool FoundClass = false;11671168for (const CodeGenSchedClass &SC :1169make_range(schedClassBegin(), schedClassEnd())) {1170// Multiple SchedClasses may share an itinerary. Update all of them.1171if (SC.ItinClassDef == ItinDef) {1172ProcModel.ItinDefList[SC.Index] = ItinData;1173FoundClass = true;1174}1175}1176if (!FoundClass) {1177LLVM_DEBUG(dbgs() << ProcModel.ItinsDef->getName()1178<< " missing class for itinerary "1179<< ItinDef->getName() << '\n');1180}1181}1182// Check for missing itinerary entries.1183assert(!ProcModel.ItinDefList[0] && "NoItinerary class can't have rec");1184LLVM_DEBUG(1185for (unsigned i = 1, N = ProcModel.ItinDefList.size(); i < N; ++i) {1186if (!ProcModel.ItinDefList[i])1187dbgs() << ProcModel.ItinsDef->getName()1188<< " missing itinerary for class " << SchedClasses[i].Name1189<< '\n';1190});1191}1192}11931194// Gather the read/write types for each itinerary class.1195void CodeGenSchedModels::collectProcItinRW() {1196RecVec ItinRWDefs = Records.getAllDerivedDefinitions("ItinRW");1197llvm::sort(ItinRWDefs, LessRecord());1198for (Record *RWDef : ItinRWDefs) {1199if (!RWDef->getValueInit("SchedModel")->isComplete())1200PrintFatalError(RWDef->getLoc(), "SchedModel is undefined");1201Record *ModelDef = RWDef->getValueAsDef("SchedModel");1202ProcModelMapTy::const_iterator I = ProcModelMap.find(ModelDef);1203if (I == ProcModelMap.end()) {1204PrintFatalError(RWDef->getLoc(),1205"Undefined SchedMachineModel " + ModelDef->getName());1206}1207ProcModels[I->second].ItinRWDefs.push_back(RWDef);1208}1209}12101211// Gather the unsupported features for processor models.1212void CodeGenSchedModels::collectProcUnsupportedFeatures() {1213for (CodeGenProcModel &ProcModel : ProcModels)1214append_range(1215ProcModel.UnsupportedFeaturesDefs,1216ProcModel.ModelDef->getValueAsListOfDefs("UnsupportedFeatures"));1217}12181219/// Infer new classes from existing classes. In the process, this may create new1220/// SchedWrites from sequences of existing SchedWrites.1221void CodeGenSchedModels::inferSchedClasses() {1222LLVM_DEBUG(1223dbgs() << "\n+++ INFERRING SCHED CLASSES (inferSchedClasses) +++\n");1224LLVM_DEBUG(dbgs() << NumInstrSchedClasses << " instr sched classes.\n");12251226// Visit all existing classes and newly created classes.1227for (unsigned Idx = 0; Idx != SchedClasses.size(); ++Idx) {1228assert(SchedClasses[Idx].Index == Idx && "bad SCIdx");12291230if (SchedClasses[Idx].ItinClassDef)1231inferFromItinClass(SchedClasses[Idx].ItinClassDef, Idx);1232if (!SchedClasses[Idx].InstRWs.empty())1233inferFromInstRWs(Idx);1234if (!SchedClasses[Idx].Writes.empty()) {1235inferFromRW(SchedClasses[Idx].Writes, SchedClasses[Idx].Reads, Idx,1236SchedClasses[Idx].ProcIndices);1237}1238assert(SchedClasses.size() < (NumInstrSchedClasses * 6) &&1239"too many SchedVariants");1240}1241}12421243/// Infer classes from per-processor itinerary resources.1244void CodeGenSchedModels::inferFromItinClass(Record *ItinClassDef,1245unsigned FromClassIdx) {1246for (unsigned PIdx = 0, PEnd = ProcModels.size(); PIdx != PEnd; ++PIdx) {1247const CodeGenProcModel &PM = ProcModels[PIdx];1248// For all ItinRW entries.1249bool HasMatch = false;1250for (const Record *Rec : PM.ItinRWDefs) {1251RecVec Matched = Rec->getValueAsListOfDefs("MatchedItinClasses");1252if (!llvm::is_contained(Matched, ItinClassDef))1253continue;1254if (HasMatch)1255PrintFatalError(Rec->getLoc(),1256"Duplicate itinerary class " + ItinClassDef->getName() +1257" in ItinResources for " + PM.ModelName);1258HasMatch = true;1259IdxVec Writes, Reads;1260findRWs(Rec->getValueAsListOfDefs("OperandReadWrites"), Writes, Reads);1261inferFromRW(Writes, Reads, FromClassIdx, PIdx);1262}1263}1264}12651266/// Infer classes from per-processor InstReadWrite definitions.1267void CodeGenSchedModels::inferFromInstRWs(unsigned SCIdx) {1268for (unsigned I = 0, E = SchedClasses[SCIdx].InstRWs.size(); I != E; ++I) {1269assert(SchedClasses[SCIdx].InstRWs.size() == E && "InstrRWs was mutated!");1270Record *Rec = SchedClasses[SCIdx].InstRWs[I];1271const RecVec *InstDefs = Sets.expand(Rec);1272RecIter II = InstDefs->begin(), IE = InstDefs->end();1273for (; II != IE; ++II) {1274if (InstrClassMap[*II] == SCIdx)1275break;1276}1277// If this class no longer has any instructions mapped to it, it has become1278// irrelevant.1279if (II == IE)1280continue;1281IdxVec Writes, Reads;1282findRWs(Rec->getValueAsListOfDefs("OperandReadWrites"), Writes, Reads);1283unsigned PIdx = getProcModel(Rec->getValueAsDef("SchedModel")).Index;1284inferFromRW(Writes, Reads, SCIdx, PIdx); // May mutate SchedClasses.1285SchedClasses[SCIdx].InstRWProcIndices.insert(PIdx);1286}1287}12881289namespace {12901291// Helper for substituteVariantOperand.1292struct TransVariant {1293Record *VarOrSeqDef; // Variant or sequence.1294unsigned RWIdx; // Index of this variant or sequence's matched type.1295unsigned ProcIdx; // Processor model index or zero for any.1296unsigned TransVecIdx; // Index into PredTransitions::TransVec.12971298TransVariant(Record *def, unsigned rwi, unsigned pi, unsigned ti)1299: VarOrSeqDef(def), RWIdx(rwi), ProcIdx(pi), TransVecIdx(ti) {}1300};13011302// Associate a predicate with the SchedReadWrite that it guards.1303// RWIdx is the index of the read/write variant.1304struct PredCheck {1305bool IsRead;1306unsigned RWIdx;1307Record *Predicate;13081309PredCheck(bool r, unsigned w, Record *p)1310: IsRead(r), RWIdx(w), Predicate(p) {}1311};13121313// A Predicate transition is a list of RW sequences guarded by a PredTerm.1314struct PredTransition {1315// A predicate term is a conjunction of PredChecks.1316SmallVector<PredCheck, 4> PredTerm;1317SmallVector<SmallVector<unsigned, 4>, 16> WriteSequences;1318SmallVector<SmallVector<unsigned, 4>, 16> ReadSequences;1319unsigned ProcIndex = 0;13201321PredTransition() = default;1322PredTransition(ArrayRef<PredCheck> PT, unsigned ProcId) {1323PredTerm.assign(PT.begin(), PT.end());1324ProcIndex = ProcId;1325}1326};13271328// Encapsulate a set of partially constructed transitions.1329// The results are built by repeated calls to substituteVariants.1330class PredTransitions {1331CodeGenSchedModels &SchedModels;13321333public:1334std::vector<PredTransition> TransVec;13351336PredTransitions(CodeGenSchedModels &sm) : SchedModels(sm) {}13371338bool substituteVariantOperand(const SmallVectorImpl<unsigned> &RWSeq,1339bool IsRead, unsigned StartIdx);13401341bool substituteVariants(const PredTransition &Trans);13421343#ifndef NDEBUG1344void dump() const;1345#endif13461347private:1348bool mutuallyExclusive(Record *PredDef, ArrayRef<Record *> Preds,1349ArrayRef<PredCheck> Term);1350void getIntersectingVariants(const CodeGenSchedRW &SchedRW, unsigned TransIdx,1351std::vector<TransVariant> &IntersectingVariants);1352void pushVariant(const TransVariant &VInfo, bool IsRead);1353};13541355} // end anonymous namespace13561357// Return true if this predicate is mutually exclusive with a PredTerm. This1358// degenerates into checking if the predicate is mutually exclusive with any1359// predicate in the Term's conjunction.1360//1361// All predicates associated with a given SchedRW are considered mutually1362// exclusive. This should work even if the conditions expressed by the1363// predicates are not exclusive because the predicates for a given SchedWrite1364// are always checked in the order they are defined in the .td file. Later1365// conditions implicitly negate any prior condition.1366bool PredTransitions::mutuallyExclusive(Record *PredDef,1367ArrayRef<Record *> Preds,1368ArrayRef<PredCheck> Term) {1369for (const PredCheck &PC : Term) {1370if (PC.Predicate == PredDef)1371return false;13721373const CodeGenSchedRW &SchedRW = SchedModels.getSchedRW(PC.RWIdx, PC.IsRead);1374assert(SchedRW.HasVariants && "PredCheck must refer to a SchedVariant");1375RecVec Variants = SchedRW.TheDef->getValueAsListOfDefs("Variants");1376if (any_of(Variants, [PredDef](const Record *R) {1377return R->getValueAsDef("Predicate") == PredDef;1378})) {1379// To check if PredDef is mutually exclusive with PC we also need to1380// check that PC.Predicate is exclusive with all predicates from variant1381// we're expanding. Consider following RW sequence with two variants1382// (1 & 2), where A, B and C are predicates from corresponding SchedVars:1383//1384// 1:A/B - 2:C/B1385//1386// Here C is not mutually exclusive with variant (1), because A doesn't1387// exist in variant (2). This means we have possible transitions from A1388// to C and from A to B, and fully expanded sequence would look like:1389//1390// if (A & C) return ...;1391// if (A & B) return ...;1392// if (B) return ...;1393//1394// Now let's consider another sequence:1395//1396// 1:A/B - 2:A/B1397//1398// Here A in variant (2) is mutually exclusive with variant (1), because1399// A also exists in (2). This means A->B transition is impossible and1400// expanded sequence would look like:1401//1402// if (A) return ...;1403// if (B) return ...;1404if (!llvm::is_contained(Preds, PC.Predicate))1405continue;1406return true;1407}1408}1409return false;1410}14111412static std::vector<Record *> getAllPredicates(ArrayRef<TransVariant> Variants,1413unsigned ProcId) {1414std::vector<Record *> Preds;1415for (auto &Variant : Variants) {1416if (!Variant.VarOrSeqDef->isSubClassOf("SchedVar"))1417continue;1418Preds.push_back(Variant.VarOrSeqDef->getValueAsDef("Predicate"));1419}1420return Preds;1421}14221423// Populate IntersectingVariants with any variants or aliased sequences of the1424// given SchedRW whose processor indices and predicates are not mutually1425// exclusive with the given transition.1426void PredTransitions::getIntersectingVariants(1427const CodeGenSchedRW &SchedRW, unsigned TransIdx,1428std::vector<TransVariant> &IntersectingVariants) {14291430bool GenericRW = false;14311432std::vector<TransVariant> Variants;1433if (SchedRW.HasVariants) {1434unsigned VarProcIdx = 0;1435if (SchedRW.TheDef->getValueInit("SchedModel")->isComplete()) {1436Record *ModelDef = SchedRW.TheDef->getValueAsDef("SchedModel");1437VarProcIdx = SchedModels.getProcModel(ModelDef).Index;1438}1439if (VarProcIdx == 0 || VarProcIdx == TransVec[TransIdx].ProcIndex) {1440// Push each variant. Assign TransVecIdx later.1441const RecVec VarDefs = SchedRW.TheDef->getValueAsListOfDefs("Variants");1442for (Record *VarDef : VarDefs)1443Variants.emplace_back(VarDef, SchedRW.Index, VarProcIdx, 0);1444if (VarProcIdx == 0)1445GenericRW = true;1446}1447}1448for (RecIter AI = SchedRW.Aliases.begin(), AE = SchedRW.Aliases.end();1449AI != AE; ++AI) {1450// If either the SchedAlias itself or the SchedReadWrite that it aliases1451// to is defined within a processor model, constrain all variants to1452// that processor.1453unsigned AliasProcIdx = 0;1454if ((*AI)->getValueInit("SchedModel")->isComplete()) {1455Record *ModelDef = (*AI)->getValueAsDef("SchedModel");1456AliasProcIdx = SchedModels.getProcModel(ModelDef).Index;1457}1458if (AliasProcIdx && AliasProcIdx != TransVec[TransIdx].ProcIndex)1459continue;1460if (!Variants.empty()) {1461const CodeGenProcModel &PM =1462*(SchedModels.procModelBegin() + AliasProcIdx);1463PrintFatalError((*AI)->getLoc(),1464"Multiple variants defined for processor " +1465PM.ModelName +1466" Ensure only one SchedAlias exists per RW.");1467}14681469const CodeGenSchedRW &AliasRW =1470SchedModels.getSchedRW((*AI)->getValueAsDef("AliasRW"));14711472if (AliasRW.HasVariants) {1473const RecVec VarDefs = AliasRW.TheDef->getValueAsListOfDefs("Variants");1474for (Record *VD : VarDefs)1475Variants.emplace_back(VD, AliasRW.Index, AliasProcIdx, 0);1476}1477if (AliasRW.IsSequence)1478Variants.emplace_back(AliasRW.TheDef, SchedRW.Index, AliasProcIdx, 0);1479if (AliasProcIdx == 0)1480GenericRW = true;1481}1482std::vector<Record *> AllPreds =1483getAllPredicates(Variants, TransVec[TransIdx].ProcIndex);1484for (TransVariant &Variant : Variants) {1485// Don't expand variants if the processor models don't intersect.1486// A zero processor index means any processor.1487if (Variant.VarOrSeqDef->isSubClassOf("SchedVar")) {1488Record *PredDef = Variant.VarOrSeqDef->getValueAsDef("Predicate");1489if (mutuallyExclusive(PredDef, AllPreds, TransVec[TransIdx].PredTerm))1490continue;1491}14921493if (IntersectingVariants.empty()) {1494// The first variant builds on the existing transition.1495Variant.TransVecIdx = TransIdx;1496IntersectingVariants.push_back(Variant);1497} else {1498// Push another copy of the current transition for more variants.1499Variant.TransVecIdx = TransVec.size();1500IntersectingVariants.push_back(Variant);1501TransVec.push_back(TransVec[TransIdx]);1502}1503}1504if (GenericRW && IntersectingVariants.empty()) {1505PrintFatalError(SchedRW.TheDef->getLoc(),1506"No variant of this type has "1507"a matching predicate on any processor");1508}1509}15101511// Push the Reads/Writes selected by this variant onto the PredTransition1512// specified by VInfo.1513void PredTransitions::pushVariant(const TransVariant &VInfo, bool IsRead) {1514PredTransition &Trans = TransVec[VInfo.TransVecIdx];15151516// If this operand transition is reached through a processor-specific alias,1517// then the whole transition is specific to this processor.1518IdxVec SelectedRWs;1519if (VInfo.VarOrSeqDef->isSubClassOf("SchedVar")) {1520Record *PredDef = VInfo.VarOrSeqDef->getValueAsDef("Predicate");1521Trans.PredTerm.emplace_back(IsRead, VInfo.RWIdx, PredDef);1522RecVec SelectedDefs = VInfo.VarOrSeqDef->getValueAsListOfDefs("Selected");1523SchedModels.findRWs(SelectedDefs, SelectedRWs, IsRead);1524} else {1525assert(VInfo.VarOrSeqDef->isSubClassOf("WriteSequence") &&1526"variant must be a SchedVariant or aliased WriteSequence");1527SelectedRWs.push_back(SchedModels.getSchedRWIdx(VInfo.VarOrSeqDef, IsRead));1528}15291530const CodeGenSchedRW &SchedRW = SchedModels.getSchedRW(VInfo.RWIdx, IsRead);15311532SmallVectorImpl<SmallVector<unsigned, 4>> &RWSequences =1533IsRead ? Trans.ReadSequences : Trans.WriteSequences;1534if (SchedRW.IsVariadic) {1535unsigned OperIdx = RWSequences.size() - 1;1536// Make N-1 copies of this transition's last sequence.1537RWSequences.reserve(RWSequences.size() + SelectedRWs.size() - 1);1538RWSequences.insert(RWSequences.end(), SelectedRWs.size() - 1,1539RWSequences[OperIdx]);1540// Push each of the N elements of the SelectedRWs onto a copy of the last1541// sequence (split the current operand into N operands).1542// Note that write sequences should be expanded within this loop--the entire1543// sequence belongs to a single operand.1544for (IdxIter RWI = SelectedRWs.begin(), RWE = SelectedRWs.end(); RWI != RWE;1545++RWI, ++OperIdx) {1546IdxVec ExpandedRWs;1547if (IsRead)1548ExpandedRWs.push_back(*RWI);1549else1550SchedModels.expandRWSequence(*RWI, ExpandedRWs, IsRead);1551llvm::append_range(RWSequences[OperIdx], ExpandedRWs);1552}1553assert(OperIdx == RWSequences.size() && "missed a sequence");1554} else {1555// Push this transition's expanded sequence onto this transition's last1556// sequence (add to the current operand's sequence).1557SmallVectorImpl<unsigned> &Seq = RWSequences.back();1558IdxVec ExpandedRWs;1559for (unsigned int SelectedRW : SelectedRWs) {1560if (IsRead)1561ExpandedRWs.push_back(SelectedRW);1562else1563SchedModels.expandRWSequence(SelectedRW, ExpandedRWs, IsRead);1564}1565llvm::append_range(Seq, ExpandedRWs);1566}1567}15681569// RWSeq is a sequence of all Reads or all Writes for the next read or write1570// operand. StartIdx is an index into TransVec where partial results1571// starts. RWSeq must be applied to all transitions between StartIdx and the end1572// of TransVec.1573bool PredTransitions::substituteVariantOperand(1574const SmallVectorImpl<unsigned> &RWSeq, bool IsRead, unsigned StartIdx) {1575bool Subst = false;1576// Visit each original RW within the current sequence.1577for (unsigned int RWI : RWSeq) {1578const CodeGenSchedRW &SchedRW = SchedModels.getSchedRW(RWI, IsRead);1579// Push this RW on all partial PredTransitions or distribute variants.1580// New PredTransitions may be pushed within this loop which should not be1581// revisited (TransEnd must be loop invariant).1582for (unsigned TransIdx = StartIdx, TransEnd = TransVec.size();1583TransIdx != TransEnd; ++TransIdx) {1584// Distribute this partial PredTransition across intersecting variants.1585// This will push a copies of TransVec[TransIdx] on the back of TransVec.1586std::vector<TransVariant> IntersectingVariants;1587getIntersectingVariants(SchedRW, TransIdx, IntersectingVariants);1588// Now expand each variant on top of its copy of the transition.1589for (const TransVariant &IV : IntersectingVariants)1590pushVariant(IV, IsRead);1591if (IntersectingVariants.empty()) {1592if (IsRead)1593TransVec[TransIdx].ReadSequences.back().push_back(RWI);1594else1595TransVec[TransIdx].WriteSequences.back().push_back(RWI);1596continue;1597} else {1598Subst = true;1599}1600}1601}1602return Subst;1603}16041605// For each variant of a Read/Write in Trans, substitute the sequence of1606// Read/Writes guarded by the variant. This is exponential in the number of1607// variant Read/Writes, but in practice detection of mutually exclusive1608// predicates should result in linear growth in the total number variants.1609//1610// This is one step in a breadth-first search of nested variants.1611bool PredTransitions::substituteVariants(const PredTransition &Trans) {1612// Build up a set of partial results starting at the back of1613// PredTransitions. Remember the first new transition.1614unsigned StartIdx = TransVec.size();1615bool Subst = false;1616assert(Trans.ProcIndex != 0);1617TransVec.emplace_back(Trans.PredTerm, Trans.ProcIndex);16181619// Visit each original write sequence.1620for (const auto &WriteSequence : Trans.WriteSequences) {1621// Push a new (empty) write sequence onto all partial Transitions.1622for (std::vector<PredTransition>::iterator I = TransVec.begin() + StartIdx,1623E = TransVec.end();1624I != E; ++I) {1625I->WriteSequences.emplace_back();1626}1627Subst |=1628substituteVariantOperand(WriteSequence, /*IsRead=*/false, StartIdx);1629}1630// Visit each original read sequence.1631for (const auto &ReadSequence : Trans.ReadSequences) {1632// Push a new (empty) read sequence onto all partial Transitions.1633for (std::vector<PredTransition>::iterator I = TransVec.begin() + StartIdx,1634E = TransVec.end();1635I != E; ++I) {1636I->ReadSequences.emplace_back();1637}1638Subst |= substituteVariantOperand(ReadSequence, /*IsRead=*/true, StartIdx);1639}1640return Subst;1641}16421643static void addSequences(CodeGenSchedModels &SchedModels,1644const SmallVectorImpl<SmallVector<unsigned, 4>> &Seqs,1645IdxVec &Result, bool IsRead) {1646for (const auto &S : Seqs)1647if (!S.empty())1648Result.push_back(SchedModels.findOrInsertRW(S, IsRead));1649}16501651#ifndef NDEBUG1652static void dumpRecVec(const RecVec &RV) {1653for (const Record *R : RV)1654dbgs() << R->getName() << ", ";1655}1656#endif16571658static void dumpTransition(const CodeGenSchedModels &SchedModels,1659const CodeGenSchedClass &FromSC,1660const CodeGenSchedTransition &SCTrans,1661const RecVec &Preds) {1662LLVM_DEBUG(dbgs() << "Adding transition from " << FromSC.Name << "("1663<< FromSC.Index << ") to "1664<< SchedModels.getSchedClass(SCTrans.ToClassIdx).Name << "("1665<< SCTrans.ToClassIdx << ") on pred term: (";1666dumpRecVec(Preds);1667dbgs() << ") on processor (" << SCTrans.ProcIndex << ")\n");1668}1669// Create a new SchedClass for each variant found by inferFromRW. Pass1670static void inferFromTransitions(ArrayRef<PredTransition> LastTransitions,1671unsigned FromClassIdx,1672CodeGenSchedModels &SchedModels) {1673// For each PredTransition, create a new CodeGenSchedTransition, which usually1674// requires creating a new SchedClass.1675for (const auto &LastTransition : LastTransitions) {1676// Variant expansion (substituteVariants) may create unconditional1677// transitions. We don't need to build sched classes for them.1678if (LastTransition.PredTerm.empty())1679continue;1680IdxVec OperWritesVariant, OperReadsVariant;1681addSequences(SchedModels, LastTransition.WriteSequences, OperWritesVariant,1682false);1683addSequences(SchedModels, LastTransition.ReadSequences, OperReadsVariant,1684true);1685CodeGenSchedTransition SCTrans;16861687// Transition should not contain processor indices already assigned to1688// InstRWs in this scheduling class.1689const CodeGenSchedClass &FromSC = SchedModels.getSchedClass(FromClassIdx);1690if (FromSC.InstRWProcIndices.count(LastTransition.ProcIndex))1691continue;1692SCTrans.ProcIndex = LastTransition.ProcIndex;1693SCTrans.ToClassIdx =1694SchedModels.addSchedClass(/*ItinClassDef=*/nullptr, OperWritesVariant,1695OperReadsVariant, LastTransition.ProcIndex);16961697// The final PredTerm is unique set of predicates guarding the transition.1698RecVec Preds;1699transform(LastTransition.PredTerm, std::back_inserter(Preds),1700[](const PredCheck &P) { return P.Predicate; });1701Preds.erase(llvm::unique(Preds), Preds.end());1702dumpTransition(SchedModels, FromSC, SCTrans, Preds);1703SCTrans.PredTerm = std::move(Preds);1704SchedModels.getSchedClass(FromClassIdx)1705.Transitions.push_back(std::move(SCTrans));1706}1707}17081709std::vector<unsigned> CodeGenSchedModels::getAllProcIndices() const {1710std::vector<unsigned> ProcIdVec;1711for (const auto &PM : ProcModelMap)1712if (PM.second != 0)1713ProcIdVec.push_back(PM.second);1714// The order of the keys (Record pointers) of ProcModelMap are not stable.1715// Sort to stabalize the values.1716llvm::sort(ProcIdVec);1717return ProcIdVec;1718}17191720static std::vector<PredTransition>1721makePerProcessorTransitions(const PredTransition &Trans,1722ArrayRef<unsigned> ProcIndices) {1723std::vector<PredTransition> PerCpuTransVec;1724for (unsigned ProcId : ProcIndices) {1725assert(ProcId != 0);1726PerCpuTransVec.push_back(Trans);1727PerCpuTransVec.back().ProcIndex = ProcId;1728}1729return PerCpuTransVec;1730}17311732// Create new SchedClasses for the given ReadWrite list. If any of the1733// ReadWrites refers to a SchedVariant, create a new SchedClass for each variant1734// of the ReadWrite list, following Aliases if necessary.1735void CodeGenSchedModels::inferFromRW(ArrayRef<unsigned> OperWrites,1736ArrayRef<unsigned> OperReads,1737unsigned FromClassIdx,1738ArrayRef<unsigned> ProcIndices) {1739LLVM_DEBUG(dbgs() << "INFER RW proc("; dumpIdxVec(ProcIndices);1740dbgs() << ") ");1741// Create a seed transition with an empty PredTerm and the expanded sequences1742// of SchedWrites for the current SchedClass.1743std::vector<PredTransition> LastTransitions;1744LastTransitions.emplace_back();17451746for (unsigned WriteIdx : OperWrites) {1747IdxVec WriteSeq;1748expandRWSequence(WriteIdx, WriteSeq, /*IsRead=*/false);1749LastTransitions[0].WriteSequences.emplace_back();1750SmallVectorImpl<unsigned> &Seq = LastTransitions[0].WriteSequences.back();1751Seq.append(WriteSeq.begin(), WriteSeq.end());1752LLVM_DEBUG(dbgs() << "("; dumpIdxVec(Seq); dbgs() << ") ");1753}1754LLVM_DEBUG(dbgs() << " Reads: ");1755for (unsigned ReadIdx : OperReads) {1756IdxVec ReadSeq;1757expandRWSequence(ReadIdx, ReadSeq, /*IsRead=*/true);1758LastTransitions[0].ReadSequences.emplace_back();1759SmallVectorImpl<unsigned> &Seq = LastTransitions[0].ReadSequences.back();1760Seq.append(ReadSeq.begin(), ReadSeq.end());1761LLVM_DEBUG(dbgs() << "("; dumpIdxVec(Seq); dbgs() << ") ");1762}1763LLVM_DEBUG(dbgs() << '\n');17641765LastTransitions = makePerProcessorTransitions(1766LastTransitions[0], llvm::is_contained(ProcIndices, 0)1767? ArrayRef<unsigned>(getAllProcIndices())1768: ProcIndices);1769// Collect all PredTransitions for individual operands.1770// Iterate until no variant writes remain.1771bool SubstitutedAny;1772do {1773SubstitutedAny = false;1774PredTransitions Transitions(*this);1775for (const PredTransition &Trans : LastTransitions)1776SubstitutedAny |= Transitions.substituteVariants(Trans);1777LLVM_DEBUG(Transitions.dump());1778LastTransitions = std::move(Transitions.TransVec);1779} while (SubstitutedAny);17801781// WARNING: We are about to mutate the SchedClasses vector. Do not refer to1782// OperWrites, OperReads, or ProcIndices after calling inferFromTransitions.1783inferFromTransitions(LastTransitions, FromClassIdx, *this);1784}17851786// Check if any processor resource group contains all resource records in1787// SubUnits.1788bool CodeGenSchedModels::hasSuperGroup(RecVec &SubUnits, CodeGenProcModel &PM) {1789for (Record *ProcResourceDef : PM.ProcResourceDefs) {1790if (!ProcResourceDef->isSubClassOf("ProcResGroup"))1791continue;1792RecVec SuperUnits = ProcResourceDef->getValueAsListOfDefs("Resources");1793RecIter RI = SubUnits.begin(), RE = SubUnits.end();1794for (; RI != RE; ++RI) {1795if (!is_contained(SuperUnits, *RI)) {1796break;1797}1798}1799if (RI == RE)1800return true;1801}1802return false;1803}18041805// Verify that overlapping groups have a common supergroup.1806void CodeGenSchedModels::verifyProcResourceGroups(CodeGenProcModel &PM) {1807for (unsigned i = 0, e = PM.ProcResourceDefs.size(); i < e; ++i) {1808if (!PM.ProcResourceDefs[i]->isSubClassOf("ProcResGroup"))1809continue;1810RecVec CheckUnits =1811PM.ProcResourceDefs[i]->getValueAsListOfDefs("Resources");1812for (unsigned j = i + 1; j < e; ++j) {1813if (!PM.ProcResourceDefs[j]->isSubClassOf("ProcResGroup"))1814continue;1815RecVec OtherUnits =1816PM.ProcResourceDefs[j]->getValueAsListOfDefs("Resources");1817if (std::find_first_of(CheckUnits.begin(), CheckUnits.end(),1818OtherUnits.begin(),1819OtherUnits.end()) != CheckUnits.end()) {1820// CheckUnits and OtherUnits overlap1821llvm::append_range(OtherUnits, CheckUnits);1822if (!hasSuperGroup(OtherUnits, PM)) {1823PrintFatalError((PM.ProcResourceDefs[i])->getLoc(),1824"proc resource group overlaps with " +1825PM.ProcResourceDefs[j]->getName() +1826" but no supergroup contains both.");1827}1828}1829}1830}1831}18321833// Collect all the RegisterFile definitions available in this target.1834void CodeGenSchedModels::collectRegisterFiles() {1835RecVec RegisterFileDefs = Records.getAllDerivedDefinitions("RegisterFile");18361837// RegisterFiles is the vector of CodeGenRegisterFile.1838for (Record *RF : RegisterFileDefs) {1839// For each register file definition, construct a CodeGenRegisterFile object1840// and add it to the appropriate scheduling model.1841CodeGenProcModel &PM = getProcModel(RF->getValueAsDef("SchedModel"));1842PM.RegisterFiles.emplace_back(CodeGenRegisterFile(RF->getName(), RF));1843CodeGenRegisterFile &CGRF = PM.RegisterFiles.back();1844CGRF.MaxMovesEliminatedPerCycle =1845RF->getValueAsInt("MaxMovesEliminatedPerCycle");1846CGRF.AllowZeroMoveEliminationOnly =1847RF->getValueAsBit("AllowZeroMoveEliminationOnly");18481849// Now set the number of physical registers as well as the cost of registers1850// in each register class.1851CGRF.NumPhysRegs = RF->getValueAsInt("NumPhysRegs");1852if (!CGRF.NumPhysRegs) {1853PrintFatalError(RF->getLoc(),1854"Invalid RegisterFile with zero physical registers");1855}18561857RecVec RegisterClasses = RF->getValueAsListOfDefs("RegClasses");1858std::vector<int64_t> RegisterCosts = RF->getValueAsListOfInts("RegCosts");1859ListInit *MoveElimInfo = RF->getValueAsListInit("AllowMoveElimination");1860for (unsigned I = 0, E = RegisterClasses.size(); I < E; ++I) {1861int Cost = RegisterCosts.size() > I ? RegisterCosts[I] : 1;18621863bool AllowMoveElim = false;1864if (MoveElimInfo->size() > I) {1865BitInit *Val = cast<BitInit>(MoveElimInfo->getElement(I));1866AllowMoveElim = Val->getValue();1867}18681869CGRF.Costs.emplace_back(RegisterClasses[I], Cost, AllowMoveElim);1870}1871}1872}18731874// Collect and sort WriteRes, ReadAdvance, and ProcResources.1875void CodeGenSchedModels::collectProcResources() {1876ProcResourceDefs = Records.getAllDerivedDefinitions("ProcResourceUnits");1877ProcResGroups = Records.getAllDerivedDefinitions("ProcResGroup");18781879// Add any subtarget-specific SchedReadWrites that are directly associated1880// with processor resources. Refer to the parent SchedClass's ProcIndices to1881// determine which processors they apply to.1882for (const CodeGenSchedClass &SC :1883make_range(schedClassBegin(), schedClassEnd())) {1884if (SC.ItinClassDef) {1885collectItinProcResources(SC.ItinClassDef);1886continue;1887}18881889// This class may have a default ReadWrite list which can be overriden by1890// InstRW definitions.1891for (Record *RW : SC.InstRWs) {1892Record *RWModelDef = RW->getValueAsDef("SchedModel");1893unsigned PIdx = getProcModel(RWModelDef).Index;1894IdxVec Writes, Reads;1895findRWs(RW->getValueAsListOfDefs("OperandReadWrites"), Writes, Reads);1896collectRWResources(Writes, Reads, PIdx);1897}18981899collectRWResources(SC.Writes, SC.Reads, SC.ProcIndices);1900}1901// Add resources separately defined by each subtarget.1902RecVec WRDefs = Records.getAllDerivedDefinitions("WriteRes");1903for (Record *WR : WRDefs) {1904Record *ModelDef = WR->getValueAsDef("SchedModel");1905addWriteRes(WR, getProcModel(ModelDef).Index);1906}1907RecVec SWRDefs = Records.getAllDerivedDefinitions("SchedWriteRes");1908for (Record *SWR : SWRDefs) {1909Record *ModelDef = SWR->getValueAsDef("SchedModel");1910addWriteRes(SWR, getProcModel(ModelDef).Index);1911}1912RecVec RADefs = Records.getAllDerivedDefinitions("ReadAdvance");1913for (Record *RA : RADefs) {1914Record *ModelDef = RA->getValueAsDef("SchedModel");1915addReadAdvance(RA, getProcModel(ModelDef).Index);1916}1917RecVec SRADefs = Records.getAllDerivedDefinitions("SchedReadAdvance");1918for (Record *SRA : SRADefs) {1919if (SRA->getValueInit("SchedModel")->isComplete()) {1920Record *ModelDef = SRA->getValueAsDef("SchedModel");1921addReadAdvance(SRA, getProcModel(ModelDef).Index);1922}1923}1924// Add ProcResGroups that are defined within this processor model, which may1925// not be directly referenced but may directly specify a buffer size.1926RecVec ProcResGroups = Records.getAllDerivedDefinitions("ProcResGroup");1927for (Record *PRG : ProcResGroups) {1928if (!PRG->getValueInit("SchedModel")->isComplete())1929continue;1930CodeGenProcModel &PM = getProcModel(PRG->getValueAsDef("SchedModel"));1931if (!is_contained(PM.ProcResourceDefs, PRG))1932PM.ProcResourceDefs.push_back(PRG);1933}1934// Add ProcResourceUnits unconditionally.1935for (Record *PRU : Records.getAllDerivedDefinitions("ProcResourceUnits")) {1936if (!PRU->getValueInit("SchedModel")->isComplete())1937continue;1938CodeGenProcModel &PM = getProcModel(PRU->getValueAsDef("SchedModel"));1939if (!is_contained(PM.ProcResourceDefs, PRU))1940PM.ProcResourceDefs.push_back(PRU);1941}1942// Finalize each ProcModel by sorting the record arrays.1943for (CodeGenProcModel &PM : ProcModels) {1944llvm::sort(PM.WriteResDefs, LessRecord());1945llvm::sort(PM.ReadAdvanceDefs, LessRecord());1946llvm::sort(PM.ProcResourceDefs, LessRecord());1947LLVM_DEBUG(1948PM.dump(); dbgs() << "WriteResDefs: "; for (auto WriteResDef1949: PM.WriteResDefs) {1950if (WriteResDef->isSubClassOf("WriteRes"))1951dbgs() << WriteResDef->getValueAsDef("WriteType")->getName() << " ";1952else1953dbgs() << WriteResDef->getName() << " ";1954} dbgs() << "\nReadAdvanceDefs: ";1955for (Record *ReadAdvanceDef1956: PM.ReadAdvanceDefs) {1957if (ReadAdvanceDef->isSubClassOf("ReadAdvance"))1958dbgs() << ReadAdvanceDef->getValueAsDef("ReadType")->getName()1959<< " ";1960else1961dbgs() << ReadAdvanceDef->getName() << " ";1962} dbgs()1963<< "\nProcResourceDefs: ";1964for (Record *ProcResourceDef1965: PM.ProcResourceDefs) {1966dbgs() << ProcResourceDef->getName() << " ";1967} dbgs()1968<< '\n');1969verifyProcResourceGroups(PM);1970}19711972ProcResourceDefs.clear();1973ProcResGroups.clear();1974}19751976void CodeGenSchedModels::checkCompleteness() {1977bool Complete = true;1978for (const CodeGenProcModel &ProcModel : procModels()) {1979const bool HasItineraries = ProcModel.hasItineraries();1980if (!ProcModel.ModelDef->getValueAsBit("CompleteModel"))1981continue;1982for (const CodeGenInstruction *Inst : Target.getInstructionsByEnumValue()) {1983if (Inst->hasNoSchedulingInfo)1984continue;1985if (ProcModel.isUnsupported(*Inst))1986continue;1987unsigned SCIdx = getSchedClassIdx(*Inst);1988if (!SCIdx) {1989if (Inst->TheDef->isValueUnset("SchedRW")) {1990PrintError(Inst->TheDef->getLoc(),1991"No schedule information for instruction '" +1992Inst->TheDef->getName() + "' in SchedMachineModel '" +1993ProcModel.ModelDef->getName() + "'");1994Complete = false;1995}1996continue;1997}19981999const CodeGenSchedClass &SC = getSchedClass(SCIdx);2000if (!SC.Writes.empty())2001continue;2002if (HasItineraries && SC.ItinClassDef != nullptr &&2003SC.ItinClassDef->getName() != "NoItinerary")2004continue;20052006const RecVec &InstRWs = SC.InstRWs;2007auto I = find_if(InstRWs, [&ProcModel](const Record *R) {2008return R->getValueAsDef("SchedModel") == ProcModel.ModelDef;2009});2010if (I == InstRWs.end()) {2011PrintError(Inst->TheDef->getLoc(), "'" + ProcModel.ModelName +2012"' lacks information for '" +2013Inst->TheDef->getName() + "'");2014Complete = false;2015}2016}2017}2018if (!Complete) {2019errs()2020<< "\n\nIncomplete schedule models found.\n"2021<< "- Consider setting 'CompleteModel = 0' while developing new "2022"models.\n"2023<< "- Pseudo instructions can be marked with 'hasNoSchedulingInfo = "2024"1'.\n"2025<< "- Instructions should usually have Sched<[...]> as a superclass, "2026"you may temporarily use an empty list.\n"2027<< "- Instructions related to unsupported features can be excluded "2028"with "2029"list<Predicate> UnsupportedFeatures = [HasA,..,HasY]; in the "2030"processor model.\n\n";2031PrintFatalError("Incomplete schedule model");2032}2033}20342035// Collect itinerary class resources for each processor.2036void CodeGenSchedModels::collectItinProcResources(Record *ItinClassDef) {2037for (unsigned PIdx = 0, PEnd = ProcModels.size(); PIdx != PEnd; ++PIdx) {2038const CodeGenProcModel &PM = ProcModels[PIdx];2039// For all ItinRW entries.2040bool HasMatch = false;2041for (RecIter II = PM.ItinRWDefs.begin(), IE = PM.ItinRWDefs.end(); II != IE;2042++II) {2043RecVec Matched = (*II)->getValueAsListOfDefs("MatchedItinClasses");2044if (!llvm::is_contained(Matched, ItinClassDef))2045continue;2046if (HasMatch)2047PrintFatalError((*II)->getLoc(),2048"Duplicate itinerary class " + ItinClassDef->getName() +2049" in ItinResources for " + PM.ModelName);2050HasMatch = true;2051IdxVec Writes, Reads;2052findRWs((*II)->getValueAsListOfDefs("OperandReadWrites"), Writes, Reads);2053collectRWResources(Writes, Reads, PIdx);2054}2055}2056}20572058void CodeGenSchedModels::collectRWResources(unsigned RWIdx, bool IsRead,2059ArrayRef<unsigned> ProcIndices) {2060const CodeGenSchedRW &SchedRW = getSchedRW(RWIdx, IsRead);2061if (SchedRW.TheDef) {2062if (!IsRead && SchedRW.TheDef->isSubClassOf("SchedWriteRes")) {2063for (unsigned Idx : ProcIndices)2064addWriteRes(SchedRW.TheDef, Idx);2065} else if (IsRead && SchedRW.TheDef->isSubClassOf("SchedReadAdvance")) {2066for (unsigned Idx : ProcIndices)2067addReadAdvance(SchedRW.TheDef, Idx);2068}2069}2070for (auto *Alias : SchedRW.Aliases) {2071IdxVec AliasProcIndices;2072if (Alias->getValueInit("SchedModel")->isComplete()) {2073AliasProcIndices.push_back(2074getProcModel(Alias->getValueAsDef("SchedModel")).Index);2075} else2076AliasProcIndices = ProcIndices;2077const CodeGenSchedRW &AliasRW = getSchedRW(Alias->getValueAsDef("AliasRW"));2078assert(AliasRW.IsRead == IsRead && "cannot alias reads to writes");20792080IdxVec ExpandedRWs;2081expandRWSequence(AliasRW.Index, ExpandedRWs, IsRead);2082for (unsigned int ExpandedRW : ExpandedRWs) {2083collectRWResources(ExpandedRW, IsRead, AliasProcIndices);2084}2085}2086}20872088// Collect resources for a set of read/write types and processor indices.2089void CodeGenSchedModels::collectRWResources(ArrayRef<unsigned> Writes,2090ArrayRef<unsigned> Reads,2091ArrayRef<unsigned> ProcIndices) {2092for (unsigned Idx : Writes)2093collectRWResources(Idx, /*IsRead=*/false, ProcIndices);20942095for (unsigned Idx : Reads)2096collectRWResources(Idx, /*IsRead=*/true, ProcIndices);2097}20982099// Find the processor's resource units for this kind of resource.2100Record *CodeGenSchedModels::findProcResUnits(Record *ProcResKind,2101const CodeGenProcModel &PM,2102ArrayRef<SMLoc> Loc) const {2103if (ProcResKind->isSubClassOf("ProcResourceUnits"))2104return ProcResKind;21052106Record *ProcUnitDef = nullptr;2107assert(!ProcResourceDefs.empty());2108assert(!ProcResGroups.empty());21092110for (Record *ProcResDef : ProcResourceDefs) {2111if (ProcResDef->getValueAsDef("Kind") == ProcResKind &&2112ProcResDef->getValueAsDef("SchedModel") == PM.ModelDef) {2113if (ProcUnitDef) {2114PrintFatalError(Loc,2115"Multiple ProcessorResourceUnits associated with " +2116ProcResKind->getName());2117}2118ProcUnitDef = ProcResDef;2119}2120}2121for (Record *ProcResGroup : ProcResGroups) {2122if (ProcResGroup == ProcResKind &&2123ProcResGroup->getValueAsDef("SchedModel") == PM.ModelDef) {2124if (ProcUnitDef) {2125PrintFatalError(Loc,2126"Multiple ProcessorResourceUnits associated with " +2127ProcResKind->getName());2128}2129ProcUnitDef = ProcResGroup;2130}2131}2132if (!ProcUnitDef) {2133PrintFatalError(Loc, "No ProcessorResources associated with " +2134ProcResKind->getName());2135}2136return ProcUnitDef;2137}21382139// Iteratively add a resource and its super resources.2140void CodeGenSchedModels::addProcResource(Record *ProcResKind,2141CodeGenProcModel &PM,2142ArrayRef<SMLoc> Loc) {2143while (true) {2144Record *ProcResUnits = findProcResUnits(ProcResKind, PM, Loc);21452146// See if this ProcResource is already associated with this processor.2147if (is_contained(PM.ProcResourceDefs, ProcResUnits))2148return;21492150PM.ProcResourceDefs.push_back(ProcResUnits);2151if (ProcResUnits->isSubClassOf("ProcResGroup"))2152return;21532154if (!ProcResUnits->getValueInit("Super")->isComplete())2155return;21562157ProcResKind = ProcResUnits->getValueAsDef("Super");2158}2159}21602161// Add resources for a SchedWrite to this processor if they don't exist.2162void CodeGenSchedModels::addWriteRes(Record *ProcWriteResDef, unsigned PIdx) {2163assert(PIdx && "don't add resources to an invalid Processor model");21642165RecVec &WRDefs = ProcModels[PIdx].WriteResDefs;2166if (is_contained(WRDefs, ProcWriteResDef))2167return;2168WRDefs.push_back(ProcWriteResDef);21692170// Visit ProcResourceKinds referenced by the newly discovered WriteRes.2171RecVec ProcResDefs = ProcWriteResDef->getValueAsListOfDefs("ProcResources");2172for (auto *ProcResDef : ProcResDefs) {2173addProcResource(ProcResDef, ProcModels[PIdx], ProcWriteResDef->getLoc());2174}2175}21762177// Add resources for a ReadAdvance to this processor if they don't exist.2178void CodeGenSchedModels::addReadAdvance(Record *ProcReadAdvanceDef,2179unsigned PIdx) {2180for (const Record *ValidWrite :2181ProcReadAdvanceDef->getValueAsListOfDefs("ValidWrites"))2182if (getSchedRWIdx(ValidWrite, /*IsRead=*/false) == 0)2183PrintFatalError(2184ProcReadAdvanceDef->getLoc(),2185"ReadAdvance referencing a ValidWrite that is not used by "2186"any instruction (" +2187ValidWrite->getName() + ")");21882189RecVec &RADefs = ProcModels[PIdx].ReadAdvanceDefs;2190if (is_contained(RADefs, ProcReadAdvanceDef))2191return;2192RADefs.push_back(ProcReadAdvanceDef);2193}21942195unsigned CodeGenProcModel::getProcResourceIdx(Record *PRDef) const {2196RecIter PRPos = find(ProcResourceDefs, PRDef);2197if (PRPos == ProcResourceDefs.end())2198PrintFatalError(PRDef->getLoc(), "ProcResource def is not included in "2199"the ProcResources list for " +2200ModelName);2201// Idx=0 is reserved for invalid.2202return 1 + (PRPos - ProcResourceDefs.begin());2203}22042205bool CodeGenProcModel::isUnsupported(const CodeGenInstruction &Inst) const {2206for (const Record *TheDef : UnsupportedFeaturesDefs) {2207for (const Record *PredDef :2208Inst.TheDef->getValueAsListOfDefs("Predicates")) {2209if (TheDef->getName() == PredDef->getName())2210return true;2211}2212}2213return false;2214}22152216bool CodeGenProcModel::hasReadOfWrite(Record *WriteDef) const {2217for (auto &RADef : ReadAdvanceDefs) {2218RecVec ValidWrites = RADef->getValueAsListOfDefs("ValidWrites");2219if (is_contained(ValidWrites, WriteDef))2220return true;2221}2222return false;2223}22242225#ifndef NDEBUG2226void CodeGenProcModel::dump() const {2227dbgs() << Index << ": " << ModelName << " "2228<< (ModelDef ? ModelDef->getName() : "inferred") << " "2229<< (ItinsDef ? ItinsDef->getName() : "no itinerary") << '\n';2230}22312232void CodeGenSchedRW::dump() const {2233dbgs() << Name << (IsVariadic ? " (V) " : " ");2234if (IsSequence) {2235dbgs() << "(";2236dumpIdxVec(Sequence);2237dbgs() << ")";2238}2239}22402241void CodeGenSchedClass::dump(const CodeGenSchedModels *SchedModels) const {2242dbgs() << "SCHEDCLASS " << Index << ":" << Name << '\n' << " Writes: ";2243for (unsigned i = 0, N = Writes.size(); i < N; ++i) {2244SchedModels->getSchedWrite(Writes[i]).dump();2245if (i < N - 1) {2246dbgs() << '\n';2247dbgs().indent(10);2248}2249}2250dbgs() << "\n Reads: ";2251for (unsigned i = 0, N = Reads.size(); i < N; ++i) {2252SchedModels->getSchedRead(Reads[i]).dump();2253if (i < N - 1) {2254dbgs() << '\n';2255dbgs().indent(10);2256}2257}2258dbgs() << "\n ProcIdx: ";2259dumpIdxVec(ProcIndices);2260if (!Transitions.empty()) {2261dbgs() << "\n Transitions for Proc ";2262for (const CodeGenSchedTransition &Transition : Transitions) {2263dbgs() << Transition.ProcIndex << ", ";2264}2265}2266dbgs() << '\n';2267}22682269void PredTransitions::dump() const {2270dbgs() << "Expanded Variants:\n";2271for (const auto &TI : TransVec) {2272dbgs() << "{";2273ListSeparator LS;2274for (const PredCheck &PC : TI.PredTerm)2275dbgs() << LS << SchedModels.getSchedRW(PC.RWIdx, PC.IsRead).Name << ":"2276<< PC.Predicate->getName();2277dbgs() << "},\n => {";2278for (SmallVectorImpl<SmallVector<unsigned, 4>>::const_iterator2279WSI = TI.WriteSequences.begin(),2280WSE = TI.WriteSequences.end();2281WSI != WSE; ++WSI) {2282dbgs() << "(";2283ListSeparator LS;2284for (unsigned N : *WSI)2285dbgs() << LS << SchedModels.getSchedWrite(N).Name;2286dbgs() << "),";2287}2288dbgs() << "}\n";2289}2290}2291#endif // NDEBUG229222932294