diff --git a/llvm/include/llvm/CodeGen/MachinePipeliner.h b/llvm/include/llvm/CodeGen/MachinePipeliner.h index c90ff4f3daa47..298ce32702d41 100644 --- a/llvm/include/llvm/CodeGen/MachinePipeliner.h +++ b/llvm/include/llvm/CodeGen/MachinePipeliner.h @@ -74,7 +74,7 @@ class MachinePipeliner : public MachineFunctionPass { const MachineDominatorTree *MDT = nullptr; const InstrItineraryData *InstrItins = nullptr; const TargetInstrInfo *TII = nullptr; - RegisterClassInfo RegClassInfo; + RegisterClassInfo *RegClassInfo = nullptr; bool disabledByPragma = false; unsigned II_setByPragma = 0; diff --git a/llvm/include/llvm/CodeGen/MachineScheduler.h b/llvm/include/llvm/CodeGen/MachineScheduler.h index 7b965d400ed08..b7cfc4b7e78b6 100644 --- a/llvm/include/llvm/CodeGen/MachineScheduler.h +++ b/llvm/include/llvm/CodeGen/MachineScheduler.h @@ -147,13 +147,7 @@ struct LLVM_ABI MachineSchedContext { const TargetMachine *TM = nullptr; AAResults *AA = nullptr; LiveIntervals *LIS = nullptr; - RegisterClassInfo *RegClassInfo; - - MachineSchedContext(); - MachineSchedContext &operator=(const MachineSchedContext &other) = delete; - MachineSchedContext(const MachineSchedContext &other) = delete; - virtual ~MachineSchedContext(); }; /// MachineSchedRegistry provides a selection of available machine instruction diff --git a/llvm/include/llvm/CodeGen/RegisterClassInfo.h b/llvm/include/llvm/CodeGen/RegisterClassInfo.h index 124c7aff8c76d..add3cb49913ab 100644 --- a/llvm/include/llvm/CodeGen/RegisterClassInfo.h +++ b/llvm/include/llvm/CodeGen/RegisterClassInfo.h @@ -19,6 +19,8 @@ #include "llvm/ADT/ArrayRef.h" #include "llvm/ADT/BitVector.h" #include "llvm/ADT/SmallVector.h" +#include "llvm/CodeGen/MachineFunctionPass.h" +#include "llvm/CodeGen/MachinePassManager.h" #include "llvm/CodeGen/TargetRegisterInfo.h" #include "llvm/MC/MCRegister.h" #include "llvm/Support/Compiler.h" @@ -27,6 +29,8 @@ namespace llvm { +class MachineRegisterClassAnalysis; + class RegisterClassInfo { struct RCInfo { unsigned Tag = 0; @@ -94,6 +98,14 @@ class RegisterClassInfo { LLVM_ABI void runOnMachineFunction(const MachineFunction &MF, bool Rev = false); + bool invalidate(MachineFunction &, const PreservedAnalyses &PA, + MachineFunctionAnalysisManager::Invalidator &) { + // Check whether the analysis has been explicitly invalidated. Otherwise, + // it's stateless and remains preserved. + auto PAC = PA.getChecker(); + return !PAC.preservedWhenStateless(); + } + /// getNumAllocatableRegs - Returns the number of actually allocatable /// registers in RC in the current function. unsigned getNumAllocatableRegs(const TargetRegisterClass *RC) const { @@ -158,6 +170,39 @@ class RegisterClassInfo { LLVM_ABI unsigned computePSetLimit(unsigned Idx) const; }; +class MachineRegisterClassAnalysis + : public AnalysisInfoMixin { + friend AnalysisInfoMixin; + + static AnalysisKey Key; + +public: + using Result = RegisterClassInfo; + + Result run(MachineFunction &, MachineFunctionAnalysisManager &); +}; + +class MachineRegisterClassInfoWrapperPass : public MachineFunctionPass { + virtual void anchor(); + + RegisterClassInfo RCI; + +public: + static char ID; + + MachineRegisterClassInfoWrapperPass(); + + void getAnalysisUsage(AnalysisUsage &AU) const override { + AU.setPreservesAll(); + MachineFunctionPass::getAnalysisUsage(AU); + } + + bool runOnMachineFunction(MachineFunction &MF) override; + + RegisterClassInfo &getRCI() { return RCI; } + const RegisterClassInfo &getRCI() const { return RCI; } +}; + } // end namespace llvm #endif // LLVM_CODEGEN_REGISTERCLASSINFO_H diff --git a/llvm/include/llvm/InitializePasses.h b/llvm/include/llvm/InitializePasses.h index 10a4d8525a9e8..b562373f1c075 100644 --- a/llvm/include/llvm/InitializePasses.h +++ b/llvm/include/llvm/InitializePasses.h @@ -218,6 +218,7 @@ LLVM_ABI void initializeStaticDataAnnotatorPass(PassRegistry &); LLVM_ABI void initializeMachinePipelinerPass(PassRegistry &); LLVM_ABI void initializeMachinePostDominatorTreeWrapperPassPass(PassRegistry &); LLVM_ABI void initializeMachineRegionInfoPassPass(PassRegistry &); +LLVM_ABI void initializeMachineRegisterClassInfoWrapperPassPass(PassRegistry &); LLVM_ABI void initializeMachineSanitizerBinaryMetadataLegacyPass(PassRegistry &); LLVM_ABI void initializeMIR2VecVocabLegacyAnalysisPass(PassRegistry &); diff --git a/llvm/include/llvm/Passes/MachinePassRegistry.def b/llvm/include/llvm/Passes/MachinePassRegistry.def index 04a0da06fb6ec..d22a76b8e515b 100644 --- a/llvm/include/llvm/Passes/MachinePassRegistry.def +++ b/llvm/include/llvm/Passes/MachinePassRegistry.def @@ -79,6 +79,8 @@ MACHINE_FUNCTION_ANALYSIS("machine-opt-remark-emitter", MachineOptimizationRemarkEmitterAnalysis()) MACHINE_FUNCTION_ANALYSIS("machine-post-dom-tree", MachinePostDominatorTreeAnalysis()) +MACHINE_FUNCTION_ANALYSIS("machine-reg-class-info", + MachineRegisterClassAnalysis()) MACHINE_FUNCTION_ANALYSIS("machine-trace-metrics", MachineTraceMetricsAnalysis()) MACHINE_FUNCTION_ANALYSIS("machine-uniformity", MachineUniformityAnalysis()) MACHINE_FUNCTION_ANALYSIS("pass-instrumentation", PassInstrumentationAnalysis(PIC)) diff --git a/llvm/lib/CodeGen/BreakFalseDeps.cpp b/llvm/lib/CodeGen/BreakFalseDeps.cpp index fead3ee250841..3a4102dd265a8 100644 --- a/llvm/lib/CodeGen/BreakFalseDeps.cpp +++ b/llvm/lib/CodeGen/BreakFalseDeps.cpp @@ -38,7 +38,7 @@ class BreakFalseDeps : public MachineFunctionPass { MachineFunction *MF = nullptr; const TargetInstrInfo *TII = nullptr; const TargetRegisterInfo *TRI = nullptr; - RegisterClassInfo RegClassInfo; + RegisterClassInfo *RegClassInfo = nullptr; /// List of undefined register reads in this block in forward order. std::vector> UndefReads; @@ -57,6 +57,7 @@ class BreakFalseDeps : public MachineFunctionPass { void getAnalysisUsage(AnalysisUsage &AU) const override { AU.setPreservesAll(); + AU.addRequired(); AU.addRequired(); MachineFunctionPass::getAnalysisUsage(AU); } @@ -101,6 +102,7 @@ class BreakFalseDeps : public MachineFunctionPass { char BreakFalseDeps::ID = 0; INITIALIZE_PASS_BEGIN(BreakFalseDeps, DEBUG_TYPE, "BreakFalseDeps", false, false) +INITIALIZE_PASS_DEPENDENCY(MachineRegisterClassInfoWrapperPass) INITIALIZE_PASS_DEPENDENCY(ReachingDefInfoWrapperPass) INITIALIZE_PASS_END(BreakFalseDeps, DEBUG_TYPE, "BreakFalseDeps", false, false) @@ -151,7 +153,7 @@ bool BreakFalseDeps::pickBestRegisterForUndef(MachineInstr *MI, unsigned OpIdx, // max clearance or clearance higher than Pref. unsigned MaxClearance = 0; unsigned MaxClearanceReg = OriginalReg; - ArrayRef Order = RegClassInfo.getOrder(OpRC); + ArrayRef Order = RegClassInfo->getOrder(OpRC); for (MCPhysReg Reg : Order) { unsigned Clearance = RDI->getClearance(MI, Reg); if (Clearance <= MaxClearance) @@ -282,10 +284,9 @@ bool BreakFalseDeps::runOnMachineFunction(MachineFunction &mf) { MF = &mf; TII = MF->getSubtarget().getInstrInfo(); TRI = MF->getSubtarget().getRegisterInfo(); + RegClassInfo = &getAnalysis().getRCI(); RDI = &getAnalysis().getRDI(); - RegClassInfo.runOnMachineFunction(mf, /*Rev=*/true); - LLVM_DEBUG(dbgs() << "********** BREAK FALSE DEPENDENCIES **********\n"); // Skip Dead blocks due to ReachingDefAnalysis has no idea about instructions diff --git a/llvm/lib/CodeGen/MachineCombiner.cpp b/llvm/lib/CodeGen/MachineCombiner.cpp index 205c79e71854f..54ea87459a253 100644 --- a/llvm/lib/CodeGen/MachineCombiner.cpp +++ b/llvm/lib/CodeGen/MachineCombiner.cpp @@ -73,7 +73,7 @@ class MachineCombiner : public MachineFunctionPass { MachineTraceMetrics::Ensemble *TraceEnsemble = nullptr; MachineBlockFrequencyInfo *MBFI = nullptr; ProfileSummaryInfo *PSI = nullptr; - RegisterClassInfo RegClassInfo; + RegisterClassInfo *RegClassInfo = nullptr; TargetSchedModel TSchedModel; @@ -130,6 +130,7 @@ char &llvm::MachineCombinerID = MachineCombiner::ID; INITIALIZE_PASS_BEGIN(MachineCombiner, DEBUG_TYPE, "Machine InstCombiner", false, false) INITIALIZE_PASS_DEPENDENCY(MachineLoopInfoWrapperPass) +INITIALIZE_PASS_DEPENDENCY(MachineRegisterClassInfoWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachineTraceMetricsWrapperPass) INITIALIZE_PASS_END(MachineCombiner, DEBUG_TYPE, "Machine InstCombiner", false, false) @@ -139,6 +140,8 @@ void MachineCombiner::getAnalysisUsage(AnalysisUsage &AU) const { AU.addPreserved(); AU.addRequired(); AU.addPreserved(); + AU.addRequired(); + AU.addPreserved(); AU.addRequired(); AU.addPreserved(); AU.addRequired(); @@ -570,7 +573,7 @@ bool MachineCombiner::combineInstructions(MachineBasicBlock *MBB) { bool OptForSize = llvm::shouldOptimizeForSize(MBB, PSI, MBFI); bool DoRegPressureReduce = - TII->shouldReduceRegisterPressure(MBB, &RegClassInfo); + TII->shouldReduceRegisterPressure(MBB, RegClassInfo); while (BlockIter != MBB->end()) { auto &MI = *BlockIter++; @@ -729,7 +732,7 @@ bool MachineCombiner::runOnMachineFunction(MachineFunction &MF) { &getAnalysis().getBFI() : nullptr; TraceEnsemble = nullptr; - RegClassInfo.runOnMachineFunction(MF); + RegClassInfo = &getAnalysis().getRCI(); LLVM_DEBUG(dbgs() << getPassName() << ": " << MF.getName() << '\n'); if (!TII->useMachineCombiner()) { diff --git a/llvm/lib/CodeGen/MachinePipeliner.cpp b/llvm/lib/CodeGen/MachinePipeliner.cpp index 0ded0d6fc2f5d..9302c149b9846 100644 --- a/llvm/lib/CodeGen/MachinePipeliner.cpp +++ b/llvm/lib/CodeGen/MachinePipeliner.cpp @@ -238,6 +238,7 @@ INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachineLoopInfoWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachineDominatorTreeWrapperPass) INITIALIZE_PASS_DEPENDENCY(LiveIntervalsWrapperPass) +INITIALIZE_PASS_DEPENDENCY(MachineRegisterClassInfoWrapperPass) INITIALIZE_PASS_END(MachinePipeliner, DEBUG_TYPE, "Modulo Software Pipelining", false, false) @@ -385,8 +386,8 @@ bool MachinePipeliner::runOnMachineFunction(MachineFunction &mf) { MLI = &getAnalysis().getLI(); MDT = &getAnalysis().getDomTree(); ORE = &getAnalysis().getORE(); + RegClassInfo = &getAnalysis().getRCI(); TII = MF->getSubtarget().getInstrInfo(); - RegClassInfo.runOnMachineFunction(*MF); for (const auto &L : *MLI) scheduleLoop(*L); @@ -671,7 +672,7 @@ bool MachinePipeliner::swingModuloScheduler(MachineLoop &L) { AliasAnalysis *AA = &getAnalysis().getAAResults(); SwingSchedulerDAG SMS( - *this, L, getAnalysis().getLIS(), RegClassInfo, + *this, L, getAnalysis().getLIS(), *RegClassInfo, II_setByPragma, LI.LoopPipelinerInfo.get(), AA); MachineBasicBlock *MBB = L.getHeader(); @@ -702,6 +703,8 @@ void MachinePipeliner::getAnalysisUsage(AnalysisUsage &AU) const { AU.addRequired(); AU.addRequired(); AU.addRequired(); + AU.addRequired(); + AU.addPreserved(); AU.addRequired(); MachineFunctionPass::getAnalysisUsage(AU); } @@ -714,7 +717,8 @@ bool MachinePipeliner::runWindowScheduler(MachineLoop &L) { Context.TM = &getAnalysis().getTM(); Context.AA = &getAnalysis().getAAResults(); Context.LIS = &getAnalysis().getLIS(); - Context.RegClassInfo->runOnMachineFunction(*MF); + Context.RegClassInfo = + &getAnalysis().getRCI(); WindowScheduler WS(&Context, L); return WS.run(); } diff --git a/llvm/lib/CodeGen/MachineScheduler.cpp b/llvm/lib/CodeGen/MachineScheduler.cpp index de29a9fab876e..00061bf26315a 100644 --- a/llvm/lib/CodeGen/MachineScheduler.cpp +++ b/llvm/lib/CodeGen/MachineScheduler.cpp @@ -302,14 +302,6 @@ void ScheduleDAGMutation::anchor() {} // Machine Instruction Scheduling Pass and Registry //===----------------------------------------------------------------------===// -MachineSchedContext::MachineSchedContext() { - RegClassInfo = new RegisterClassInfo(); -} - -MachineSchedContext::~MachineSchedContext() { - delete RegClassInfo; -} - namespace llvm { namespace impl_detail { @@ -332,6 +324,7 @@ class MachineSchedulerImpl : public MachineSchedulerBase { MachineDominatorTree &MDT; AAResults &AA; LiveIntervals &LIS; + RegisterClassInfo &RegClassInfo; }; MachineSchedulerImpl() = default; @@ -432,6 +425,8 @@ void MachineSchedulerLegacy::getAnalysisUsage(AnalysisUsage &AU) const { AU.addPreserved(); AU.addRequired(); AU.addPreserved(); + AU.addRequired(); + AU.addPreserved(); MachineFunctionPass::getAnalysisUsage(AU); } @@ -444,6 +439,7 @@ INITIALIZE_PASS_BEGIN(PostMachineSchedulerLegacy, "postmisched", INITIALIZE_PASS_DEPENDENCY(MachineDominatorTreeWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachineLoopInfoWrapperPass) INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass) +INITIALIZE_PASS_DEPENDENCY(MachineRegisterClassInfoWrapperPass) INITIALIZE_PASS_END(PostMachineSchedulerLegacy, "postmisched", "PostRA Machine Instruction Scheduler", false, false) @@ -555,6 +551,7 @@ bool MachineSchedulerImpl::run(MachineFunction &Func, const TargetMachine &TM, this->TM = &TM; AA = &Analyses.AA; LIS = &Analyses.LIS; + RegClassInfo = &Analyses.RegClassInfo; if (VerifyScheduling) { LLVM_DEBUG(LIS->dump()); @@ -564,7 +561,6 @@ bool MachineSchedulerImpl::run(MachineFunction &Func, const TargetMachine &TM, else MF->verify(*MFAM, MSchedBanner, &errs()); } - RegClassInfo->runOnMachineFunction(*MF); // Instantiate the selected scheduler for this target, function, and // optimization level. @@ -660,8 +656,11 @@ bool MachineSchedulerLegacy::runOnMachineFunction(MachineFunction &MF) { auto &TM = getAnalysis().getTM(); auto &AA = getAnalysis().getAAResults(); auto &LIS = getAnalysis().getLIS(); + auto &RegClassInfo = + getAnalysis().getRCI(); + Impl.setLegacyPass(this); - return Impl.run(MF, TM, {MLI, MDT, AA, LIS}); + return Impl.run(MF, TM, {MLI, MDT, AA, LIS, RegClassInfo}); } MachineSchedulerPass::MachineSchedulerPass(const TargetMachine *TM) @@ -693,8 +692,9 @@ MachineSchedulerPass::run(MachineFunction &MF, .getManager(); auto &AA = FAM.getResult(MF.getFunction()); auto &LIS = MFAM.getResult(MF); + auto &RegClassInfo = MFAM.getResult(MF); Impl->setMFAM(&MFAM); - bool Changed = Impl->run(MF, *TM, {MLI, MDT, AA, LIS}); + bool Changed = Impl->run(MF, *TM, {MLI, MDT, AA, LIS, RegClassInfo}); if (!Changed) return PreservedAnalyses::all(); diff --git a/llvm/lib/CodeGen/MachineSink.cpp b/llvm/lib/CodeGen/MachineSink.cpp index 0ceeda4eb16d2..e4467c435168d 100644 --- a/llvm/lib/CodeGen/MachineSink.cpp +++ b/llvm/lib/CodeGen/MachineSink.cpp @@ -135,7 +135,7 @@ class MachineSinking { MachineBlockFrequencyInfo *MBFI = nullptr; const MachineBranchProbabilityInfo *MBPI = nullptr; AliasAnalysis *AA = nullptr; - RegisterClassInfo RegClassInfo; + RegisterClassInfo *RegClassInfo = nullptr; TargetSchedModel SchedModel; // Required for split critical edge LiveIntervals *LIS; @@ -204,9 +204,10 @@ class MachineSinking { MachineLoopInfo *MLI, SlotIndexes *SI, LiveIntervals *LIS, MachineCycleInfo *CI, ProfileSummaryInfo *PSI, MachineBlockFrequencyInfo *MBFI, - const MachineBranchProbabilityInfo *MBPI, AliasAnalysis *AA) + const MachineBranchProbabilityInfo *MBPI, AliasAnalysis *AA, + RegisterClassInfo *RegClassInfo) : DT(DT), PDT(PDT), CI(CI), PSI(PSI), MBFI(MBFI), MBPI(MBPI), AA(AA), - LIS(LIS), SI(SI), LV(LV), MLI(MLI), + RegClassInfo(RegClassInfo), LIS(LIS), SI(SI), LV(LV), MLI(MLI), EnableSinkAndFold(EnableSinkAndFold) {} bool run(MachineFunction &MF); @@ -306,8 +307,10 @@ class MachineSinkingLegacy : public MachineFunctionPass { AU.addRequired(); AU.addRequired(); AU.addRequired(); + AU.addRequired(); AU.addPreserved(); AU.addPreserved(); + AU.addPreserved(); AU.addRequired(); if (UseBlockFreqInfo) AU.addRequired(); @@ -327,6 +330,7 @@ INITIALIZE_PASS_DEPENDENCY(ProfileSummaryInfoWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachineBranchProbabilityInfoWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachineDominatorTreeWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachineCycleInfoWrapperPass) +INITIALIZE_PASS_DEPENDENCY(MachineRegisterClassInfoWrapperPass) INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass) INITIALIZE_PASS_END(MachineSinkingLegacy, DEBUG_TYPE, "Machine code sinking", false, false) @@ -773,8 +777,9 @@ MachineSinkingPass::run(MachineFunction &MF, auto *SI = MFAM.getCachedResult(MF); auto *LV = MFAM.getCachedResult(MF); auto *MLI = MFAM.getCachedResult(MF); + auto *RegClassInfo = &MFAM.getResult(MF); MachineSinking Impl(EnableSinkAndFold, DT, PDT, LV, MLI, SI, LIS, CI, PSI, - MBFI, MBPI, AA); + MBFI, MBPI, AA, RegClassInfo); bool Changed = Impl.run(MF); if (!Changed) return PreservedAnalyses::all(); @@ -819,9 +824,11 @@ bool MachineSinkingLegacy::runOnMachineFunction(MachineFunction &MF) { auto *LV = LVWrapper ? &LVWrapper->getLV() : nullptr; auto *MLIWrapper = getAnalysisIfAvailable(); auto *MLI = MLIWrapper ? &MLIWrapper->getLI() : nullptr; + auto *RegClassInfo = + &getAnalysis().getRCI(); MachineSinking Impl(EnableSinkAndFold, DT, PDT, LV, MLI, SI, LIS, CI, PSI, - MBFI, MBPI, AA); + MBFI, MBPI, AA, RegClassInfo); return Impl.run(MF); } @@ -833,8 +840,6 @@ bool MachineSinking::run(MachineFunction &MF) { TRI = STI->getRegisterInfo(); MRI = &MF.getRegInfo(); - RegClassInfo.runOnMachineFunction(MF); - bool EverMadeChange = false; while (true) { @@ -1202,7 +1207,7 @@ MachineSinking::getBBRegisterPressure(const MachineBasicBlock &MBB, RegPressureTracker RPTracker(Pressure); // Initialize the register pressure tracker. - RPTracker.init(MBB.getParent(), &RegClassInfo, nullptr, &MBB, MBB.end(), + RPTracker.init(MBB.getParent(), RegClassInfo, nullptr, &MBB, MBB.end(), /*TrackLaneMasks*/ false, /*TrackUntiedDefs=*/true); for (MachineBasicBlock::const_iterator MII = MBB.instr_end(), @@ -1238,7 +1243,7 @@ bool MachineSinking::registerPressureSetExceedsLimit( std::vector BBRegisterPressure = getBBRegisterPressure(MBB); for (; *PS != -1; PS++) if (Weight + BBRegisterPressure[*PS] >= - RegClassInfo.getRegPressureSetLimit(*PS)) + RegClassInfo->getRegPressureSetLimit(*PS)) return true; return false; } diff --git a/llvm/lib/CodeGen/PostRASchedulerList.cpp b/llvm/lib/CodeGen/PostRASchedulerList.cpp index 06e5b18c19301..88c6dc1fa9b7d 100644 --- a/llvm/lib/CodeGen/PostRASchedulerList.cpp +++ b/llvm/lib/CodeGen/PostRASchedulerList.cpp @@ -80,12 +80,13 @@ class PostRAScheduler { MachineLoopInfo *MLI = nullptr; AliasAnalysis *AA = nullptr; const TargetMachine *TM = nullptr; - RegisterClassInfo RegClassInfo; + RegisterClassInfo *RegClassInfo = nullptr; public: PostRAScheduler(MachineFunction &MF, MachineLoopInfo *MLI, AliasAnalysis *AA, - const TargetMachine *TM) - : TII(MF.getSubtarget().getInstrInfo()), MLI(MLI), AA(AA), TM(TM) {} + const TargetMachine *TM, RegisterClassInfo *RegClassInfo) + : TII(MF.getSubtarget().getInstrInfo()), MLI(MLI), AA(AA), TM(TM), + RegClassInfo(RegClassInfo) {} bool run(MachineFunction &MF); }; @@ -102,6 +103,8 @@ class PostRASchedulerLegacy : public MachineFunctionPass { AU.addPreserved(); AU.addRequired(); AU.addPreserved(); + AU.addRequired(); + AU.addPreserved(); MachineFunctionPass::getAnalysisUsage(AU); } @@ -201,8 +204,11 @@ class SchedulePostRATDList : public ScheduleDAGInstrs { char &llvm::PostRASchedulerID = PostRASchedulerLegacy::ID; -INITIALIZE_PASS(PostRASchedulerLegacy, DEBUG_TYPE, - "Post RA top-down list latency scheduler", false, false) +INITIALIZE_PASS_BEGIN(PostRASchedulerLegacy, DEBUG_TYPE, + "Post RA top-down list latency scheduler", false, false) +INITIALIZE_PASS_DEPENDENCY(MachineRegisterClassInfoWrapperPass) +INITIALIZE_PASS_END(PostRASchedulerLegacy, DEBUG_TYPE, + "Post RA top-down list latency scheduler", false, false) SchedulePostRATDList::SchedulePostRATDList( MachineFunction &MF, MachineLoopInfo &MLI, AliasAnalysis *AA, @@ -291,11 +297,10 @@ bool PostRAScheduler::run(MachineFunction &MF) { } SmallVector CriticalPathRCs; Subtarget.getCriticalPathRCs(CriticalPathRCs); - RegClassInfo.runOnMachineFunction(MF); LLVM_DEBUG(dbgs() << "PostRAScheduler\n"); - SchedulePostRATDList Scheduler(MF, *MLI, AA, RegClassInfo, AntiDepMode, + SchedulePostRATDList Scheduler(MF, *MLI, AA, *RegClassInfo, AntiDepMode, CriticalPathRCs); // Loop over all of the basic blocks @@ -365,7 +370,9 @@ bool PostRASchedulerLegacy::runOnMachineFunction(MachineFunction &MF) { AliasAnalysis *AA = &getAnalysis().getAAResults(); const TargetMachine *TM = &getAnalysis().getTM(); - PostRAScheduler Impl(MF, MLI, AA, TM); + RegisterClassInfo *RegClassInfo = + &getAnalysis().getRCI(); + PostRAScheduler Impl(MF, MLI, AA, TM, RegClassInfo); return Impl.run(MF); } @@ -378,7 +385,9 @@ PostRASchedulerPass::run(MachineFunction &MF, auto &FAM = MFAM.getResult(MF) .getManager(); AliasAnalysis *AA = &FAM.getResult(MF.getFunction()); - PostRAScheduler Impl(MF, MLI, AA, TM); + RegisterClassInfo *RegClassInfo = + &MFAM.getResult(MF); + PostRAScheduler Impl(MF, MLI, AA, TM, RegClassInfo); bool Changed = Impl.run(MF); if (!Changed) return PreservedAnalyses::all(); diff --git a/llvm/lib/CodeGen/RegisterClassInfo.cpp b/llvm/lib/CodeGen/RegisterClassInfo.cpp index bbeb7adae825c..d6a7deb1e2414 100644 --- a/llvm/lib/CodeGen/RegisterClassInfo.cpp +++ b/llvm/lib/CodeGen/RegisterClassInfo.cpp @@ -21,6 +21,7 @@ #include "llvm/CodeGen/MachineRegisterInfo.h" #include "llvm/CodeGen/TargetRegisterInfo.h" #include "llvm/CodeGen/TargetSubtargetInfo.h" +#include "llvm/InitializePasses.h" #include "llvm/MC/MCRegisterInfo.h" #include "llvm/Support/CommandLine.h" #include "llvm/Support/Debug.h" @@ -240,3 +241,32 @@ unsigned RegisterClassInfo::computePSetLimit(unsigned Idx) const { unsigned NReserved = RC->getNumRegs() - NAllocatableRegs; return RegPressureSetLimit - TRI->getRegClassWeight(RC).RegWeight * NReserved; } + +INITIALIZE_PASS(MachineRegisterClassInfoWrapperPass, "machine-reg-class-info", + "Machine Register Class Info Analysis", true, true) + +MachineRegisterClassAnalysis::Result +MachineRegisterClassAnalysis::run(MachineFunction &MF, + MachineFunctionAnalysisManager &) { + RegisterClassInfo RCI; + RCI.runOnMachineFunction(MF); + return RCI; +} + +char MachineRegisterClassInfoWrapperPass::ID = 0; + +MachineRegisterClassInfoWrapperPass::MachineRegisterClassInfoWrapperPass() + : MachineFunctionPass(ID), RCI() { + PassRegistry &Registry = *PassRegistry::getPassRegistry(); + initializeMachineRegisterClassInfoWrapperPassPass(Registry); +} + +bool MachineRegisterClassInfoWrapperPass::runOnMachineFunction( + MachineFunction &MF) { + RCI.runOnMachineFunction(MF); + return false; +} + +void MachineRegisterClassInfoWrapperPass::anchor() {} + +AnalysisKey MachineRegisterClassAnalysis::Key; diff --git a/llvm/lib/CodeGen/RegisterCoalescer.cpp b/llvm/lib/CodeGen/RegisterCoalescer.cpp index 25c4375a73ce0..729d73a1560ab 100644 --- a/llvm/lib/CodeGen/RegisterCoalescer.cpp +++ b/llvm/lib/CodeGen/RegisterCoalescer.cpp @@ -133,7 +133,7 @@ class RegisterCoalescer : private LiveRangeEdit::Delegate { LiveIntervals *LIS = nullptr; SlotIndexes *SI = nullptr; const MachineLoopInfo *Loops = nullptr; - RegisterClassInfo RegClassInfo; + RegisterClassInfo *RegClassInfo = nullptr; /// Position and VReg of a PHI instruction during coalescing. struct PHIValPos { @@ -382,8 +382,9 @@ class RegisterCoalescer : private LiveRangeEdit::Delegate { RegisterCoalescer &operator=(RegisterCoalescer &&Other) = default; RegisterCoalescer(LiveIntervals *LIS, SlotIndexes *SI, - const MachineLoopInfo *Loops) - : LIS(LIS), SI(SI), Loops(Loops) {} + const MachineLoopInfo *Loops, + RegisterClassInfo *RegClassInfo) + : LIS(LIS), SI(SI), Loops(Loops), RegClassInfo(RegClassInfo) {} bool run(MachineFunction &MF); }; @@ -417,6 +418,7 @@ INITIALIZE_PASS_BEGIN(RegisterCoalescerLegacy, "register-coalescer", INITIALIZE_PASS_DEPENDENCY(LiveIntervalsWrapperPass) INITIALIZE_PASS_DEPENDENCY(SlotIndexesWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachineLoopInfoWrapperPass) +INITIALIZE_PASS_DEPENDENCY(MachineRegisterClassInfoWrapperPass) INITIALIZE_PASS_END(RegisterCoalescerLegacy, "register-coalescer", "Register Coalescer", false, false) @@ -603,6 +605,8 @@ void RegisterCoalescerLegacy::getAnalysisUsage(AnalysisUsage &AU) const { AU.addRequired(); AU.addPreserved(); AU.addPreservedID(MachineDominatorsID); + AU.addRequired(); + AU.addPreserved(); MachineFunctionPass::getAnalysisUsage(AU); } @@ -2059,7 +2063,7 @@ bool RegisterCoalescer::joinCopy( } if (CP.getNewRC()) { - if (RegClassInfo.getNumAllocatableRegs(CP.getNewRC()) == 0) { + if (RegClassInfo->getNumAllocatableRegs(CP.getNewRC()) == 0) { LLVM_DEBUG(dbgs() << "\tNo " << TRI->getRegClassName(CP.getNewRC()) << "are available for allocation\n"); return false; @@ -2239,7 +2243,7 @@ bool RegisterCoalescer::joinCopy( // Removing sub-register copies can ease the register class constraints. // Make sure we attempt to inflate the register class of DstReg. - if (!CP.isPhys() && RegClassInfo.isProperSubClass(CP.getNewRC())) + if (!CP.isPhys() && RegClassInfo->isProperSubClass(CP.getNewRC())) InflateRegs.push_back(CP.getDstReg()); // CopyMI has been erased by joinIntervals at this point. Remove it from @@ -4271,7 +4275,8 @@ RegisterCoalescerPass::run(MachineFunction &MF, auto &LIS = MFAM.getResult(MF); auto &Loops = MFAM.getResult(MF); auto *SI = MFAM.getCachedResult(MF); - RegisterCoalescer Impl(&LIS, SI, &Loops); + auto *RegClassInfo = &MFAM.getResult(MF); + RegisterCoalescer Impl(&LIS, SI, &Loops, RegClassInfo); if (!Impl.run(MF)) return PreservedAnalyses::all(); auto PA = getMachineFunctionPassPreservedAnalyses(); @@ -4287,8 +4292,10 @@ bool RegisterCoalescerLegacy::runOnMachineFunction(MachineFunction &MF) { auto *LIS = &getAnalysis().getLIS(); auto *Loops = &getAnalysis().getLI(); auto *SIWrapper = getAnalysisIfAvailable(); + auto *RegClassInfo = + &getAnalysis().getRCI(); SlotIndexes *SI = SIWrapper ? &SIWrapper->getSI() : nullptr; - RegisterCoalescer Impl(LIS, SI, Loops); + RegisterCoalescer Impl(LIS, SI, Loops, RegClassInfo); return Impl.run(MF); } @@ -4315,6 +4322,7 @@ bool RegisterCoalescer::run(MachineFunction &fn) { const TargetSubtargetInfo &STI = fn.getSubtarget(); TRI = STI.getRegisterInfo(); TII = STI.getInstrInfo(); + if (EnableGlobalCopies == cl::BOU_UNSET) JoinGlobalCopies = STI.enableJoinGlobalCopies(); else @@ -4344,8 +4352,6 @@ bool RegisterCoalescer::run(MachineFunction &fn) { DbgVRegToValues.clear(); buildVRegToDbgValueMap(fn); - RegClassInfo.runOnMachineFunction(fn); - // Join (coalesce) intervals if requested. if (EnableJoining) joinAllIntervals(); diff --git a/llvm/lib/CodeGen/ShrinkWrap.cpp b/llvm/lib/CodeGen/ShrinkWrap.cpp index 83581052560cb..7349dd0fdc79b 100644 --- a/llvm/lib/CodeGen/ShrinkWrap.cpp +++ b/llvm/lib/CodeGen/ShrinkWrap.cpp @@ -113,7 +113,7 @@ namespace { /// are safe for such insertion. class ShrinkWrapImpl { /// Hold callee-saved information. - RegisterClassInfo RCI; + RegisterClassInfo *RCI = nullptr; MachineDominatorTree *MDT = nullptr; MachinePostDominatorTree *MPDT = nullptr; @@ -224,7 +224,6 @@ class ShrinkWrapImpl { /// Initialize the pass for \p MF. void init(MachineFunction &MF) { - RCI.runOnMachineFunction(MF); Save = nullptr; Restore = nullptr; EntryFreq = MBFI->getEntryFreq(); @@ -245,10 +244,11 @@ class ShrinkWrapImpl { bool ArePointsInteresting() const { return Save != Entry && Save && Restore; } public: - ShrinkWrapImpl(MachineDominatorTree *MDT, MachinePostDominatorTree *MPDT, + ShrinkWrapImpl(RegisterClassInfo *RCI, MachineDominatorTree *MDT, + MachinePostDominatorTree *MPDT, MachineBlockFrequencyInfo *MBFI, MachineLoopInfo *MLI, MachineOptimizationRemarkEmitter *ORE) - : MDT(MDT), MPDT(MPDT), MBFI(MBFI), MLI(MLI), ORE(ORE) {} + : RCI(RCI), MDT(MDT), MPDT(MPDT), MBFI(MBFI), MLI(MLI), ORE(ORE) {} /// Check if shrink wrapping is enabled for this target and function. static bool isShrinkWrapEnabled(const MachineFunction &MF); @@ -271,6 +271,7 @@ class ShrinkWrapLegacy : public MachineFunctionPass { AU.addRequired(); AU.addRequired(); AU.addRequired(); + AU.addRequired(); MachineFunctionPass::getAnalysisUsage(AU); } @@ -298,6 +299,7 @@ INITIALIZE_PASS_DEPENDENCY(MachineDominatorTreeWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachinePostDominatorTreeWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachineLoopInfoWrapperPass) INITIALIZE_PASS_DEPENDENCY(MachineOptimizationRemarkEmitterPass) +INITIALIZE_PASS_DEPENDENCY(MachineRegisterClassInfoWrapperPass) INITIALIZE_PASS_END(ShrinkWrapLegacy, DEBUG_TYPE, "Shrink Wrap Pass", false, false) @@ -359,7 +361,7 @@ bool ShrinkWrapImpl::useOrDefCSROrFI(const MachineInstr &MI, RegScavenger *RS, // register. Until the FP is assigned a Physical Register PPC's FP needs // to be checked separately. UseOrDefCSR = (!MI.isCall() && PhysReg == SP) || - RCI.getLastCalleeSavedAlias(PhysReg) || + RCI->getLastCalleeSavedAlias(PhysReg) || (!MI.isReturn() && TRI->isNonallocatableRegisterCalleeSave(PhysReg)) || TRI->isVirtualFrameRegister(PhysReg); @@ -984,6 +986,8 @@ bool ShrinkWrapLegacy::runOnMachineFunction(MachineFunction &MF) { !ShrinkWrapImpl::isShrinkWrapEnabled(MF)) return false; + RegisterClassInfo *RCI = + &getAnalysis().getRCI(); MachineDominatorTree *MDT = &getAnalysis().getDomTree(); MachinePostDominatorTree *MPDT = @@ -994,7 +998,7 @@ bool ShrinkWrapLegacy::runOnMachineFunction(MachineFunction &MF) { MachineOptimizationRemarkEmitter *ORE = &getAnalysis().getORE(); - return ShrinkWrapImpl(MDT, MPDT, MBFI, MLI, ORE).run(MF); + return ShrinkWrapImpl(RCI, MDT, MPDT, MBFI, MLI, ORE).run(MF); } PreservedAnalyses ShrinkWrapPass::run(MachineFunction &MF, @@ -1003,6 +1007,7 @@ PreservedAnalyses ShrinkWrapPass::run(MachineFunction &MF, if (MF.empty() || !ShrinkWrapImpl::isShrinkWrapEnabled(MF)) return PreservedAnalyses::all(); + RegisterClassInfo &RCI = MFAM.getResult(MF); MachineDominatorTree &MDT = MFAM.getResult(MF); MachinePostDominatorTree &MPDT = MFAM.getResult(MF); @@ -1012,7 +1017,7 @@ PreservedAnalyses ShrinkWrapPass::run(MachineFunction &MF, MachineOptimizationRemarkEmitter &ORE = MFAM.getResult(MF); - ShrinkWrapImpl(&MDT, &MPDT, &MBFI, &MLI, &ORE).run(MF); + ShrinkWrapImpl(&RCI, &MDT, &MPDT, &MBFI, &MLI, &ORE).run(MF); return PreservedAnalyses::all(); } diff --git a/llvm/lib/Passes/PassBuilder.cpp b/llvm/lib/Passes/PassBuilder.cpp index 0d190ea448931..83555c98e6971 100644 --- a/llvm/lib/Passes/PassBuilder.cpp +++ b/llvm/lib/Passes/PassBuilder.cpp @@ -152,6 +152,7 @@ #include "llvm/CodeGen/RegAllocPriorityAdvisor.h" #include "llvm/CodeGen/RegUsageInfoCollector.h" #include "llvm/CodeGen/RegUsageInfoPropagate.h" +#include "llvm/CodeGen/RegisterClassInfo.h" #include "llvm/CodeGen/RegisterCoalescerPass.h" #include "llvm/CodeGen/RegisterUsageInfo.h" #include "llvm/CodeGen/RemoveLoadsIntoFakeUses.h" diff --git a/llvm/lib/Target/AArch64/AArch64A57FPLoadBalancing.cpp b/llvm/lib/Target/AArch64/AArch64A57FPLoadBalancing.cpp index b816f11508bed..23b46949ae143 100644 --- a/llvm/lib/Target/AArch64/AArch64A57FPLoadBalancing.cpp +++ b/llvm/lib/Target/AArch64/AArch64A57FPLoadBalancing.cpp @@ -38,6 +38,7 @@ #include "llvm/CodeGen/MachineRegisterInfo.h" #include "llvm/CodeGen/RegisterClassInfo.h" #include "llvm/CodeGen/RegisterScavenging.h" +#include "llvm/InitializePasses.h" #include "llvm/Support/CommandLine.h" #include "llvm/Support/Debug.h" #include "llvm/Support/raw_ostream.h" @@ -108,7 +109,7 @@ class Chain; class AArch64A57FPLoadBalancing : public MachineFunctionPass { MachineRegisterInfo *MRI; const TargetRegisterInfo *TRI; - RegisterClassInfo RCI; + RegisterClassInfo *RCI = nullptr; public: static char ID; @@ -126,6 +127,8 @@ class AArch64A57FPLoadBalancing : public MachineFunctionPass { void getAnalysisUsage(AnalysisUsage &AU) const override { AU.setPreservesCFG(); + AU.addRequired(); + AU.addPreserved(); MachineFunctionPass::getAnalysisUsage(AU); } @@ -149,6 +152,7 @@ char AArch64A57FPLoadBalancing::ID = 0; INITIALIZE_PASS_BEGIN(AArch64A57FPLoadBalancing, DEBUG_TYPE, "AArch64 A57 FP Load-Balancing", false, false) +INITIALIZE_PASS_DEPENDENCY(MachineRegisterClassInfoWrapperPass) INITIALIZE_PASS_END(AArch64A57FPLoadBalancing, DEBUG_TYPE, "AArch64 A57 FP Load-Balancing", false, false) @@ -314,7 +318,7 @@ bool AArch64A57FPLoadBalancing::runOnMachineFunction(MachineFunction &F) { MRI = &F.getRegInfo(); TRI = F.getRegInfo().getTargetRegisterInfo(); - RCI.runOnMachineFunction(F); + RCI = &getAnalysis().getRCI(); for (auto &MBB : F) { Changed |= runOnBasicBlock(MBB); @@ -514,7 +518,7 @@ int AArch64A57FPLoadBalancing::scavengeRegister(Chain *G, Color C, // Make sure we allocate in-order, to get the cheapest registers first. unsigned RegClassID = ChainBegin->getDesc().operands()[0].RegClass; - auto Ord = RCI.getOrder(TRI->getRegClass(RegClassID)); + auto Ord = RCI->getOrder(TRI->getRegClass(RegClassID)); for (auto Reg : Ord) { if (!Units.available(Reg)) continue; diff --git a/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.cpp b/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.cpp index ecfaa5c70e9d3..6af0de82987ae 100644 --- a/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.cpp +++ b/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.cpp @@ -43,7 +43,7 @@ class SIPreAllocateWWMRegs { LiveIntervals *LIS; LiveRegMatrix *Matrix; VirtRegMap *VRM; - RegisterClassInfo RegClassInfo; + const RegisterClassInfo &RegClassInfo; std::vector RegsToRewrite; #ifndef NDEBUG @@ -54,8 +54,8 @@ class SIPreAllocateWWMRegs { public: SIPreAllocateWWMRegs(LiveIntervals *LIS, LiveRegMatrix *Matrix, - VirtRegMap *VRM) - : LIS(LIS), Matrix(Matrix), VRM(VRM) {} + VirtRegMap *VRM, const RegisterClassInfo &RCI) + : LIS(LIS), Matrix(Matrix), VRM(VRM), RegClassInfo(RCI) {} bool run(MachineFunction &MF); }; @@ -71,6 +71,8 @@ class SIPreAllocateWWMRegsLegacy : public MachineFunctionPass { AU.addRequired(); AU.addRequired(); AU.addRequired(); + // TODO: Update RCI with the additional reserved registers the pass sets. + AU.addRequired(); AU.setPreservesAll(); MachineFunctionPass::getAnalysisUsage(AU); } @@ -83,6 +85,7 @@ INITIALIZE_PASS_BEGIN(SIPreAllocateWWMRegsLegacy, DEBUG_TYPE, INITIALIZE_PASS_DEPENDENCY(LiveIntervalsWrapperPass) INITIALIZE_PASS_DEPENDENCY(VirtRegMapWrapperLegacy) INITIALIZE_PASS_DEPENDENCY(LiveRegMatrixWrapperLegacy) +INITIALIZE_PASS_DEPENDENCY(MachineRegisterClassInfoWrapperPass) INITIALIZE_PASS_END(SIPreAllocateWWMRegsLegacy, DEBUG_TYPE, "SI Pre-allocate WWM Registers", false, false) @@ -196,7 +199,8 @@ bool SIPreAllocateWWMRegsLegacy::runOnMachineFunction(MachineFunction &MF) { auto *LIS = &getAnalysis().getLIS(); auto *Matrix = &getAnalysis().getLRM(); auto *VRM = &getAnalysis().getVRM(); - return SIPreAllocateWWMRegs(LIS, Matrix, VRM).run(MF); + const auto &RCI = getAnalysis().getRCI(); + return SIPreAllocateWWMRegs(LIS, Matrix, VRM, RCI).run(MF); } bool SIPreAllocateWWMRegs::run(MachineFunction &MF) { @@ -208,8 +212,6 @@ bool SIPreAllocateWWMRegs::run(MachineFunction &MF) { TRI = &TII->getRegisterInfo(); MRI = &MF.getRegInfo(); - RegClassInfo.runOnMachineFunction(MF); - bool PreallocateSGPRSpillVGPRs = EnablePreallocateSGPRSpillVGPRs || MF.getFunction().hasFnAttribute("amdgpu-prealloc-sgpr-spill-vgprs"); @@ -269,6 +271,7 @@ SIPreAllocateWWMRegsPass::run(MachineFunction &MF, auto *LIS = &MFAM.getResult(MF); auto *Matrix = &MFAM.getResult(MF); auto *VRM = &MFAM.getResult(MF); - SIPreAllocateWWMRegs(LIS, Matrix, VRM).run(MF); + const auto &RCI = MFAM.getResult(MF); + SIPreAllocateWWMRegs(LIS, Matrix, VRM, RCI).run(MF); return PreservedAnalyses::all(); } diff --git a/llvm/test/CodeGen/AArch64/O3-pipeline.ll b/llvm/test/CodeGen/AArch64/O3-pipeline.ll index e1481667a4ab7..3bb89fee3408a 100644 --- a/llvm/test/CodeGen/AArch64/O3-pipeline.ll +++ b/llvm/test/CodeGen/AArch64/O3-pipeline.ll @@ -140,6 +140,7 @@ ; CHECK-NEXT: Machine Natural Loop Construction ; CHECK-NEXT: Machine Trace Metrics ; CHECK-NEXT: AArch64 Conditional Compares +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Lazy Machine Block Frequency Analysis ; CHECK-NEXT: Machine InstCombiner ; CHECK-NEXT: AArch64 Conditional Branch Tuning @@ -157,6 +158,7 @@ ; CHECK-NEXT: Machine Common Subexpression Elimination ; CHECK-NEXT: MachinePostDominator Tree Construction ; CHECK-NEXT: Machine Cycle Info Analysis +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Machine code sinking ; CHECK-NEXT: Peephole Optimizations ; CHECK-NEXT: Remove dead machine instructions @@ -172,6 +174,7 @@ ; CHECK-NEXT: MachineDominator Tree Construction ; CHECK-NEXT: Slot index numbering ; CHECK-NEXT: Live Interval Analysis +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Register Coalescer ; CHECK-NEXT: Rename Disconnected Subregister Components ; CHECK-NEXT: Machine Instruction Scheduler @@ -192,6 +195,7 @@ ; CHECK-NEXT: Machine Copy Propagation Pass ; CHECK-NEXT: Machine Loop Invariant Code Motion ; CHECK-NEXT: AArch64 Redundant Copy Elimination +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: A57 FP Anti-dependency breaker ; CHECK-NEXT: Remove Redundant DEBUG_VALUE analysis ; CHECK-NEXT: Fixup Statepoint Caller Saved diff --git a/llvm/test/CodeGen/AMDGPU/llc-pipeline.ll b/llvm/test/CodeGen/AMDGPU/llc-pipeline.ll index fe75b2b5bfcf5..ea65d7a835ea9 100644 --- a/llvm/test/CodeGen/AMDGPU/llc-pipeline.ll +++ b/llvm/test/CodeGen/AMDGPU/llc-pipeline.ll @@ -123,6 +123,7 @@ ; GCN-O0-NEXT: Live Interval Analysis ; GCN-O0-NEXT: Virtual Register Map ; GCN-O0-NEXT: Live Register Matrix +; GCN-O0-NEXT: Machine Register Class Info Analysis ; GCN-O0-NEXT: SI Pre-allocate WWM Registers ; GCN-O0-NEXT: Fast Register Allocator ; GCN-O0-NEXT: SI Lower WWM Copies @@ -336,6 +337,7 @@ ; GCN-O1-NEXT: Machine Common Subexpression Elimination ; GCN-O1-NEXT: MachinePostDominator Tree Construction ; GCN-O1-NEXT: Machine Cycle Info Analysis +; GCN-O1-NEXT: Machine Register Class Info Analysis ; GCN-O1-NEXT: Machine code sinking ; GCN-O1-NEXT: Peephole Optimizations ; GCN-O1-NEXT: Remove dead machine instructions @@ -360,6 +362,7 @@ ; GCN-O1-NEXT: Slot index numbering ; GCN-O1-NEXT: Live Interval Analysis ; GCN-O1-NEXT: Machine Natural Loop Construction +; GCN-O1-NEXT: Machine Register Class Info Analysis ; GCN-O1-NEXT: Register Coalescer ; GCN-O1-NEXT: Rename Disconnected Subregister Components ; GCN-O1-NEXT: Rewrite Partial Register Uses @@ -383,6 +386,7 @@ ; GCN-O1-NEXT: SI lower SGPR spill instructions ; GCN-O1-NEXT: Virtual Register Map ; GCN-O1-NEXT: Live Register Matrix +; GCN-O1-NEXT: Machine Register Class Info Analysis ; GCN-O1-NEXT: SI Pre-allocate WWM Registers ; GCN-O1-NEXT: Live Stack Slot Analysis ; GCN-O1-NEXT: Greedy Register Allocator @@ -409,6 +413,7 @@ ; GCN-O1-NEXT: MachinePostDominator Tree Construction ; GCN-O1-NEXT: Lazy Machine Block Frequency Analysis ; GCN-O1-NEXT: Machine Optimization Remark Emitter +; GCN-O1-NEXT: Machine Register Class Info Analysis ; GCN-O1-NEXT: Shrink Wrapping analysis ; GCN-O1-NEXT: Prologue/Epilogue Insertion & Frame Finalization ; GCN-O1-NEXT: Machine Late Instructions Cleanup Pass @@ -649,6 +654,7 @@ ; GCN-O1-OPTS-NEXT: Machine Common Subexpression Elimination ; GCN-O1-OPTS-NEXT: MachinePostDominator Tree Construction ; GCN-O1-OPTS-NEXT: Machine Cycle Info Analysis +; GCN-O1-OPTS-NEXT: Machine Register Class Info Analysis ; GCN-O1-OPTS-NEXT: Machine code sinking ; GCN-O1-OPTS-NEXT: Peephole Optimizations ; GCN-O1-OPTS-NEXT: Remove dead machine instructions @@ -680,6 +686,7 @@ ; GCN-O1-OPTS-NEXT: Slot index numbering ; GCN-O1-OPTS-NEXT: Live Interval Analysis ; GCN-O1-OPTS-NEXT: Machine Natural Loop Construction +; GCN-O1-OPTS-NEXT: Machine Register Class Info Analysis ; GCN-O1-OPTS-NEXT: Register Coalescer ; GCN-O1-OPTS-NEXT: Rename Disconnected Subregister Components ; GCN-O1-OPTS-NEXT: Rewrite Partial Register Uses @@ -704,6 +711,7 @@ ; GCN-O1-OPTS-NEXT: SI lower SGPR spill instructions ; GCN-O1-OPTS-NEXT: Virtual Register Map ; GCN-O1-OPTS-NEXT: Live Register Matrix +; GCN-O1-OPTS-NEXT: Machine Register Class Info Analysis ; GCN-O1-OPTS-NEXT: SI Pre-allocate WWM Registers ; GCN-O1-OPTS-NEXT: Live Stack Slot Analysis ; GCN-O1-OPTS-NEXT: Greedy Register Allocator @@ -730,6 +738,7 @@ ; GCN-O1-OPTS-NEXT: MachinePostDominator Tree Construction ; GCN-O1-OPTS-NEXT: Lazy Machine Block Frequency Analysis ; GCN-O1-OPTS-NEXT: Machine Optimization Remark Emitter +; GCN-O1-OPTS-NEXT: Machine Register Class Info Analysis ; GCN-O1-OPTS-NEXT: Shrink Wrapping analysis ; GCN-O1-OPTS-NEXT: Prologue/Epilogue Insertion & Frame Finalization ; GCN-O1-OPTS-NEXT: Machine Late Instructions Cleanup Pass @@ -974,6 +983,7 @@ ; GCN-O2-NEXT: Machine Common Subexpression Elimination ; GCN-O2-NEXT: MachinePostDominator Tree Construction ; GCN-O2-NEXT: Machine Cycle Info Analysis +; GCN-O2-NEXT: Machine Register Class Info Analysis ; GCN-O2-NEXT: Machine code sinking ; GCN-O2-NEXT: Peephole Optimizations ; GCN-O2-NEXT: Remove dead machine instructions @@ -1005,6 +1015,7 @@ ; GCN-O2-NEXT: Slot index numbering ; GCN-O2-NEXT: Live Interval Analysis ; GCN-O2-NEXT: Machine Natural Loop Construction +; GCN-O2-NEXT: Machine Register Class Info Analysis ; GCN-O2-NEXT: Register Coalescer ; GCN-O2-NEXT: Rename Disconnected Subregister Components ; GCN-O2-NEXT: Rewrite Partial Register Uses @@ -1030,6 +1041,7 @@ ; GCN-O2-NEXT: SI lower SGPR spill instructions ; GCN-O2-NEXT: Virtual Register Map ; GCN-O2-NEXT: Live Register Matrix +; GCN-O2-NEXT: Machine Register Class Info Analysis ; GCN-O2-NEXT: SI Pre-allocate WWM Registers ; GCN-O2-NEXT: Live Stack Slot Analysis ; GCN-O2-NEXT: Greedy Register Allocator @@ -1056,6 +1068,7 @@ ; GCN-O2-NEXT: MachinePostDominator Tree Construction ; GCN-O2-NEXT: Lazy Machine Block Frequency Analysis ; GCN-O2-NEXT: Machine Optimization Remark Emitter +; GCN-O2-NEXT: Machine Register Class Info Analysis ; GCN-O2-NEXT: Shrink Wrapping analysis ; GCN-O2-NEXT: Prologue/Epilogue Insertion & Frame Finalization ; GCN-O2-NEXT: Machine Late Instructions Cleanup Pass @@ -1313,6 +1326,7 @@ ; GCN-O3-NEXT: Machine Common Subexpression Elimination ; GCN-O3-NEXT: MachinePostDominator Tree Construction ; GCN-O3-NEXT: Machine Cycle Info Analysis +; GCN-O3-NEXT: Machine Register Class Info Analysis ; GCN-O3-NEXT: Machine code sinking ; GCN-O3-NEXT: Peephole Optimizations ; GCN-O3-NEXT: Remove dead machine instructions @@ -1344,6 +1358,7 @@ ; GCN-O3-NEXT: Slot index numbering ; GCN-O3-NEXT: Live Interval Analysis ; GCN-O3-NEXT: Machine Natural Loop Construction +; GCN-O3-NEXT: Machine Register Class Info Analysis ; GCN-O3-NEXT: Register Coalescer ; GCN-O3-NEXT: Rename Disconnected Subregister Components ; GCN-O3-NEXT: Rewrite Partial Register Uses @@ -1369,6 +1384,7 @@ ; GCN-O3-NEXT: SI lower SGPR spill instructions ; GCN-O3-NEXT: Virtual Register Map ; GCN-O3-NEXT: Live Register Matrix +; GCN-O3-NEXT: Machine Register Class Info Analysis ; GCN-O3-NEXT: SI Pre-allocate WWM Registers ; GCN-O3-NEXT: Live Stack Slot Analysis ; GCN-O3-NEXT: Greedy Register Allocator @@ -1395,6 +1411,7 @@ ; GCN-O3-NEXT: MachinePostDominator Tree Construction ; GCN-O3-NEXT: Lazy Machine Block Frequency Analysis ; GCN-O3-NEXT: Machine Optimization Remark Emitter +; GCN-O3-NEXT: Machine Register Class Info Analysis ; GCN-O3-NEXT: Shrink Wrapping analysis ; GCN-O3-NEXT: Prologue/Epilogue Insertion & Frame Finalization ; GCN-O3-NEXT: Machine Late Instructions Cleanup Pass diff --git a/llvm/test/CodeGen/AMDGPU/sgpr-regalloc-flags.ll b/llvm/test/CodeGen/AMDGPU/sgpr-regalloc-flags.ll index c83af33659dad..8cef98f8d2826 100644 --- a/llvm/test/CodeGen/AMDGPU/sgpr-regalloc-flags.ll +++ b/llvm/test/CodeGen/AMDGPU/sgpr-regalloc-flags.ll @@ -21,6 +21,7 @@ ; DEFAULT-NEXT: SI lower SGPR spill instructions ; DEFAULT-NEXT: Virtual Register Map ; DEFAULT-NEXT: Live Register Matrix +; DEFAULT-NEXT: Machine Register Class Info Analysis ; DEFAULT-NEXT: SI Pre-allocate WWM Registers ; DEFAULT-NEXT: Live Stack Slot Analysis ; DEFAULT-NEXT: Greedy Register Allocator @@ -42,6 +43,7 @@ ; O0-NEXT: Live Interval Analysis ; O0-NEXT: Virtual Register Map ; O0-NEXT: Live Register Matrix +; O0-NEXT: Machine Register Class Info Analysis ; O0-NEXT: SI Pre-allocate WWM Registers ; O0-NEXT: Fast Register Allocator ; O0-NEXT: SI Lower WWM Copies @@ -64,6 +66,7 @@ ; BASIC-DEFAULT-NEXT: SI lower SGPR spill instructions ; BASIC-DEFAULT-NEXT: Virtual Register Map ; BASIC-DEFAULT-NEXT: Live Register Matrix +; BASIC-DEFAULT-NEXT: Machine Register Class Info Analysis ; BASIC-DEFAULT-NEXT: SI Pre-allocate WWM Registers ; BASIC-DEFAULT-NEXT: Live Stack Slot Analysis ; BASIC-DEFAULT-NEXT: Bundle Machine CFG Edges @@ -91,6 +94,7 @@ ; DEFAULT-BASIC-NEXT: SI lower SGPR spill instructions ; DEFAULT-BASIC-NEXT: Virtual Register Map ; DEFAULT-BASIC-NEXT: Live Register Matrix +; DEFAULT-BASIC-NEXT: Machine Register Class Info Analysis ; DEFAULT-BASIC-NEXT: SI Pre-allocate WWM Registers ; DEFAULT-BASIC-NEXT: Live Stack Slot Analysis ; DEFAULT-BASIC-NEXT: Basic Register Allocator @@ -120,6 +124,7 @@ ; BASIC-BASIC-NEXT: SI lower SGPR spill instructions ; BASIC-BASIC-NEXT: Virtual Register Map ; BASIC-BASIC-NEXT: Live Register Matrix +; BASIC-BASIC-NEXT: Machine Register Class Info Analysis ; BASIC-BASIC-NEXT: SI Pre-allocate WWM Registers ; BASIC-BASIC-NEXT: Live Stack Slot Analysis ; BASIC-BASIC-NEXT: Basic Register Allocator diff --git a/llvm/test/CodeGen/ARM/O3-pipeline.ll b/llvm/test/CodeGen/ARM/O3-pipeline.ll index 273114822ec44..110c3d01579c6 100644 --- a/llvm/test/CodeGen/ARM/O3-pipeline.ll +++ b/llvm/test/CodeGen/ARM/O3-pipeline.ll @@ -100,6 +100,7 @@ ; CHECK-NEXT: Machine Common Subexpression Elimination ; CHECK-NEXT: MachinePostDominator Tree Construction ; CHECK-NEXT: Machine Cycle Info Analysis +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Machine code sinking ; CHECK-NEXT: Peephole Optimizations ; CHECK-NEXT: Remove dead machine instructions @@ -127,6 +128,7 @@ ; CHECK-NEXT: Two-Address instruction pass ; CHECK-NEXT: Slot index numbering ; CHECK-NEXT: Live Interval Analysis +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Register Coalescer ; CHECK-NEXT: Rename Disconnected Subregister Components ; CHECK-NEXT: Machine Instruction Scheduler @@ -153,6 +155,7 @@ ; CHECK-NEXT: MachinePostDominator Tree Construction ; CHECK-NEXT: Lazy Machine Block Frequency Analysis ; CHECK-NEXT: Machine Optimization Remark Emitter +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Shrink Wrapping analysis ; CHECK-NEXT: Prologue/Epilogue Insertion & Frame Finalization ; CHECK-NEXT: Machine Late Instructions Cleanup Pass @@ -164,6 +167,7 @@ ; CHECK-NEXT: ARM load / store optimization pass ; CHECK-NEXT: Reaching Definitions Analysis ; CHECK-NEXT: ARM Execution Domain Fix +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: BreakFalseDeps ; CHECK-NEXT: ARM pseudo instruction expansion pass ; CHECK-NEXT: Insert KCFI indirect call checks @@ -176,6 +180,7 @@ ; CHECK-NEXT: MachineDominator Tree Construction ; CHECK-NEXT: Machine Natural Loop Construction ; CHECK-NEXT: PostRA Machine Instruction Scheduler +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Post RA top-down list latency scheduler ; CHECK-NEXT: MVE VPT block insertion pass ; CHECK-NEXT: ARM Indirect Thunks diff --git a/llvm/test/CodeGen/LoongArch/opt-pipeline.ll b/llvm/test/CodeGen/LoongArch/opt-pipeline.ll index 661f67d4989c4..3a8b03a601def 100644 --- a/llvm/test/CodeGen/LoongArch/opt-pipeline.ll +++ b/llvm/test/CodeGen/LoongArch/opt-pipeline.ll @@ -105,6 +105,7 @@ ; LAXX-NEXT: Machine Common Subexpression Elimination ; LAXX-NEXT: MachinePostDominator Tree Construction ; LAXX-NEXT: Machine Cycle Info Analysis +; LAXX-NEXT: Machine Register Class Info Analysis ; LAXX-NEXT: Machine code sinking ; LAXX-NEXT: Peephole Optimizations ; LAXX-NEXT: Remove dead machine instructions @@ -121,6 +122,7 @@ ; LAXX-NEXT: MachineDominator Tree Construction ; LAXX-NEXT: Slot index numbering ; LAXX-NEXT: Live Interval Analysis +; LAXX-NEXT: Machine Register Class Info Analysis ; LAXX-NEXT: Register Coalescer ; LAXX-NEXT: Rename Disconnected Subregister Components ; LAXX-NEXT: Machine Instruction Scheduler @@ -148,6 +150,7 @@ ; LAXX-NEXT: MachinePostDominator Tree Construction ; LAXX-NEXT: Lazy Machine Block Frequency Analysis ; LAXX-NEXT: Machine Optimization Remark Emitter +; LAXX-NEXT: Machine Register Class Info Analysis ; LAXX-NEXT: Shrink Wrapping analysis ; LAXX-NEXT: Prologue/Epilogue Insertion & Frame Finalization ; LAXX-NEXT: Machine Late Instructions Cleanup Pass @@ -158,6 +161,7 @@ ; LAXX-NEXT: Post-RA pseudo instruction expansion pass ; LAXX-NEXT: MachineDominator Tree Construction ; LAXX-NEXT: Machine Natural Loop Construction +; LAXX-NEXT: Machine Register Class Info Analysis ; LAXX-NEXT: Post RA top-down list latency scheduler ; LAXX-NEXT: Analyze Machine Code For Garbage Collection ; LAXX-NEXT: Machine Block Frequency Analysis diff --git a/llvm/test/CodeGen/PowerPC/O3-pipeline.ll b/llvm/test/CodeGen/PowerPC/O3-pipeline.ll index 7cbb1a1c98873..dda900bc3d11e 100644 --- a/llvm/test/CodeGen/PowerPC/O3-pipeline.ll +++ b/llvm/test/CodeGen/PowerPC/O3-pipeline.ll @@ -115,6 +115,7 @@ ; CHECK-NEXT: Machine Natural Loop Construction ; CHECK-NEXT: Machine Trace Metrics ; CHECK-NEXT: Early If-Conversion +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Lazy Machine Block Frequency Analysis ; CHECK-NEXT: Machine InstCombiner ; CHECK-NEXT: Machine Block Frequency Analysis @@ -124,6 +125,7 @@ ; CHECK-NEXT: Machine Common Subexpression Elimination ; CHECK-NEXT: MachinePostDominator Tree Construction ; CHECK-NEXT: Machine Cycle Info Analysis +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Machine code sinking ; CHECK-NEXT: Peephole Optimizations ; CHECK-NEXT: Remove dead machine instructions @@ -149,6 +151,7 @@ ; CHECK-NEXT: Live Interval Analysis ; CHECK-NEXT: Lazy Machine Block Frequency Analysis ; CHECK-NEXT: Machine Optimization Remark Emitter +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Modulo Software Pipelining ; CHECK-NEXT: Detect Dead Lanes ; CHECK-NEXT: Init Undef Pass @@ -161,6 +164,7 @@ ; CHECK-NEXT: Two-Address instruction pass ; CHECK-NEXT: Slot index numbering ; CHECK-NEXT: Live Interval Analysis +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Register Coalescer ; CHECK-NEXT: Rename Disconnected Subregister Components ; CHECK-NEXT: Machine Instruction Scheduler @@ -189,6 +193,7 @@ ; CHECK-NEXT: MachinePostDominator Tree Construction ; CHECK-NEXT: Lazy Machine Block Frequency Analysis ; CHECK-NEXT: Machine Optimization Remark Emitter +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Shrink Wrapping analysis ; CHECK-NEXT: Prologue/Epilogue Insertion & Frame Finalization ; CHECK-NEXT: Machine Late Instructions Cleanup Pass diff --git a/llvm/test/CodeGen/RISCV/O3-pipeline.ll b/llvm/test/CodeGen/RISCV/O3-pipeline.ll index 769823d1c4216..8999197dc5515 100644 --- a/llvm/test/CodeGen/RISCV/O3-pipeline.ll +++ b/llvm/test/CodeGen/RISCV/O3-pipeline.ll @@ -118,6 +118,7 @@ ; CHECK-NEXT: Machine Common Subexpression Elimination ; CHECK-NEXT: MachinePostDominator Tree Construction ; CHECK-NEXT: Machine Cycle Info Analysis +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Machine code sinking ; CHECK-NEXT: Peephole Optimizations ; CHECK-NEXT: Remove dead machine instructions @@ -139,6 +140,7 @@ ; CHECK-NEXT: Two-Address instruction pass ; CHECK-NEXT: Slot index numbering ; CHECK-NEXT: Live Interval Analysis +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Register Coalescer ; CHECK-NEXT: Rename Disconnected Subregister Components ; CHECK-NEXT: Machine Instruction Scheduler @@ -173,6 +175,7 @@ ; CHECK-NEXT: MachinePostDominator Tree Construction ; CHECK-NEXT: Lazy Machine Block Frequency Analysis ; CHECK-NEXT: Machine Optimization Remark Emitter +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Shrink Wrapping analysis ; CHECK-NEXT: Prologue/Epilogue Insertion & Frame Finalization ; CHECK-NEXT: Machine Late Instructions Cleanup Pass diff --git a/llvm/test/CodeGen/X86/opt-pipeline.ll b/llvm/test/CodeGen/X86/opt-pipeline.ll index 276232e27c000..cc134ff381825 100644 --- a/llvm/test/CodeGen/X86/opt-pipeline.ll +++ b/llvm/test/CodeGen/X86/opt-pipeline.ll @@ -105,6 +105,7 @@ ; CHECK-NEXT: Machine Natural Loop Construction ; CHECK-NEXT: Machine Trace Metrics ; CHECK-NEXT: Early If-Conversion +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Lazy Machine Block Frequency Analysis ; CHECK-NEXT: Machine InstCombiner ; CHECK-NEXT: X86 cmov Conversion @@ -117,6 +118,7 @@ ; CHECK-NEXT: Machine Common Subexpression Elimination ; CHECK-NEXT: MachinePostDominator Tree Construction ; CHECK-NEXT: Machine Cycle Info Analysis +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Machine code sinking ; CHECK-NEXT: Peephole Optimizations ; CHECK-NEXT: Remove dead machine instructions @@ -142,6 +144,7 @@ ; CHECK-NEXT: Two-Address instruction pass ; CHECK-NEXT: Slot index numbering ; CHECK-NEXT: Live Interval Analysis +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Register Coalescer ; CHECK-NEXT: Rename Disconnected Subregister Components ; CHECK-NEXT: Machine Instruction Scheduler @@ -175,6 +178,7 @@ ; CHECK-NEXT: MachinePostDominator Tree Construction ; CHECK-NEXT: Lazy Machine Block Frequency Analysis ; CHECK-NEXT: Machine Optimization Remark Emitter +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Shrink Wrapping analysis ; CHECK-NEXT: Prologue/Epilogue Insertion & Frame Finalization ; CHECK-NEXT: Machine Late Instructions Cleanup Pass @@ -187,6 +191,7 @@ ; CHECK-NEXT: Insert KCFI indirect call checks ; CHECK-NEXT: MachineDominator Tree Construction ; CHECK-NEXT: Machine Natural Loop Construction +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: Post RA top-down list latency scheduler ; CHECK-NEXT: Analyze Machine Code For Garbage Collection ; CHECK-NEXT: Machine Block Frequency Analysis @@ -197,6 +202,7 @@ ; CHECK-NEXT: Implement the 'patchable-function' attribute ; CHECK-NEXT: Reaching Definitions Analysis ; CHECK-NEXT: X86 Execution Dependency Fix +; CHECK-NEXT: Machine Register Class Info Analysis ; CHECK-NEXT: BreakFalseDeps ; CHECK-NEXT: X86 Indirect Branch Tracking ; CHECK-NEXT: X86 vzeroupper inserter