https://github.com/Akshat-Oke updated https://github.com/llvm/llvm-project/pull/109939
>From 4c5184af67fb5eaeec1eb971421b8a3030b22c76 Mon Sep 17 00:00:00 2001 From: Akshat Oke <akshat....@amd.com> Date: Tue, 24 Sep 2024 11:41:18 +0000 Subject: [PATCH] [NewPM][AMDGPU] Port SIPreAllocateWWMRegs to NPM --- llvm/lib/Target/AMDGPU/AMDGPU.h | 6 +- llvm/lib/Target/AMDGPU/AMDGPUPassRegistry.def | 1 + .../lib/Target/AMDGPU/AMDGPUTargetMachine.cpp | 7 ++- .../Target/AMDGPU/SIPreAllocateWWMRegs.cpp | 60 ++++++++++++------- llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.h | 30 ++++++++++ 5 files changed, 77 insertions(+), 27 deletions(-) create mode 100644 llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.h diff --git a/llvm/lib/Target/AMDGPU/AMDGPU.h b/llvm/lib/Target/AMDGPU/AMDGPU.h index b2dd354e496a2e..c0fd5e4625895a 100644 --- a/llvm/lib/Target/AMDGPU/AMDGPU.h +++ b/llvm/lib/Target/AMDGPU/AMDGPU.h @@ -49,7 +49,7 @@ FunctionPass *createSIFixSGPRCopiesLegacyPass(); FunctionPass *createLowerWWMCopiesPass(); FunctionPass *createSIMemoryLegalizerPass(); FunctionPass *createSIInsertWaitcntsPass(); -FunctionPass *createSIPreAllocateWWMRegsPass(); +FunctionPass *createSIPreAllocateWWMRegsLegacyPass(); FunctionPass *createSIFormMemoryClausesPass(); FunctionPass *createSIPostRABundlerPass(); @@ -208,8 +208,8 @@ extern char &SILateBranchLoweringPassID; void initializeSIOptimizeExecMaskingPass(PassRegistry &); extern char &SIOptimizeExecMaskingID; -void initializeSIPreAllocateWWMRegsPass(PassRegistry &); -extern char &SIPreAllocateWWMRegsID; +void initializeSIPreAllocateWWMRegsLegacyPass(PassRegistry &); +extern char &SIPreAllocateWWMRegsLegacyID; void initializeAMDGPUImageIntrinsicOptimizerPass(PassRegistry &); extern char &AMDGPUImageIntrinsicOptimizerID; diff --git a/llvm/lib/Target/AMDGPU/AMDGPUPassRegistry.def b/llvm/lib/Target/AMDGPU/AMDGPUPassRegistry.def index 0ebf34c901c142..174a90f0aa419d 100644 --- a/llvm/lib/Target/AMDGPU/AMDGPUPassRegistry.def +++ b/llvm/lib/Target/AMDGPU/AMDGPUPassRegistry.def @@ -102,5 +102,6 @@ MACHINE_FUNCTION_PASS("gcn-dpp-combine", GCNDPPCombinePass()) MACHINE_FUNCTION_PASS("si-load-store-opt", SILoadStoreOptimizerPass()) MACHINE_FUNCTION_PASS("si-lower-sgpr-spills", SILowerSGPRSpillsPass()) MACHINE_FUNCTION_PASS("si-peephole-sdwa", SIPeepholeSDWAPass()) +MACHINE_FUNCTION_PASS("si-pre-allocate-wwm-regs", SIPreAllocateWWMRegsPass()) MACHINE_FUNCTION_PASS("si-shrink-instructions", SIShrinkInstructionsPass()) #undef MACHINE_FUNCTION_PASS diff --git a/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp b/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp index 04fdee0819b502..9a28c648e2c4ed 100644 --- a/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp +++ b/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp @@ -41,6 +41,7 @@ #include "SIMachineFunctionInfo.h" #include "SIMachineScheduler.h" #include "SIPeepholeSDWA.h" +#include "SIPreAllocateWWMRegs.h" #include "SIShrinkInstructions.h" #include "TargetInfo/AMDGPUTargetInfo.h" #include "Utils/AMDGPUBaseInfo.h" @@ -461,7 +462,7 @@ extern "C" LLVM_EXTERNAL_VISIBILITY void LLVMInitializeAMDGPUTarget() { initializeSILateBranchLoweringPass(*PR); initializeSIMemoryLegalizerPass(*PR); initializeSIOptimizeExecMaskingPass(*PR); - initializeSIPreAllocateWWMRegsPass(*PR); + initializeSIPreAllocateWWMRegsLegacyPass(*PR); initializeSIFormMemoryClausesPass(*PR); initializeSIPostRABundlerPass(*PR); initializeGCNCreateVOPDPass(*PR); @@ -1443,7 +1444,7 @@ bool GCNPassConfig::addRegAssignAndRewriteFast() { // Equivalent of PEI for SGPRs. addPass(&SILowerSGPRSpillsLegacyID); - addPass(&SIPreAllocateWWMRegsID); + addPass(&SIPreAllocateWWMRegsLegacyID); addPass(createVGPRAllocPass(false)); @@ -1467,7 +1468,7 @@ bool GCNPassConfig::addRegAssignAndRewriteOptimized() { // Equivalent of PEI for SGPRs. addPass(&SILowerSGPRSpillsLegacyID); - addPass(&SIPreAllocateWWMRegsID); + addPass(&SIPreAllocateWWMRegsLegacyID); addPass(createVGPRAllocPass(true)); diff --git a/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.cpp b/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.cpp index 0635cab7b872e2..c1d7a464a81537 100644 --- a/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.cpp +++ b/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.cpp @@ -11,6 +11,7 @@ // //===----------------------------------------------------------------------===// +#include "SIPreAllocateWWMRegs.h" #include "AMDGPU.h" #include "GCNSubtarget.h" #include "MCTargetDesc/AMDGPUMCTargetDesc.h" @@ -34,7 +35,7 @@ static cl::opt<bool> namespace { -class SIPreAllocateWWMRegs : public MachineFunctionPass { +class SIPreAllocateWWMRegs { private: const SIInstrInfo *TII; const SIRegisterInfo *TRI; @@ -48,13 +49,21 @@ class SIPreAllocateWWMRegs : public MachineFunctionPass { #ifndef NDEBUG void printWWMInfo(const MachineInstr &MI); #endif + bool processDef(MachineOperand &MO); + void rewriteRegs(MachineFunction &MF); + +public: + SIPreAllocateWWMRegs(LiveIntervals *LIS, LiveRegMatrix *Matrix, + VirtRegMap *VRM) + : LIS(LIS), Matrix(Matrix), VRM(VRM) {} + bool run(MachineFunction &MF); +}; +class SIPreAllocateWWMRegsLegacy : public MachineFunctionPass { public: static char ID; - SIPreAllocateWWMRegs() : MachineFunctionPass(ID) { - initializeSIPreAllocateWWMRegsPass(*PassRegistry::getPassRegistry()); - } + SIPreAllocateWWMRegsLegacy() : MachineFunctionPass(ID) {} bool runOnMachineFunction(MachineFunction &MF) override; @@ -65,28 +74,24 @@ class SIPreAllocateWWMRegs : public MachineFunctionPass { AU.setPreservesAll(); MachineFunctionPass::getAnalysisUsage(AU); } - -private: - bool processDef(MachineOperand &MO); - void rewriteRegs(MachineFunction &MF); }; } // End anonymous namespace. -INITIALIZE_PASS_BEGIN(SIPreAllocateWWMRegs, DEBUG_TYPE, - "SI Pre-allocate WWM Registers", false, false) +INITIALIZE_PASS_BEGIN(SIPreAllocateWWMRegsLegacy, DEBUG_TYPE, + "SI Pre-allocate WWM Registers", false, false) INITIALIZE_PASS_DEPENDENCY(LiveIntervalsWrapperPass) INITIALIZE_PASS_DEPENDENCY(VirtRegMapWrapperPass) INITIALIZE_PASS_DEPENDENCY(LiveRegMatrixWrapperPass) -INITIALIZE_PASS_END(SIPreAllocateWWMRegs, DEBUG_TYPE, - "SI Pre-allocate WWM Registers", false, false) +INITIALIZE_PASS_END(SIPreAllocateWWMRegsLegacy, DEBUG_TYPE, + "SI Pre-allocate WWM Registers", false, false) -char SIPreAllocateWWMRegs::ID = 0; +char SIPreAllocateWWMRegsLegacy::ID = 0; -char &llvm::SIPreAllocateWWMRegsID = SIPreAllocateWWMRegs::ID; +char &llvm::SIPreAllocateWWMRegsLegacyID = SIPreAllocateWWMRegsLegacy::ID; -FunctionPass *llvm::createSIPreAllocateWWMRegsPass() { - return new SIPreAllocateWWMRegs(); +FunctionPass *llvm::createSIPreAllocateWWMRegsLegacyPass() { + return new SIPreAllocateWWMRegsLegacy(); } bool SIPreAllocateWWMRegs::processDef(MachineOperand &MO) { @@ -184,7 +189,14 @@ SIPreAllocateWWMRegs::printWWMInfo(const MachineInstr &MI) { #endif -bool SIPreAllocateWWMRegs::runOnMachineFunction(MachineFunction &MF) { +bool SIPreAllocateWWMRegsLegacy::runOnMachineFunction(MachineFunction &MF) { + auto *LIS = &getAnalysis<LiveIntervalsWrapperPass>().getLIS(); + auto *Matrix = &getAnalysis<LiveRegMatrixWrapperPass>().getLRM(); + auto *VRM = &getAnalysis<VirtRegMapWrapperPass>().getVRM(); + return SIPreAllocateWWMRegs(LIS, Matrix, VRM).run(MF); +} + +bool SIPreAllocateWWMRegs::run(MachineFunction &MF) { LLVM_DEBUG(dbgs() << "SIPreAllocateWWMRegs: function " << MF.getName() << "\n"); const GCNSubtarget &ST = MF.getSubtarget<GCNSubtarget>(); @@ -193,10 +205,6 @@ bool SIPreAllocateWWMRegs::runOnMachineFunction(MachineFunction &MF) { TRI = &TII->getRegisterInfo(); MRI = &MF.getRegInfo(); - LIS = &getAnalysis<LiveIntervalsWrapperPass>().getLIS(); - Matrix = &getAnalysis<LiveRegMatrixWrapperPass>().getLRM(); - VRM = &getAnalysis<VirtRegMapWrapperPass>().getVRM(); - RegClassInfo.runOnMachineFunction(MF); bool PreallocateSGPRSpillVGPRs = @@ -254,3 +262,13 @@ bool SIPreAllocateWWMRegs::runOnMachineFunction(MachineFunction &MF) { rewriteRegs(MF); return true; } + +PreservedAnalyses +SIPreAllocateWWMRegsPass::run(MachineFunction &MF, + MachineFunctionAnalysisManager &MFAM) { + auto *LIS = &MFAM.getResult<LiveIntervalsAnalysis>(MF); + auto *Matrix = &MFAM.getResult<LiveRegMatrixAnalysis>(MF); + auto *VRM = &MFAM.getResult<VirtRegMapAnalysis>(MF); + SIPreAllocateWWMRegs(LIS, Matrix, VRM).run(MF); + return PreservedAnalyses::all(); +} diff --git a/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.h b/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.h new file mode 100644 index 00000000000000..b86f7fe9213af0 --- /dev/null +++ b/llvm/lib/Target/AMDGPU/SIPreAllocateWWMRegs.h @@ -0,0 +1,30 @@ +//===--- SIPreAllocateWWMRegs.h -------------------------------------------===// +// +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +//===----------------------------------------------------------------------===// + +#ifndef LLVM_LIB_TARGET_AMDGPU_SIPREALLOCATEWWMREGS_H +#define LLVM_LIB_TARGET_AMDGPU_SIPREALLOCATEWWMREGS_H + +#include "llvm/CodeGen/MachinePassManager.h" + +namespace llvm { + +class SIPreAllocateWWMRegsPass + : public PassInfoMixin<SIPreAllocateWWMRegsPass> { +public: + PreservedAnalyses run(MachineFunction &MF, + MachineFunctionAnalysisManager &MFAM); + + MachineFunctionProperties getRequiredProperties() { + return MachineFunctionProperties().set( + MachineFunctionProperties::Property::IsSSA); + } +}; + +} // namespace llvm + +#endif // LLVM_LIB_TARGET_AMDGPU_SIPREALLOCATEWWMREGS_H _______________________________________________ llvm-branch-commits mailing list llvm-branch-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/llvm-branch-commits