1 //===- SIPreAllocateWWMRegs.cpp - WWM Register Pre-allocation -------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
10 /// Pass to pre-allocated WWM registers
12 //===----------------------------------------------------------------------===//
15 #include "AMDGPUSubtarget.h"
16 #include "SIInstrInfo.h"
17 #include "SIRegisterInfo.h"
18 #include "SIMachineFunctionInfo.h"
19 #include "MCTargetDesc/AMDGPUMCTargetDesc.h"
20 #include "llvm/ADT/PostOrderIterator.h"
21 #include "llvm/CodeGen/VirtRegMap.h"
22 #include "llvm/CodeGen/LiveInterval.h"
23 #include "llvm/CodeGen/LiveIntervals.h"
24 #include "llvm/CodeGen/LiveRegMatrix.h"
25 #include "llvm/CodeGen/MachineDominators.h"
26 #include "llvm/CodeGen/MachineFunctionPass.h"
27 #include "llvm/CodeGen/RegisterClassInfo.h"
31 #define DEBUG_TYPE "si-pre-allocate-wwm-regs"
35 class SIPreAllocateWWMRegs
: public MachineFunctionPass
{
37 const SIInstrInfo
*TII
;
38 const SIRegisterInfo
*TRI
;
39 MachineRegisterInfo
*MRI
;
41 LiveRegMatrix
*Matrix
;
43 RegisterClassInfo RegClassInfo
;
45 std::vector
<unsigned> RegsToRewrite
;
50 SIPreAllocateWWMRegs() : MachineFunctionPass(ID
) {
51 initializeSIPreAllocateWWMRegsPass(*PassRegistry::getPassRegistry());
54 bool runOnMachineFunction(MachineFunction
&MF
) override
;
56 void getAnalysisUsage(AnalysisUsage
&AU
) const override
{
57 AU
.addRequired
<LiveIntervals
>();
58 AU
.addPreserved
<LiveIntervals
>();
59 AU
.addRequired
<VirtRegMap
>();
60 AU
.addRequired
<LiveRegMatrix
>();
61 AU
.addPreserved
<SlotIndexes
>();
63 MachineFunctionPass::getAnalysisUsage(AU
);
67 bool processDef(MachineOperand
&MO
);
68 void rewriteRegs(MachineFunction
&MF
);
71 } // End anonymous namespace.
73 INITIALIZE_PASS_BEGIN(SIPreAllocateWWMRegs
, DEBUG_TYPE
,
74 "SI Pre-allocate WWM Registers", false, false)
75 INITIALIZE_PASS_DEPENDENCY(LiveIntervals
)
76 INITIALIZE_PASS_DEPENDENCY(VirtRegMap
)
77 INITIALIZE_PASS_DEPENDENCY(LiveRegMatrix
)
78 INITIALIZE_PASS_END(SIPreAllocateWWMRegs
, DEBUG_TYPE
,
79 "SI Pre-allocate WWM Registers", false, false)
81 char SIPreAllocateWWMRegs::ID
= 0;
83 char &llvm::SIPreAllocateWWMRegsID
= SIPreAllocateWWMRegs::ID
;
85 FunctionPass
*llvm::createSIPreAllocateWWMRegsPass() {
86 return new SIPreAllocateWWMRegs();
89 bool SIPreAllocateWWMRegs::processDef(MachineOperand
&MO
) {
93 unsigned Reg
= MO
.getReg();
95 if (!TRI
->isVGPR(*MRI
, Reg
))
98 if (TRI
->isPhysicalRegister(Reg
))
101 if (VRM
->hasPhys(Reg
))
104 LiveInterval
&LI
= LIS
->getInterval(Reg
);
106 for (unsigned PhysReg
: RegClassInfo
.getOrder(MRI
->getRegClass(Reg
))) {
107 if (!MRI
->isPhysRegUsed(PhysReg
) &&
108 Matrix
->checkInterference(LI
, PhysReg
) == LiveRegMatrix::IK_Free
) {
109 Matrix
->assign(LI
, PhysReg
);
110 assert(PhysReg
!= 0);
111 RegsToRewrite
.push_back(Reg
);
116 llvm_unreachable("physreg not found for WWM expression");
120 void SIPreAllocateWWMRegs::rewriteRegs(MachineFunction
&MF
) {
121 for (MachineBasicBlock
&MBB
: MF
) {
122 for (MachineInstr
&MI
: MBB
) {
123 for (MachineOperand
&MO
: MI
.operands()) {
127 const unsigned VirtReg
= MO
.getReg();
128 if (TRI
->isPhysicalRegister(VirtReg
))
131 if (!VRM
->hasPhys(VirtReg
))
134 unsigned PhysReg
= VRM
->getPhys(VirtReg
);
135 const unsigned SubReg
= MO
.getSubReg();
137 PhysReg
= TRI
->getSubReg(PhysReg
, SubReg
);
142 MO
.setIsRenamable(false);
147 SIMachineFunctionInfo
*MFI
= MF
.getInfo
<SIMachineFunctionInfo
>();
149 for (unsigned Reg
: RegsToRewrite
) {
150 LIS
->removeInterval(Reg
);
152 const unsigned PhysReg
= VRM
->getPhys(Reg
);
153 assert(PhysReg
!= 0);
154 MFI
->ReserveWWMRegister(PhysReg
);
157 RegsToRewrite
.clear();
159 // Update the set of reserved registers to include WWM ones.
160 MRI
->freezeReservedRegs(MF
);
163 bool SIPreAllocateWWMRegs::runOnMachineFunction(MachineFunction
&MF
) {
164 LLVM_DEBUG(dbgs() << "SIPreAllocateWWMRegs: function " << MF
.getName() << "\n");
166 const GCNSubtarget
&ST
= MF
.getSubtarget
<GCNSubtarget
>();
168 TII
= ST
.getInstrInfo();
169 TRI
= &TII
->getRegisterInfo();
170 MRI
= &MF
.getRegInfo();
172 LIS
= &getAnalysis
<LiveIntervals
>();
173 Matrix
= &getAnalysis
<LiveRegMatrix
>();
174 VRM
= &getAnalysis
<VirtRegMap
>();
176 RegClassInfo
.runOnMachineFunction(MF
);
178 bool RegsAssigned
= false;
180 // We use a reverse post-order traversal of the control-flow graph to
181 // guarantee that we visit definitions in dominance order. Since WWM
182 // expressions are guaranteed to never involve phi nodes, and we can only
183 // escape WWM through the special WWM instruction, this means that this is a
184 // perfect elimination order, so we can never do any better.
185 ReversePostOrderTraversal
<MachineFunction
*> RPOT(&MF
);
187 for (MachineBasicBlock
*MBB
: RPOT
) {
189 for (MachineInstr
&MI
: *MBB
) {
190 if (MI
.getOpcode() == AMDGPU::V_SET_INACTIVE_B32
||
191 MI
.getOpcode() == AMDGPU::V_SET_INACTIVE_B64
)
192 RegsAssigned
|= processDef(MI
.getOperand(0));
194 if (MI
.getOpcode() == AMDGPU::ENTER_WWM
) {
195 LLVM_DEBUG(dbgs() << "entering WWM region: " << MI
<< "\n");
200 if (MI
.getOpcode() == AMDGPU::EXIT_WWM
) {
201 LLVM_DEBUG(dbgs() << "exiting WWM region: " << MI
<< "\n");
208 LLVM_DEBUG(dbgs() << "processing " << MI
<< "\n");
210 for (MachineOperand
&DefOpnd
: MI
.defs()) {
211 RegsAssigned
|= processDef(DefOpnd
);