1 //===-- RegUsageInfoCollector.cpp - Register Usage Information Collector --===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 /// This pass is required to take advantage of the interprocedural register
10 /// allocation infrastructure.
12 /// This pass is simple MachineFunction pass which collects register usage
13 /// details by iterating through each physical registers and checking
14 /// MRI::isPhysRegUsed() then creates a RegMask based on this details.
15 /// The pass then stores this RegMask in PhysicalRegisterUsageInfo.cpp
17 //===----------------------------------------------------------------------===//
19 #include "llvm/CodeGen/RegUsageInfoCollector.h"
20 #include "llvm/ADT/Statistic.h"
21 #include "llvm/CodeGen/MachineFunctionPass.h"
22 #include "llvm/CodeGen/MachineOperand.h"
23 #include "llvm/CodeGen/MachinePassManager.h"
24 #include "llvm/CodeGen/MachineRegisterInfo.h"
25 #include "llvm/CodeGen/Passes.h"
26 #include "llvm/CodeGen/RegisterUsageInfo.h"
27 #include "llvm/CodeGen/TargetFrameLowering.h"
28 #include "llvm/IR/Function.h"
29 #include "llvm/Support/Debug.h"
30 #include "llvm/Support/raw_ostream.h"
34 #define DEBUG_TYPE "ip-regalloc"
37 "Number of functions optimized for callee saved registers");
41 class RegUsageInfoCollector
{
42 PhysicalRegisterUsageInfo
&PRUI
;
45 RegUsageInfoCollector(PhysicalRegisterUsageInfo
&PRUI
) : PRUI(PRUI
) {}
46 bool run(MachineFunction
&MF
);
48 // Call getCalleeSaves and then also set the bits for subregs and
49 // fully saved superregs.
50 static void computeCalleeSavedRegs(BitVector
&SavedRegs
, MachineFunction
&MF
);
53 class RegUsageInfoCollectorLegacy
: public MachineFunctionPass
{
56 RegUsageInfoCollectorLegacy() : MachineFunctionPass(ID
) {
57 initializeRegUsageInfoCollectorLegacyPass(*PassRegistry::getPassRegistry());
60 StringRef
getPassName() const override
{
61 return "Register Usage Information Collector Pass";
64 void getAnalysisUsage(AnalysisUsage
&AU
) const override
{
65 AU
.addRequired
<PhysicalRegisterUsageInfoWrapperLegacy
>();
67 MachineFunctionPass::getAnalysisUsage(AU
);
70 bool runOnMachineFunction(MachineFunction
&MF
) override
;
72 } // end of anonymous namespace
74 char RegUsageInfoCollectorLegacy::ID
= 0;
76 INITIALIZE_PASS_BEGIN(RegUsageInfoCollectorLegacy
, "RegUsageInfoCollector",
77 "Register Usage Information Collector", false, false)
78 INITIALIZE_PASS_DEPENDENCY(PhysicalRegisterUsageInfoWrapperLegacy
)
79 INITIALIZE_PASS_END(RegUsageInfoCollectorLegacy
, "RegUsageInfoCollector",
80 "Register Usage Information Collector", false, false)
82 FunctionPass
*llvm::createRegUsageInfoCollector() {
83 return new RegUsageInfoCollectorLegacy();
86 // TODO: Move to hook somwehere?
88 // Return true if it is useful to track the used registers for IPRA / no CSR
89 // optimizations. This is not useful for entry points, and computing the
90 // register usage information is expensive.
91 static bool isCallableFunction(const MachineFunction
&MF
) {
92 switch (MF
.getFunction().getCallingConv()) {
93 case CallingConv::AMDGPU_VS
:
94 case CallingConv::AMDGPU_GS
:
95 case CallingConv::AMDGPU_PS
:
96 case CallingConv::AMDGPU_CS
:
97 case CallingConv::AMDGPU_HS
:
98 case CallingConv::AMDGPU_ES
:
99 case CallingConv::AMDGPU_LS
:
100 case CallingConv::AMDGPU_KERNEL
:
108 RegUsageInfoCollectorPass::run(MachineFunction
&MF
,
109 MachineFunctionAnalysisManager
&MFAM
) {
110 Module
&MFA
= *MF
.getFunction().getParent();
111 auto *PRUI
= MFAM
.getResult
<ModuleAnalysisManagerMachineFunctionProxy
>(MF
)
112 .getCachedResult
<PhysicalRegisterUsageAnalysis
>(MFA
);
113 assert(PRUI
&& "PhysicalRegisterUsageAnalysis not available");
114 RegUsageInfoCollector(*PRUI
).run(MF
);
115 return PreservedAnalyses::all();
118 bool RegUsageInfoCollectorLegacy::runOnMachineFunction(MachineFunction
&MF
) {
119 PhysicalRegisterUsageInfo
&PRUI
=
120 getAnalysis
<PhysicalRegisterUsageInfoWrapperLegacy
>().getPRUI();
121 return RegUsageInfoCollector(PRUI
).run(MF
);
124 bool RegUsageInfoCollector::run(MachineFunction
&MF
) {
125 MachineRegisterInfo
*MRI
= &MF
.getRegInfo();
126 const TargetRegisterInfo
*TRI
= MF
.getSubtarget().getRegisterInfo();
127 const TargetMachine
&TM
= MF
.getTarget();
131 << " -------------------- Register Usage Information Collector Pass"
132 << " -------------------- \nFunction Name : " << MF
.getName() << '\n');
134 // Analyzing the register usage may be expensive on some targets.
135 if (!isCallableFunction(MF
)) {
136 LLVM_DEBUG(dbgs() << "Not analyzing non-callable function\n");
140 // If there are no callers, there's no point in computing more precise
141 // register usage here.
142 if (MF
.getFunction().use_empty()) {
143 LLVM_DEBUG(dbgs() << "Not analyzing function with no callers\n");
147 std::vector
<uint32_t> RegMask
;
149 // Compute the size of the bit vector to represent all the registers.
150 // The bit vector is broken into 32-bit chunks, thus takes the ceil of
151 // the number of registers divided by 32 for the size.
152 unsigned RegMaskSize
= MachineOperand::getRegMaskSize(TRI
->getNumRegs());
153 RegMask
.resize(RegMaskSize
, ~((uint32_t)0));
155 const Function
&F
= MF
.getFunction();
157 PRUI
.setTargetMachine(TM
);
159 LLVM_DEBUG(dbgs() << "Clobbered Registers: ");
162 computeCalleeSavedRegs(SavedRegs
, MF
);
164 const BitVector
&UsedPhysRegsMask
= MRI
->getUsedPhysRegsMask();
165 auto SetRegAsDefined
= [&RegMask
] (unsigned Reg
) {
166 RegMask
[Reg
/ 32] &= ~(1u << Reg
% 32);
169 // Don't include $noreg in any regmasks.
170 SetRegAsDefined(MCRegister::NoRegister
);
172 // Some targets can clobber registers "inside" a call, typically in
173 // linker-generated code.
174 for (const MCPhysReg Reg
: TRI
->getIntraCallClobberedRegs(&MF
))
175 for (MCRegAliasIterator
AI(Reg
, TRI
, true); AI
.isValid(); ++AI
)
176 SetRegAsDefined(*AI
);
178 // Scan all the physical registers. When a register is defined in the current
179 // function set it and all the aliasing registers as defined in the regmask.
180 // FIXME: Rewrite to use regunits.
181 for (unsigned PReg
= 1, PRegE
= TRI
->getNumRegs(); PReg
< PRegE
; ++PReg
) {
182 // Don't count registers that are saved and restored.
183 if (SavedRegs
.test(PReg
))
185 // If a register is defined by an instruction mark it as defined together
186 // with all it's unsaved aliases.
187 if (!MRI
->def_empty(PReg
)) {
188 for (MCRegAliasIterator
AI(PReg
, TRI
, true); AI
.isValid(); ++AI
)
189 if (!SavedRegs
.test(*AI
))
190 SetRegAsDefined(*AI
);
193 // If a register is in the UsedPhysRegsMask set then mark it as defined.
194 // All clobbered aliases will also be in the set, so we can skip setting
195 // as defined all the aliases here.
196 if (UsedPhysRegsMask
.test(PReg
))
197 SetRegAsDefined(PReg
);
200 if (TargetFrameLowering::isSafeForNoCSROpt(F
) &&
201 MF
.getSubtarget().getFrameLowering()->isProfitableForNoCSROpt(F
)) {
203 LLVM_DEBUG(dbgs() << MF
.getName()
204 << " function optimized for not having CSR.\n");
208 for (unsigned PReg
= 1, PRegE
= TRI
->getNumRegs(); PReg
< PRegE
; ++PReg
) {
209 if (MachineOperand::clobbersPhysReg(&(RegMask
[0]), PReg
))
210 dbgs() << printReg(PReg
, TRI
) << " ";
213 dbgs() << " \n----------------------------------------\n";
216 PRUI
.storeUpdateRegUsageInfo(F
, RegMask
);
221 void RegUsageInfoCollector::
222 computeCalleeSavedRegs(BitVector
&SavedRegs
, MachineFunction
&MF
) {
223 const TargetFrameLowering
&TFI
= *MF
.getSubtarget().getFrameLowering();
224 const TargetRegisterInfo
&TRI
= *MF
.getSubtarget().getRegisterInfo();
226 // Target will return the set of registers that it saves/restores as needed.
228 TFI
.getCalleeSaves(MF
, SavedRegs
);
229 if (SavedRegs
.none())
233 const MCPhysReg
*CSRegs
= TRI
.getCalleeSavedRegs(&MF
);
234 for (unsigned i
= 0; CSRegs
[i
]; ++i
) {
235 MCPhysReg Reg
= CSRegs
[i
];
236 if (SavedRegs
.test(Reg
)) {
238 for (MCPhysReg SR
: TRI
.subregs(Reg
))