1 //==-- AArch64DeadRegisterDefinitions.cpp - Replace dead defs w/ zero reg --==//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
8 /// \file When allowed by the instruction, replace a dead definition of a GPR
9 /// with the zero register. This makes the code a bit friendlier towards the
10 /// hardware's register renamer.
11 //===----------------------------------------------------------------------===//
14 #include "AArch64RegisterInfo.h"
15 #include "AArch64Subtarget.h"
16 #include "llvm/ADT/Statistic.h"
17 #include "llvm/CodeGen/ISDOpcodes.h"
18 #include "llvm/CodeGen/MachineFunction.h"
19 #include "llvm/CodeGen/MachineFunctionPass.h"
20 #include "llvm/CodeGen/MachineInstr.h"
21 #include "llvm/CodeGen/MachineRegisterInfo.h"
22 #include "llvm/CodeGen/TargetInstrInfo.h"
23 #include "llvm/CodeGen/TargetSubtargetInfo.h"
24 #include "llvm/Support/Debug.h"
25 #include "llvm/Support/raw_ostream.h"
// Debug tag for this file; the same string is used as the pass argument in
// the INITIALIZE_PASS invocation further down.
28 #define DEBUG_TYPE "aarch64-dead-defs"
// Counter bumped once per dead definition handled by
// processMachineBasicBlock().
30 STATISTIC(NumDeadDefsReplaced
, "Number of dead definitions replaced");
// Human-readable pass name; returned by getPassName() and handed to
// INITIALIZE_PASS.
32 #define AARCH64_DEAD_REG_DEF_NAME "AArch64 Dead register definitions"
/// Machine-function pass that looks for dead register definitions and, when
/// the instruction allows it, substitutes the zero register (WZR/XZR).
35 class AArch64DeadRegisterDefinitions
: public MachineFunctionPass
{
// Query objects used while processing a function. runOnMachineFunction()
// assigns all three before it calls processMachineBasicBlock().
37 const TargetRegisterInfo
*TRI
;
38 const MachineRegisterInfo
*MRI
;
39 const TargetInstrInfo
*TII
;
// Per-basic-block worker; defined out of line below the class.
41 void processMachineBasicBlock(MachineBasicBlock
&MBB
);
43 static char ID
; // Pass identification, replacement for typeid.
// The constructor passes ID to the base class and runs this pass's
// initializer against the global PassRegistry.
44 AArch64DeadRegisterDefinitions() : MachineFunctionPass(ID
) {
45 initializeAArch64DeadRegisterDefinitionsPass(
46 *PassRegistry::getPassRegistry());
// Pass entry point; defined out of line below the class.
49 bool runOnMachineFunction(MachineFunction
&F
) override
;
// Reports the AARCH64_DEAD_REG_DEF_NAME string as the pass name.
51 StringRef
getPassName() const override
{ return AARCH64_DEAD_REG_DEF_NAME
; }
// Forwards AU to the MachineFunctionPass implementation.
// NOTE(review): any additional AU settings made here are not visible in this
// excerpt.
53 void getAnalysisUsage(AnalysisUsage
&AU
) const override
{
55 MachineFunctionPass::getAnalysisUsage(AU
);
// Out-of-class definition of the static ID member (the pass identification
// object declared in the class), initialized to zero.
58 char AArch64DeadRegisterDefinitions::ID
= 0;
59 } // end anonymous namespace
// Pass registration: associates the class with the "aarch64-dead-defs"
// argument string and the AARCH64_DEAD_REG_DEF_NAME description.
61 INITIALIZE_PASS(AArch64DeadRegisterDefinitions
, "aarch64-dead-defs",
62 AARCH64_DEAD_REG_DEF_NAME
, false, false)
/// Predicate evaluated over the use operands of \p MI.
/// processMachineBasicBlock() calls it first for every instruction and, when
/// it returns true, logs "operand is frame index" instead of touching the
/// instruction.
/// NOTE(review): the per-operand test and the return statements are not
/// visible in this excerpt -- presumably it checks each use for a frame-index
/// operand; confirm against the full file.
64 static bool usesFrameIndex(const MachineInstr
&MI
) {
65 for (const MachineOperand
&MO
: MI
.uses())
71 // Instructions that lose their 'read' operation for a subsequent fence acquire
72 // (DMB LD) once the zero register is used.
74 // WARNING: The acquire variants of the instructions are also affected, but they
75 // are split out into `atomicBarrierDroppedOnZero()` to support annotations on
77 static bool atomicReadDroppedOnZero(unsigned Opcode
) {
// Opcode list consulted by processMachineBasicBlock(): when this predicate
// (or atomicBarrierDroppedOnZero) holds, the instruction is left alone with
// the message "semantics change with xzr/wzr".
// The labels cover eight families -- LDADD, LDCLR, LDEOR, LDSET, LDSMAX,
// LDSMIN, LDUMAX, LDUMIN -- each in its B/H/W/X form, with and without the
// 'L' suffix.
// NOTE(review): the switch header and the return statements are not visible
// in this excerpt.
// LDADD family.
79 case AArch64::LDADDB
: case AArch64::LDADDH
:
80 case AArch64::LDADDW
: case AArch64::LDADDX
:
81 case AArch64::LDADDLB
: case AArch64::LDADDLH
:
82 case AArch64::LDADDLW
: case AArch64::LDADDLX
:
// LDCLR family.
83 case AArch64::LDCLRB
: case AArch64::LDCLRH
:
84 case AArch64::LDCLRW
: case AArch64::LDCLRX
:
85 case AArch64::LDCLRLB
: case AArch64::LDCLRLH
:
86 case AArch64::LDCLRLW
: case AArch64::LDCLRLX
:
// LDEOR family.
87 case AArch64::LDEORB
: case AArch64::LDEORH
:
88 case AArch64::LDEORW
: case AArch64::LDEORX
:
89 case AArch64::LDEORLB
: case AArch64::LDEORLH
:
90 case AArch64::LDEORLW
: case AArch64::LDEORLX
:
// LDSET family.
91 case AArch64::LDSETB
: case AArch64::LDSETH
:
92 case AArch64::LDSETW
: case AArch64::LDSETX
:
93 case AArch64::LDSETLB
: case AArch64::LDSETLH
:
94 case AArch64::LDSETLW
: case AArch64::LDSETLX
:
// LDSMAX family.
95 case AArch64::LDSMAXB
: case AArch64::LDSMAXH
:
96 case AArch64::LDSMAXW
: case AArch64::LDSMAXX
:
97 case AArch64::LDSMAXLB
: case AArch64::LDSMAXLH
:
98 case AArch64::LDSMAXLW
: case AArch64::LDSMAXLX
:
// LDSMIN family.
99 case AArch64::LDSMINB
: case AArch64::LDSMINH
:
100 case AArch64::LDSMINW
: case AArch64::LDSMINX
:
101 case AArch64::LDSMINLB
: case AArch64::LDSMINLH
:
102 case AArch64::LDSMINLW
: case AArch64::LDSMINLX
:
// LDUMAX family.
103 case AArch64::LDUMAXB
: case AArch64::LDUMAXH
:
104 case AArch64::LDUMAXW
: case AArch64::LDUMAXX
:
105 case AArch64::LDUMAXLB
: case AArch64::LDUMAXLH
:
106 case AArch64::LDUMAXLW
: case AArch64::LDUMAXLX
:
// LDUMIN family.
107 case AArch64::LDUMINB
: case AArch64::LDUMINH
:
108 case AArch64::LDUMINW
: case AArch64::LDUMINX
:
109 case AArch64::LDUMINLB
: case AArch64::LDUMINLH
:
110 case AArch64::LDUMINLW
: case AArch64::LDUMINLX
:
/// Visits every instruction of \p MBB looking for an explicit def operand that
/// is a dead virtual register and whose register class contains WZR or XZR,
/// so that the zero register can take its place.
///
/// An instruction is left untouched when it uses a frame index, already
/// defines XZR/WZR, or is one of the atomics whose semantics change with the
/// zero register. A def is left untouched when it is tied to a use operand or
/// its class contains neither zero register.
///
/// NOTE(review): several statements of this function (the skips after each
/// "Ignoring" message, the declaration of NewReg, and the operand rewrite
/// itself) are not visible in this excerpt.
116 void AArch64DeadRegisterDefinitions::processMachineBasicBlock(
117 MachineBasicBlock
&MBB
) {
118 const MachineFunction
&MF
= *MBB
.getParent();
119 for (MachineInstr
&MI
: MBB
) {
120 if (usesFrameIndex(MI
)) {
121 // We need to skip this instruction because while it appears to have a
122 // dead def it uses a frame index which might expand into a multi
123 // instruction sequence during EPI.
124 LLVM_DEBUG(dbgs() << " Ignoring, operand is frame index\n");
127 if (MI
.definesRegister(AArch64::XZR
) || MI
.definesRegister(AArch64::WZR
)) {
128 // It is not allowed to write to the same register (not even the zero
129 // register) twice in a single instruction.
132 << " Ignoring, XZR or WZR already used by the instruction\n");
// Both opcode predicates flag atomics that must keep a real destination.
136 if (atomicBarrierDroppedOnZero(MI
.getOpcode()) || atomicReadDroppedOnZero(MI
.getOpcode())) {
137 LLVM_DEBUG(dbgs() << " Ignoring, semantics change with xzr/wzr.\n");
// Only the explicit defs counted by the instruction description are
// examined; they occupy operand indices [0, getNumDefs()).
141 const MCInstrDesc
&Desc
= MI
.getDesc();
142 for (int I
= 0, E
= Desc
.getNumDefs(); I
!= E
; ++I
) {
143 MachineOperand
&MO
= MI
.getOperand(I
);
144 if (!MO
.isReg() || !MO
.isDef())
146 // We should not have any relevant physreg defs that are replaceable by
147 // zero before register allocation. So we just check for dead vreg defs.
148 Register Reg
= MO
.getReg();
// A virtual register counts as dead when the operand carries the dead flag
// or the register has no non-debug uses.
149 if (!Reg
.isVirtual() || (!MO
.isDead() && !MRI
->use_nodbg_empty(Reg
)))
151 assert(!MO
.isImplicit() && "Unexpected implicit def!");
152 LLVM_DEBUG(dbgs() << " Dead def operand #" << I
<< " in:\n ";
154 // Be careful not to change the register if it's a tied operand.
155 if (MI
.isRegTiedToUseOperand(I
)) {
156 LLVM_DEBUG(dbgs() << " Ignoring, def is tied operand.\n");
// The operand's register class decides which zero register may stand in for
// the def: WZR is checked first, then XZR; otherwise the def is ignored.
159 const TargetRegisterClass
*RC
= TII
->getRegClass(Desc
, I
, TRI
, MF
);
162 LLVM_DEBUG(dbgs() << " Ignoring, register is not a GPR.\n");
164 } else if (RC
->contains(AArch64::WZR
))
165 NewReg
= AArch64::WZR
;
166 else if (RC
->contains(AArch64::XZR
))
167 NewReg
= AArch64::XZR
;
169 LLVM_DEBUG(dbgs() << " Ignoring, register is not a GPR.\n");
172 LLVM_DEBUG(dbgs() << " Replacing with zero register. New:\n ");
175 LLVM_DEBUG(MI
.print(dbgs()));
176 ++NumDeadDefsReplaced
;
178 // Only replace one dead register, see check for zero register above.
184 // Scan the function for instructions that have a dead definition of a
185 // register. Replace that register with the zero register when possible.
//
// Stores the subtarget's register info and instruction info, plus the
// function's MachineRegisterInfo, in the pass members, then hands basic blocks
// to processMachineBasicBlock().
// NOTE(review): the loop that binds MBB and the return statements are not
// visible in this excerpt.
186 bool AArch64DeadRegisterDefinitions::runOnMachineFunction(MachineFunction
&MF
) {
// skipFunction() guard; the statement it controls (presumably an early
// return) is not visible in this excerpt.
187 if (skipFunction(MF
.getFunction()))
190 TRI
= MF
.getSubtarget().getRegisterInfo();
191 TII
= MF
.getSubtarget().getInstrInfo();
192 MRI
= &MF
.getRegInfo();
193 LLVM_DEBUG(dbgs() << "***** AArch64DeadRegisterDefinitions *****\n");
196 processMachineBasicBlock(MBB
);
/// Factory in namespace llvm: allocates a new AArch64DeadRegisterDefinitions
/// with `new` and returns it as a FunctionPass pointer.
/// NOTE(review): presumably the caller (the pass pipeline) takes ownership of
/// the returned object -- confirm.
200 FunctionPass
*llvm::createAArch64DeadRegisterDefinitions() {
201 return new AArch64DeadRegisterDefinitions();