[RISCV] Fix mgather -> riscv.masked.strided.load combine not extending indices (...
[llvm-project.git] / llvm / lib / CodeGen / GlobalISel / CSEMIRBuilder.cpp
blob64e2d517e3b9c48650d1e91d8a4709ec0355c142
1 //===-- llvm/CodeGen/GlobalISel/CSEMIRBuilder.cpp - MIBuilder--*- C++ -*-==//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 /// \file
9 /// This file implements the CSEMIRBuilder class which CSEs as it builds
10 /// instructions.
11 //===----------------------------------------------------------------------===//
14 #include "llvm/CodeGen/GlobalISel/CSEMIRBuilder.h"
15 #include "llvm/CodeGen/GlobalISel/CSEInfo.h"
16 #include "llvm/CodeGen/GlobalISel/GISelChangeObserver.h"
17 #include "llvm/CodeGen/GlobalISel/Utils.h"
18 #include "llvm/CodeGen/MachineInstrBuilder.h"
19 #include "llvm/IR/DebugInfoMetadata.h"
21 using namespace llvm;
23 bool CSEMIRBuilder::dominates(MachineBasicBlock::const_iterator A,
24 MachineBasicBlock::const_iterator B) const {
25 auto MBBEnd = getMBB().end();
26 if (B == MBBEnd)
27 return true;
28 assert(A->getParent() == B->getParent() &&
29 "Iterators should be in same block");
30 const MachineBasicBlock *BBA = A->getParent();
31 MachineBasicBlock::const_iterator I = BBA->begin();
32 for (; &*I != A && &*I != B; ++I)
34 return &*I == A;
37 MachineInstrBuilder
38 CSEMIRBuilder::getDominatingInstrForID(FoldingSetNodeID &ID,
39 void *&NodeInsertPos) {
40 GISelCSEInfo *CSEInfo = getCSEInfo();
41 assert(CSEInfo && "Can't get here without setting CSEInfo");
42 MachineBasicBlock *CurMBB = &getMBB();
43 MachineInstr *MI =
44 CSEInfo->getMachineInstrIfExists(ID, CurMBB, NodeInsertPos);
45 if (MI) {
46 CSEInfo->countOpcodeHit(MI->getOpcode());
47 auto CurrPos = getInsertPt();
48 auto MII = MachineBasicBlock::iterator(MI);
49 if (MII == CurrPos) {
50 // Move the insert point ahead of the instruction so any future uses of
51 // this builder will have the def ready.
52 setInsertPt(*CurMBB, std::next(MII));
53 } else if (!dominates(MI, CurrPos)) {
54 CurMBB->splice(CurrPos, CurMBB, MI);
56 return MachineInstrBuilder(getMF(), MI);
58 return MachineInstrBuilder();
61 bool CSEMIRBuilder::canPerformCSEForOpc(unsigned Opc) const {
62 const GISelCSEInfo *CSEInfo = getCSEInfo();
63 if (!CSEInfo || !CSEInfo->shouldCSE(Opc))
64 return false;
65 return true;
68 void CSEMIRBuilder::profileDstOp(const DstOp &Op,
69 GISelInstProfileBuilder &B) const {
70 switch (Op.getDstOpKind()) {
71 case DstOp::DstType::Ty_RC:
72 B.addNodeIDRegType(Op.getRegClass());
73 break;
74 case DstOp::DstType::Ty_Reg: {
75 // Regs can have LLT&(RB|RC). If those exist, profile them as well.
76 B.addNodeIDReg(Op.getReg());
77 break;
79 default:
80 B.addNodeIDRegType(Op.getLLTTy(*getMRI()));
81 break;
85 void CSEMIRBuilder::profileSrcOp(const SrcOp &Op,
86 GISelInstProfileBuilder &B) const {
87 switch (Op.getSrcOpKind()) {
88 case SrcOp::SrcType::Ty_Imm:
89 B.addNodeIDImmediate(static_cast<int64_t>(Op.getImm()));
90 break;
91 case SrcOp::SrcType::Ty_Predicate:
92 B.addNodeIDImmediate(static_cast<int64_t>(Op.getPredicate()));
93 break;
94 default:
95 B.addNodeIDRegType(Op.getReg());
96 break;
100 void CSEMIRBuilder::profileMBBOpcode(GISelInstProfileBuilder &B,
101 unsigned Opc) const {
102 // First add the MBB (Local CSE).
103 B.addNodeIDMBB(&getMBB());
104 // Then add the opcode.
105 B.addNodeIDOpcode(Opc);
108 void CSEMIRBuilder::profileEverything(unsigned Opc, ArrayRef<DstOp> DstOps,
109 ArrayRef<SrcOp> SrcOps,
110 std::optional<unsigned> Flags,
111 GISelInstProfileBuilder &B) const {
113 profileMBBOpcode(B, Opc);
114 // Then add the DstOps.
115 profileDstOps(DstOps, B);
116 // Then add the SrcOps.
117 profileSrcOps(SrcOps, B);
118 // Add Flags if passed in.
119 if (Flags)
120 B.addNodeIDFlag(*Flags);
123 MachineInstrBuilder CSEMIRBuilder::memoizeMI(MachineInstrBuilder MIB,
124 void *NodeInsertPos) {
125 assert(canPerformCSEForOpc(MIB->getOpcode()) &&
126 "Attempting to CSE illegal op");
127 MachineInstr *MIBInstr = MIB;
128 getCSEInfo()->insertInstr(MIBInstr, NodeInsertPos);
129 return MIB;
132 bool CSEMIRBuilder::checkCopyToDefsPossible(ArrayRef<DstOp> DstOps) {
133 if (DstOps.size() == 1)
134 return true; // always possible to emit copy to just 1 vreg.
136 return llvm::all_of(DstOps, [](const DstOp &Op) {
137 DstOp::DstType DT = Op.getDstOpKind();
138 return DT == DstOp::DstType::Ty_LLT || DT == DstOp::DstType::Ty_RC;
142 MachineInstrBuilder
143 CSEMIRBuilder::generateCopiesIfRequired(ArrayRef<DstOp> DstOps,
144 MachineInstrBuilder &MIB) {
145 assert(checkCopyToDefsPossible(DstOps) &&
146 "Impossible return a single MIB with copies to multiple defs");
147 if (DstOps.size() == 1) {
148 const DstOp &Op = DstOps[0];
149 if (Op.getDstOpKind() == DstOp::DstType::Ty_Reg)
150 return buildCopy(Op.getReg(), MIB.getReg(0));
153 // If we didn't generate a copy then we're re-using an existing node directly
154 // instead of emitting any code. Merge the debug location we wanted to emit
155 // into the instruction we're CSE'ing with. Debug locations arent part of the
156 // profile so we don't need to recompute it.
157 if (getDebugLoc()) {
158 GISelChangeObserver *Observer = getState().Observer;
159 if (Observer)
160 Observer->changingInstr(*MIB);
161 MIB->setDebugLoc(
162 DILocation::getMergedLocation(MIB->getDebugLoc(), getDebugLoc()));
163 if (Observer)
164 Observer->changedInstr(*MIB);
167 return MIB;
170 MachineInstrBuilder CSEMIRBuilder::buildInstr(unsigned Opc,
171 ArrayRef<DstOp> DstOps,
172 ArrayRef<SrcOp> SrcOps,
173 std::optional<unsigned> Flag) {
174 switch (Opc) {
175 default:
176 break;
177 case TargetOpcode::G_ADD:
178 case TargetOpcode::G_PTR_ADD:
179 case TargetOpcode::G_AND:
180 case TargetOpcode::G_ASHR:
181 case TargetOpcode::G_LSHR:
182 case TargetOpcode::G_MUL:
183 case TargetOpcode::G_OR:
184 case TargetOpcode::G_SHL:
185 case TargetOpcode::G_SUB:
186 case TargetOpcode::G_XOR:
187 case TargetOpcode::G_UDIV:
188 case TargetOpcode::G_SDIV:
189 case TargetOpcode::G_UREM:
190 case TargetOpcode::G_SREM:
191 case TargetOpcode::G_SMIN:
192 case TargetOpcode::G_SMAX:
193 case TargetOpcode::G_UMIN:
194 case TargetOpcode::G_UMAX: {
195 // Try to constant fold these.
196 assert(SrcOps.size() == 2 && "Invalid sources");
197 assert(DstOps.size() == 1 && "Invalid dsts");
198 LLT SrcTy = SrcOps[0].getLLTTy(*getMRI());
200 if (Opc == TargetOpcode::G_PTR_ADD &&
201 getDataLayout().isNonIntegralAddressSpace(SrcTy.getAddressSpace()))
202 break;
204 if (SrcTy.isVector()) {
205 // Try to constant fold vector constants.
206 SmallVector<APInt> VecCst = ConstantFoldVectorBinop(
207 Opc, SrcOps[0].getReg(), SrcOps[1].getReg(), *getMRI());
208 if (!VecCst.empty())
209 return buildBuildVectorConstant(DstOps[0], VecCst);
210 break;
213 if (std::optional<APInt> Cst = ConstantFoldBinOp(
214 Opc, SrcOps[0].getReg(), SrcOps[1].getReg(), *getMRI()))
215 return buildConstant(DstOps[0], *Cst);
216 break;
218 case TargetOpcode::G_FADD:
219 case TargetOpcode::G_FSUB:
220 case TargetOpcode::G_FMUL:
221 case TargetOpcode::G_FDIV:
222 case TargetOpcode::G_FREM:
223 case TargetOpcode::G_FMINNUM:
224 case TargetOpcode::G_FMAXNUM:
225 case TargetOpcode::G_FMINNUM_IEEE:
226 case TargetOpcode::G_FMAXNUM_IEEE:
227 case TargetOpcode::G_FMINIMUM:
228 case TargetOpcode::G_FMAXIMUM:
229 case TargetOpcode::G_FCOPYSIGN: {
230 // Try to constant fold these.
231 assert(SrcOps.size() == 2 && "Invalid sources");
232 assert(DstOps.size() == 1 && "Invalid dsts");
233 if (std::optional<APFloat> Cst = ConstantFoldFPBinOp(
234 Opc, SrcOps[0].getReg(), SrcOps[1].getReg(), *getMRI()))
235 return buildFConstant(DstOps[0], *Cst);
236 break;
238 case TargetOpcode::G_SEXT_INREG: {
239 assert(DstOps.size() == 1 && "Invalid dst ops");
240 assert(SrcOps.size() == 2 && "Invalid src ops");
241 const DstOp &Dst = DstOps[0];
242 const SrcOp &Src0 = SrcOps[0];
243 const SrcOp &Src1 = SrcOps[1];
244 if (auto MaybeCst =
245 ConstantFoldExtOp(Opc, Src0.getReg(), Src1.getImm(), *getMRI()))
246 return buildConstant(Dst, *MaybeCst);
247 break;
249 case TargetOpcode::G_SITOFP:
250 case TargetOpcode::G_UITOFP: {
251 // Try to constant fold these.
252 assert(SrcOps.size() == 1 && "Invalid sources");
253 assert(DstOps.size() == 1 && "Invalid dsts");
254 if (std::optional<APFloat> Cst = ConstantFoldIntToFloat(
255 Opc, DstOps[0].getLLTTy(*getMRI()), SrcOps[0].getReg(), *getMRI()))
256 return buildFConstant(DstOps[0], *Cst);
257 break;
259 case TargetOpcode::G_CTLZ: {
260 assert(SrcOps.size() == 1 && "Expected one source");
261 assert(DstOps.size() == 1 && "Expected one dest");
262 auto MaybeCsts = ConstantFoldCTLZ(SrcOps[0].getReg(), *getMRI());
263 if (!MaybeCsts)
264 break;
265 if (MaybeCsts->size() == 1)
266 return buildConstant(DstOps[0], (*MaybeCsts)[0]);
267 // This was a vector constant. Build a G_BUILD_VECTOR for them.
268 SmallVector<Register> ConstantRegs;
269 LLT VecTy = DstOps[0].getLLTTy(*getMRI());
270 for (unsigned Cst : *MaybeCsts)
271 ConstantRegs.emplace_back(
272 buildConstant(VecTy.getScalarType(), Cst).getReg(0));
273 return buildBuildVector(DstOps[0], ConstantRegs);
276 bool CanCopy = checkCopyToDefsPossible(DstOps);
277 if (!canPerformCSEForOpc(Opc))
278 return MachineIRBuilder::buildInstr(Opc, DstOps, SrcOps, Flag);
279 // If we can CSE this instruction, but involves generating copies to multiple
280 // regs, give up. This frequently happens to UNMERGEs.
281 if (!CanCopy) {
282 auto MIB = MachineIRBuilder::buildInstr(Opc, DstOps, SrcOps, Flag);
283 // CSEInfo would have tracked this instruction. Remove it from the temporary
284 // insts.
285 getCSEInfo()->handleRemoveInst(&*MIB);
286 return MIB;
288 FoldingSetNodeID ID;
289 GISelInstProfileBuilder ProfBuilder(ID, *getMRI());
290 void *InsertPos = nullptr;
291 profileEverything(Opc, DstOps, SrcOps, Flag, ProfBuilder);
292 MachineInstrBuilder MIB = getDominatingInstrForID(ID, InsertPos);
293 if (MIB) {
294 // Handle generating copies here.
295 return generateCopiesIfRequired(DstOps, MIB);
297 // This instruction does not exist in the CSEInfo. Build it and CSE it.
298 MachineInstrBuilder NewMIB =
299 MachineIRBuilder::buildInstr(Opc, DstOps, SrcOps, Flag);
300 return memoizeMI(NewMIB, InsertPos);
303 MachineInstrBuilder CSEMIRBuilder::buildConstant(const DstOp &Res,
304 const ConstantInt &Val) {
305 constexpr unsigned Opc = TargetOpcode::G_CONSTANT;
306 if (!canPerformCSEForOpc(Opc))
307 return MachineIRBuilder::buildConstant(Res, Val);
309 // For vectors, CSE the element only for now.
310 LLT Ty = Res.getLLTTy(*getMRI());
311 if (Ty.isVector())
312 return buildSplatVector(Res, buildConstant(Ty.getElementType(), Val));
314 FoldingSetNodeID ID;
315 GISelInstProfileBuilder ProfBuilder(ID, *getMRI());
316 void *InsertPos = nullptr;
317 profileMBBOpcode(ProfBuilder, Opc);
318 profileDstOp(Res, ProfBuilder);
319 ProfBuilder.addNodeIDMachineOperand(MachineOperand::CreateCImm(&Val));
320 MachineInstrBuilder MIB = getDominatingInstrForID(ID, InsertPos);
321 if (MIB) {
322 // Handle generating copies here.
323 return generateCopiesIfRequired({Res}, MIB);
326 MachineInstrBuilder NewMIB = MachineIRBuilder::buildConstant(Res, Val);
327 return memoizeMI(NewMIB, InsertPos);
330 MachineInstrBuilder CSEMIRBuilder::buildFConstant(const DstOp &Res,
331 const ConstantFP &Val) {
332 constexpr unsigned Opc = TargetOpcode::G_FCONSTANT;
333 if (!canPerformCSEForOpc(Opc))
334 return MachineIRBuilder::buildFConstant(Res, Val);
336 // For vectors, CSE the element only for now.
337 LLT Ty = Res.getLLTTy(*getMRI());
338 if (Ty.isVector())
339 return buildSplatVector(Res, buildFConstant(Ty.getElementType(), Val));
341 FoldingSetNodeID ID;
342 GISelInstProfileBuilder ProfBuilder(ID, *getMRI());
343 void *InsertPos = nullptr;
344 profileMBBOpcode(ProfBuilder, Opc);
345 profileDstOp(Res, ProfBuilder);
346 ProfBuilder.addNodeIDMachineOperand(MachineOperand::CreateFPImm(&Val));
347 MachineInstrBuilder MIB = getDominatingInstrForID(ID, InsertPos);
348 if (MIB) {
349 // Handle generating copies here.
350 return generateCopiesIfRequired({Res}, MIB);
352 MachineInstrBuilder NewMIB = MachineIRBuilder::buildFConstant(Res, Val);
353 return memoizeMI(NewMIB, InsertPos);