1 //===- HexagonSplitDouble.cpp ---------------------------------------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include "HexagonInstrInfo.h"
10 #include "HexagonRegisterInfo.h"
11 #include "HexagonSubtarget.h"
12 #include "llvm/ADT/BitVector.h"
13 #include "llvm/ADT/STLExtras.h"
14 #include "llvm/ADT/SmallVector.h"
15 #include "llvm/ADT/StringRef.h"
16 #include "llvm/CodeGen/MachineBasicBlock.h"
17 #include "llvm/CodeGen/MachineFunction.h"
18 #include "llvm/CodeGen/MachineFunctionPass.h"
19 #include "llvm/CodeGen/MachineInstr.h"
20 #include "llvm/CodeGen/MachineInstrBuilder.h"
21 #include "llvm/CodeGen/MachineLoopInfo.h"
22 #include "llvm/CodeGen/MachineMemOperand.h"
23 #include "llvm/CodeGen/MachineOperand.h"
24 #include "llvm/CodeGen/MachineRegisterInfo.h"
25 #include "llvm/CodeGen/TargetRegisterInfo.h"
26 #include "llvm/Config/llvm-config.h"
27 #include "llvm/IR/DebugLoc.h"
28 #include "llvm/Pass.h"
29 #include "llvm/Support/CommandLine.h"
30 #include "llvm/Support/Compiler.h"
31 #include "llvm/Support/Debug.h"
32 #include "llvm/Support/ErrorHandling.h"
33 #include "llvm/Support/raw_ostream.h"
43 #define DEBUG_TYPE "hsdr"
49 FunctionPass
*createHexagonSplitDoubleRegs();
50 void initializeHexagonSplitDoubleRegsPass(PassRegistry
&);
52 } // end namespace llvm
54 static cl::opt
<int> MaxHSDR("max-hsdr", cl::Hidden
, cl::init(-1),
55 cl::desc("Maximum number of split partitions"));
56 static cl::opt
<bool> MemRefsFixed("hsdr-no-mem", cl::Hidden
, cl::init(true),
57 cl::desc("Do not split loads or stores"));
58 static cl::opt
<bool> SplitAll("hsdr-split-all", cl::Hidden
, cl::init(false),
59 cl::desc("Split all partitions"));
63 class HexagonSplitDoubleRegs
: public MachineFunctionPass
{
67 HexagonSplitDoubleRegs() : MachineFunctionPass(ID
) {}
69 StringRef
getPassName() const override
{
70 return "Hexagon Split Double Registers";
73 void getAnalysisUsage(AnalysisUsage
&AU
) const override
{
74 AU
.addRequired
<MachineLoopInfo
>();
75 AU
.addPreserved
<MachineLoopInfo
>();
76 MachineFunctionPass::getAnalysisUsage(AU
);
79 bool runOnMachineFunction(MachineFunction
&MF
) override
;
82 static const TargetRegisterClass
*const DoubleRC
;
84 const HexagonRegisterInfo
*TRI
= nullptr;
85 const HexagonInstrInfo
*TII
= nullptr;
86 const MachineLoopInfo
*MLI
;
87 MachineRegisterInfo
*MRI
;
89 using USet
= std::set
<unsigned>;
90 using UUSetMap
= std::map
<unsigned, USet
>;
91 using UUPair
= std::pair
<unsigned, unsigned>;
92 using UUPairMap
= std::map
<unsigned, UUPair
>;
93 using LoopRegMap
= std::map
<const MachineLoop
*, USet
>;
95 bool isInduction(unsigned Reg
, LoopRegMap
&IRM
) const;
96 bool isVolatileInstr(const MachineInstr
*MI
) const;
97 bool isFixedInstr(const MachineInstr
*MI
) const;
98 void partitionRegisters(UUSetMap
&P2Rs
);
99 int32_t profit(const MachineInstr
*MI
) const;
100 int32_t profit(Register Reg
) const;
101 bool isProfitable(const USet
&Part
, LoopRegMap
&IRM
) const;
103 void collectIndRegsForLoop(const MachineLoop
*L
, USet
&Rs
);
104 void collectIndRegs(LoopRegMap
&IRM
);
106 void createHalfInstr(unsigned Opc
, MachineInstr
*MI
,
107 const UUPairMap
&PairMap
, unsigned SubR
);
108 void splitMemRef(MachineInstr
*MI
, const UUPairMap
&PairMap
);
109 void splitImmediate(MachineInstr
*MI
, const UUPairMap
&PairMap
);
110 void splitCombine(MachineInstr
*MI
, const UUPairMap
&PairMap
);
111 void splitExt(MachineInstr
*MI
, const UUPairMap
&PairMap
);
112 void splitShift(MachineInstr
*MI
, const UUPairMap
&PairMap
);
113 void splitAslOr(MachineInstr
*MI
, const UUPairMap
&PairMap
);
114 bool splitInstr(MachineInstr
*MI
, const UUPairMap
&PairMap
);
115 void replaceSubregUses(MachineInstr
*MI
, const UUPairMap
&PairMap
);
116 void collapseRegPairs(MachineInstr
*MI
, const UUPairMap
&PairMap
);
117 bool splitPartition(const USet
&Part
);
121 static void dump_partition(raw_ostream
&, const USet
&,
122 const TargetRegisterInfo
&);
125 } // end anonymous namespace
127 char HexagonSplitDoubleRegs::ID
;
128 int HexagonSplitDoubleRegs::Counter
= 0;
129 const TargetRegisterClass
*const HexagonSplitDoubleRegs::DoubleRC
=
130 &Hexagon::DoubleRegsRegClass
;
132 INITIALIZE_PASS(HexagonSplitDoubleRegs
, "hexagon-split-double",
133 "Hexagon Split Double Registers", false, false)
135 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
136 LLVM_DUMP_METHOD
void HexagonSplitDoubleRegs::dump_partition(raw_ostream
&os
,
137 const USet
&Part
, const TargetRegisterInfo
&TRI
) {
140 dbgs() << ' ' << printReg(I
, &TRI
);
145 bool HexagonSplitDoubleRegs::isInduction(unsigned Reg
, LoopRegMap
&IRM
) const {
147 const USet
&Rs
= I
.second
;
148 if (Rs
.find(Reg
) != Rs
.end())
154 bool HexagonSplitDoubleRegs::isVolatileInstr(const MachineInstr
*MI
) const {
155 for (auto &MO
: MI
->memoperands())
156 if (MO
->isVolatile() || MO
->isAtomic())
161 bool HexagonSplitDoubleRegs::isFixedInstr(const MachineInstr
*MI
) const {
162 if (MI
->mayLoadOrStore())
163 if (MemRefsFixed
|| isVolatileInstr(MI
))
165 if (MI
->isDebugInstr())
168 unsigned Opc
= MI
->getOpcode();
173 case TargetOpcode::PHI
:
174 case TargetOpcode::COPY
:
177 case Hexagon::L2_loadrd_io
:
178 // Not handling stack stores (only reg-based addresses).
179 if (MI
->getOperand(1).isReg())
182 case Hexagon::S2_storerd_io
:
183 // Not handling stack stores (only reg-based addresses).
184 if (MI
->getOperand(0).isReg())
187 case Hexagon::L2_loadrd_pi
:
188 case Hexagon::S2_storerd_pi
:
190 case Hexagon::A2_tfrpi
:
191 case Hexagon::A2_combineii
:
192 case Hexagon::A4_combineir
:
193 case Hexagon::A4_combineii
:
194 case Hexagon::A4_combineri
:
195 case Hexagon::A2_combinew
:
196 case Hexagon::CONST64
:
198 case Hexagon::A2_sxtw
:
200 case Hexagon::A2_andp
:
201 case Hexagon::A2_orp
:
202 case Hexagon::A2_xorp
:
203 case Hexagon::S2_asl_i_p_or
:
204 case Hexagon::S2_asl_i_p
:
205 case Hexagon::S2_asr_i_p
:
206 case Hexagon::S2_lsr_i_p
:
210 for (auto &Op
: MI
->operands()) {
213 Register R
= Op
.getReg();
220 void HexagonSplitDoubleRegs::partitionRegisters(UUSetMap
&P2Rs
) {
221 using UUMap
= std::map
<unsigned, unsigned>;
222 using UVect
= std::vector
<unsigned>;
224 unsigned NumRegs
= MRI
->getNumVirtRegs();
225 BitVector
DoubleRegs(NumRegs
);
226 for (unsigned i
= 0; i
< NumRegs
; ++i
) {
227 unsigned R
= Register::index2VirtReg(i
);
228 if (MRI
->getRegClass(R
) == DoubleRC
)
232 BitVector
FixedRegs(NumRegs
);
233 for (int x
= DoubleRegs
.find_first(); x
>= 0; x
= DoubleRegs
.find_next(x
)) {
234 unsigned R
= Register::index2VirtReg(x
);
235 MachineInstr
*DefI
= MRI
->getVRegDef(R
);
236 // In some cases a register may exist, but never be defined or used.
237 // It should never appear anywhere, but mark it as "fixed", just to be
239 if (!DefI
|| isFixedInstr(DefI
))
244 for (int x
= DoubleRegs
.find_first(); x
>= 0; x
= DoubleRegs
.find_next(x
)) {
247 unsigned R
= Register::index2VirtReg(x
);
248 LLVM_DEBUG(dbgs() << printReg(R
, TRI
) << " ~~");
249 USet
&Asc
= AssocMap
[R
];
250 for (auto U
= MRI
->use_nodbg_begin(R
), Z
= MRI
->use_nodbg_end();
252 MachineOperand
&Op
= *U
;
253 MachineInstr
*UseI
= Op
.getParent();
254 if (isFixedInstr(UseI
))
256 for (unsigned i
= 0, n
= UseI
->getNumOperands(); i
< n
; ++i
) {
257 MachineOperand
&MO
= UseI
->getOperand(i
);
258 // Skip non-registers or registers with subregisters.
259 if (&MO
== &Op
|| !MO
.isReg() || MO
.getSubReg())
261 Register T
= MO
.getReg();
262 if (!T
.isVirtual()) {
266 if (MRI
->getRegClass(T
) != DoubleRC
)
268 unsigned u
= Register::virtReg2Index(T
);
271 LLVM_DEBUG(dbgs() << ' ' << printReg(T
, TRI
));
273 // Make it symmetric.
274 AssocMap
[T
].insert(R
);
277 LLVM_DEBUG(dbgs() << '\n');
283 for (int x
= DoubleRegs
.find_first(); x
>= 0; x
= DoubleRegs
.find_next(x
)) {
284 unsigned R
= Register::index2VirtReg(x
);
285 if (Visited
.count(R
))
287 // Create a new partition for R.
288 unsigned ThisP
= FixedRegs
[x
] ? 0 : NextP
++;
291 for (unsigned i
= 0; i
< WorkQ
.size(); ++i
) {
292 unsigned T
= WorkQ
[i
];
293 if (Visited
.count(T
))
297 // Add all registers associated with T.
298 USet
&Asc
= AssocMap
[T
];
299 append_range(WorkQ
, Asc
);
304 P2Rs
[I
.second
].insert(I
.first
);
307 static inline int32_t profitImm(unsigned Imm
) {
309 if (Imm
== 0 || Imm
== 0xFFFFFFFF)
314 int32_t HexagonSplitDoubleRegs::profit(const MachineInstr
*MI
) const {
316 unsigned Opc
= MI
->getOpcode();
318 case TargetOpcode::PHI
:
319 for (const auto &Op
: MI
->operands())
323 case TargetOpcode::COPY
:
324 if (MI
->getOperand(1).getSubReg() != 0)
328 case Hexagon::L2_loadrd_io
:
329 case Hexagon::S2_storerd_io
:
331 case Hexagon::L2_loadrd_pi
:
332 case Hexagon::S2_storerd_pi
:
335 case Hexagon::A2_tfrpi
:
336 case Hexagon::CONST64
: {
337 uint64_t D
= MI
->getOperand(1).getImm();
338 unsigned Lo
= D
& 0xFFFFFFFFULL
;
339 unsigned Hi
= D
>> 32;
340 return profitImm(Lo
) + profitImm(Hi
);
342 case Hexagon::A2_combineii
:
343 case Hexagon::A4_combineii
: {
344 const MachineOperand
&Op1
= MI
->getOperand(1);
345 const MachineOperand
&Op2
= MI
->getOperand(2);
346 int32_t Prof1
= Op1
.isImm() ? profitImm(Op1
.getImm()) : 0;
347 int32_t Prof2
= Op2
.isImm() ? profitImm(Op2
.getImm()) : 0;
348 return Prof1
+ Prof2
;
350 case Hexagon::A4_combineri
:
352 // Fall through into A4_combineir.
354 case Hexagon::A4_combineir
: {
356 const MachineOperand
&OpX
= MI
->getOperand(ImmX
);
358 int64_t V
= OpX
.getImm();
359 if (V
== 0 || V
== -1)
362 // Fall through into A2_combinew.
365 case Hexagon::A2_combinew
:
368 case Hexagon::A2_sxtw
:
371 case Hexagon::A2_andp
:
372 case Hexagon::A2_orp
:
373 case Hexagon::A2_xorp
: {
374 Register Rs
= MI
->getOperand(1).getReg();
375 Register Rt
= MI
->getOperand(2).getReg();
376 return profit(Rs
) + profit(Rt
);
379 case Hexagon::S2_asl_i_p_or
: {
380 unsigned S
= MI
->getOperand(3).getImm();
381 if (S
== 0 || S
== 32)
385 case Hexagon::S2_asl_i_p
:
386 case Hexagon::S2_asr_i_p
:
387 case Hexagon::S2_lsr_i_p
:
388 unsigned S
= MI
->getOperand(2).getImm();
389 if (S
== 0 || S
== 32)
401 int32_t HexagonSplitDoubleRegs::profit(Register Reg
) const {
402 assert(Reg
.isVirtual());
404 const MachineInstr
*DefI
= MRI
->getVRegDef(Reg
);
405 switch (DefI
->getOpcode()) {
406 case Hexagon::A2_tfrpi
:
407 case Hexagon::CONST64
:
408 case Hexagon::A2_combineii
:
409 case Hexagon::A4_combineii
:
410 case Hexagon::A4_combineri
:
411 case Hexagon::A4_combineir
:
412 case Hexagon::A2_combinew
:
420 bool HexagonSplitDoubleRegs::isProfitable(const USet
&Part
, LoopRegMap
&IRM
)
422 unsigned FixedNum
= 0, LoopPhiNum
= 0;
425 for (unsigned DR
: Part
) {
426 MachineInstr
*DefI
= MRI
->getVRegDef(DR
);
427 int32_t P
= profit(DefI
);
428 if (P
== std::numeric_limits
<int>::min())
431 // Reduce the profitability of splitting induction registers.
432 if (isInduction(DR
, IRM
))
435 for (auto U
= MRI
->use_nodbg_begin(DR
), W
= MRI
->use_nodbg_end();
437 MachineInstr
*UseI
= U
->getParent();
438 if (isFixedInstr(UseI
)) {
440 // Calculate the cost of generating REG_SEQUENCE instructions.
441 for (auto &Op
: UseI
->operands()) {
442 if (Op
.isReg() && Part
.count(Op
.getReg()))
448 // If a register from this partition is used in a fixed instruction,
449 // and there is also a register in this partition that is used in
450 // a loop phi node, then decrease the splitting profit as this can
451 // confuse the modulo scheduler.
453 const MachineBasicBlock
*PB
= UseI
->getParent();
454 const MachineLoop
*L
= MLI
->getLoopFor(PB
);
455 if (L
&& L
->getHeader() == PB
)
458 // Splittable instruction.
459 int32_t P
= profit(UseI
);
460 if (P
== std::numeric_limits
<int>::min())
466 if (FixedNum
> 0 && LoopPhiNum
> 0)
467 TotalP
-= 20*LoopPhiNum
;
469 LLVM_DEBUG(dbgs() << "Partition profit: " << TotalP
<< '\n');
475 void HexagonSplitDoubleRegs::collectIndRegsForLoop(const MachineLoop
*L
,
477 const MachineBasicBlock
*HB
= L
->getHeader();
478 const MachineBasicBlock
*LB
= L
->getLoopLatch();
482 // Examine the latch branch. Expect it to be a conditional branch to
483 // the header (either "br-cond header" or "br-cond exit; br header").
484 MachineBasicBlock
*TB
= nullptr, *FB
= nullptr;
485 MachineBasicBlock
*TmpLB
= const_cast<MachineBasicBlock
*>(LB
);
486 SmallVector
<MachineOperand
,2> Cond
;
487 bool BadLB
= TII
->analyzeBranch(*TmpLB
, TB
, FB
, Cond
, false);
488 // Only analyzable conditional branches. HII::analyzeBranch will put
489 // the branch opcode as the first element of Cond, and the predicate
490 // operand as the second.
491 if (BadLB
|| Cond
.size() != 2)
493 // Only simple jump-conditional (with or without negation).
494 if (!TII
->PredOpcodeHasJMP_c(Cond
[0].getImm()))
496 // Must go to the header.
497 if (TB
!= HB
&& FB
!= HB
)
499 assert(Cond
[1].isReg() && "Unexpected Cond vector from analyzeBranch");
500 // Expect a predicate register.
501 Register PR
= Cond
[1].getReg();
502 assert(MRI
->getRegClass(PR
) == &Hexagon::PredRegsRegClass
);
504 // Get the registers on which the loop controlling compare instruction
506 Register CmpR1
, CmpR2
;
507 const MachineInstr
*CmpI
= MRI
->getVRegDef(PR
);
508 while (CmpI
->getOpcode() == Hexagon::C2_not
)
509 CmpI
= MRI
->getVRegDef(CmpI
->getOperand(1).getReg());
511 int Mask
= 0, Val
= 0;
512 bool OkCI
= TII
->analyzeCompare(*CmpI
, CmpR1
, CmpR2
, Mask
, Val
);
515 // Eliminate non-double input registers.
516 if (CmpR1
&& MRI
->getRegClass(CmpR1
) != DoubleRC
)
518 if (CmpR2
&& MRI
->getRegClass(CmpR2
) != DoubleRC
)
520 if (!CmpR1
&& !CmpR2
)
523 // Now examine the top of the loop: the phi nodes that could poten-
524 // tially define loop induction registers. The registers defined by
525 // such a phi node would be used in a 64-bit add, which then would
526 // be used in the loop compare instruction.
528 // Get the set of all double registers defined by phi nodes in the
530 using UVect
= std::vector
<unsigned>;
533 for (auto &MI
: *HB
) {
536 const MachineOperand
&MD
= MI
.getOperand(0);
537 Register R
= MD
.getReg();
538 if (MRI
->getRegClass(R
) == DoubleRC
)
544 auto NoIndOp
= [this, CmpR1
, CmpR2
] (unsigned R
) -> bool {
545 for (auto I
= MRI
->use_nodbg_begin(R
), E
= MRI
->use_nodbg_end();
547 const MachineInstr
*UseI
= I
->getParent();
548 if (UseI
->getOpcode() != Hexagon::A2_addp
)
550 // Get the output from the add. If it is one of the inputs to the
551 // loop-controlling compare instruction, then R is likely an induc-
553 Register T
= UseI
->getOperand(0).getReg();
554 if (T
== CmpR1
|| T
== CmpR2
)
559 UVect::iterator End
= llvm::remove_if(DP
, NoIndOp
);
560 Rs
.insert(DP
.begin(), End
);
565 dbgs() << "For loop at " << printMBBReference(*HB
) << " ind regs: ";
566 dump_partition(dbgs(), Rs
, *TRI
);
571 void HexagonSplitDoubleRegs::collectIndRegs(LoopRegMap
&IRM
) {
572 using LoopVector
= std::vector
<MachineLoop
*>;
576 append_range(WorkQ
, *MLI
);
577 for (unsigned i
= 0; i
< WorkQ
.size(); ++i
)
578 append_range(WorkQ
, *WorkQ
[i
]);
581 for (unsigned i
= 0, n
= WorkQ
.size(); i
< n
; ++i
) {
582 MachineLoop
*L
= WorkQ
[i
];
584 collectIndRegsForLoop(L
, Rs
);
586 IRM
.insert(std::make_pair(L
, Rs
));
590 void HexagonSplitDoubleRegs::createHalfInstr(unsigned Opc
, MachineInstr
*MI
,
591 const UUPairMap
&PairMap
, unsigned SubR
) {
592 MachineBasicBlock
&B
= *MI
->getParent();
593 DebugLoc DL
= MI
->getDebugLoc();
594 MachineInstr
*NewI
= BuildMI(B
, MI
, DL
, TII
->get(Opc
));
596 for (auto &Op
: MI
->operands()) {
598 NewI
->addOperand(Op
);
601 // For register operands, set the subregister.
602 Register R
= Op
.getReg();
603 unsigned SR
= Op
.getSubReg();
604 bool isVirtReg
= R
.isVirtual();
605 bool isKill
= Op
.isKill();
606 if (isVirtReg
&& MRI
->getRegClass(R
) == DoubleRC
) {
608 UUPairMap::const_iterator F
= PairMap
.find(R
);
609 if (F
== PairMap
.end()) {
612 const UUPair
&P
= F
->second
;
613 R
= (SubR
== Hexagon::isub_lo
) ? P
.first
: P
.second
;
617 auto CO
= MachineOperand::CreateReg(R
, Op
.isDef(), Op
.isImplicit(), isKill
,
618 Op
.isDead(), Op
.isUndef(), Op
.isEarlyClobber(), SR
, Op
.isDebug(),
619 Op
.isInternalRead());
620 NewI
->addOperand(CO
);
624 void HexagonSplitDoubleRegs::splitMemRef(MachineInstr
*MI
,
625 const UUPairMap
&PairMap
) {
626 bool Load
= MI
->mayLoad();
627 unsigned OrigOpc
= MI
->getOpcode();
628 bool PostInc
= (OrigOpc
== Hexagon::L2_loadrd_pi
||
629 OrigOpc
== Hexagon::S2_storerd_pi
);
630 MachineInstr
*LowI
, *HighI
;
631 MachineBasicBlock
&B
= *MI
->getParent();
632 DebugLoc DL
= MI
->getDebugLoc();
634 // Index of the base-address-register operand.
635 unsigned AdrX
= PostInc
? (Load
? 2 : 1)
637 MachineOperand
&AdrOp
= MI
->getOperand(AdrX
);
638 unsigned RSA
= getRegState(AdrOp
);
639 MachineOperand
&ValOp
= Load
? MI
->getOperand(0)
640 : (PostInc
? MI
->getOperand(3)
641 : MI
->getOperand(2));
642 UUPairMap::const_iterator F
= PairMap
.find(ValOp
.getReg());
643 assert(F
!= PairMap
.end());
646 const UUPair
&P
= F
->second
;
647 int64_t Off
= PostInc
? 0 : MI
->getOperand(2).getImm();
648 LowI
= BuildMI(B
, MI
, DL
, TII
->get(Hexagon::L2_loadri_io
), P
.first
)
649 .addReg(AdrOp
.getReg(), RSA
& ~RegState::Kill
, AdrOp
.getSubReg())
651 HighI
= BuildMI(B
, MI
, DL
, TII
->get(Hexagon::L2_loadri_io
), P
.second
)
652 .addReg(AdrOp
.getReg(), RSA
& ~RegState::Kill
, AdrOp
.getSubReg())
655 const UUPair
&P
= F
->second
;
656 int64_t Off
= PostInc
? 0 : MI
->getOperand(1).getImm();
657 LowI
= BuildMI(B
, MI
, DL
, TII
->get(Hexagon::S2_storeri_io
))
658 .addReg(AdrOp
.getReg(), RSA
& ~RegState::Kill
, AdrOp
.getSubReg())
661 HighI
= BuildMI(B
, MI
, DL
, TII
->get(Hexagon::S2_storeri_io
))
662 .addReg(AdrOp
.getReg(), RSA
& ~RegState::Kill
, AdrOp
.getSubReg())
668 // Create the increment of the address register.
669 int64_t Inc
= Load
? MI
->getOperand(3).getImm()
670 : MI
->getOperand(2).getImm();
671 MachineOperand
&UpdOp
= Load
? MI
->getOperand(1) : MI
->getOperand(0);
672 const TargetRegisterClass
*RC
= MRI
->getRegClass(UpdOp
.getReg());
673 Register NewR
= MRI
->createVirtualRegister(RC
);
674 assert(!UpdOp
.getSubReg() && "Def operand with subreg");
675 BuildMI(B
, MI
, DL
, TII
->get(Hexagon::A2_addi
), NewR
)
676 .addReg(AdrOp
.getReg(), RSA
)
678 MRI
->replaceRegWith(UpdOp
.getReg(), NewR
);
679 // The original instruction will be deleted later.
682 // Generate a new pair of memory-operands.
683 MachineFunction
&MF
= *B
.getParent();
684 for (auto &MO
: MI
->memoperands()) {
685 const MachinePointerInfo
&Ptr
= MO
->getPointerInfo();
686 MachineMemOperand::Flags F
= MO
->getFlags();
687 Align A
= MO
->getAlign();
689 auto *Tmp1
= MF
.getMachineMemOperand(Ptr
, F
, 4 /*size*/, A
);
690 LowI
->addMemOperand(MF
, Tmp1
);
692 MF
.getMachineMemOperand(Ptr
, F
, 4 /*size*/, std::min(A
, Align(4)));
693 HighI
->addMemOperand(MF
, Tmp2
);
697 void HexagonSplitDoubleRegs::splitImmediate(MachineInstr
*MI
,
698 const UUPairMap
&PairMap
) {
699 MachineOperand
&Op0
= MI
->getOperand(0);
700 MachineOperand
&Op1
= MI
->getOperand(1);
701 assert(Op0
.isReg() && Op1
.isImm());
702 uint64_t V
= Op1
.getImm();
704 MachineBasicBlock
&B
= *MI
->getParent();
705 DebugLoc DL
= MI
->getDebugLoc();
706 UUPairMap::const_iterator F
= PairMap
.find(Op0
.getReg());
707 assert(F
!= PairMap
.end());
708 const UUPair
&P
= F
->second
;
710 // The operand to A2_tfrsi can only have 32 significant bits. Immediate
711 // values in MachineOperand are stored as 64-bit integers, and so the
712 // value -1 may be represented either as 64-bit -1, or 4294967295. Both
713 // will have the 32 higher bits truncated in the end, but -1 will remain
714 // as -1, while the latter may appear to be a large unsigned value
715 // requiring a constant extender. The casting to int32_t will select the
716 // former representation. (The same reasoning applies to all 32-bit
718 BuildMI(B
, MI
, DL
, TII
->get(Hexagon::A2_tfrsi
), P
.first
)
719 .addImm(int32_t(V
& 0xFFFFFFFFULL
));
720 BuildMI(B
, MI
, DL
, TII
->get(Hexagon::A2_tfrsi
), P
.second
)
721 .addImm(int32_t(V
>> 32));
724 void HexagonSplitDoubleRegs::splitCombine(MachineInstr
*MI
,
725 const UUPairMap
&PairMap
) {
726 MachineOperand
&Op0
= MI
->getOperand(0);
727 MachineOperand
&Op1
= MI
->getOperand(1);
728 MachineOperand
&Op2
= MI
->getOperand(2);
731 MachineBasicBlock
&B
= *MI
->getParent();
732 DebugLoc DL
= MI
->getDebugLoc();
733 UUPairMap::const_iterator F
= PairMap
.find(Op0
.getReg());
734 assert(F
!= PairMap
.end());
735 const UUPair
&P
= F
->second
;
738 BuildMI(B
, MI
, DL
, TII
->get(Hexagon::A2_tfrsi
), P
.second
)
741 BuildMI(B
, MI
, DL
, TII
->get(TargetOpcode::COPY
), P
.second
)
742 .addReg(Op1
.getReg(), getRegState(Op1
), Op1
.getSubReg());
746 BuildMI(B
, MI
, DL
, TII
->get(Hexagon::A2_tfrsi
), P
.first
)
749 BuildMI(B
, MI
, DL
, TII
->get(TargetOpcode::COPY
), P
.first
)
750 .addReg(Op2
.getReg(), getRegState(Op2
), Op2
.getSubReg());
754 void HexagonSplitDoubleRegs::splitExt(MachineInstr
*MI
,
755 const UUPairMap
&PairMap
) {
756 MachineOperand
&Op0
= MI
->getOperand(0);
757 MachineOperand
&Op1
= MI
->getOperand(1);
758 assert(Op0
.isReg() && Op1
.isReg());
760 MachineBasicBlock
&B
= *MI
->getParent();
761 DebugLoc DL
= MI
->getDebugLoc();
762 UUPairMap::const_iterator F
= PairMap
.find(Op0
.getReg());
763 assert(F
!= PairMap
.end());
764 const UUPair
&P
= F
->second
;
765 unsigned RS
= getRegState(Op1
);
767 BuildMI(B
, MI
, DL
, TII
->get(TargetOpcode::COPY
), P
.first
)
768 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, Op1
.getSubReg());
769 BuildMI(B
, MI
, DL
, TII
->get(Hexagon::S2_asr_i_r
), P
.second
)
770 .addReg(Op1
.getReg(), RS
, Op1
.getSubReg())
774 void HexagonSplitDoubleRegs::splitShift(MachineInstr
*MI
,
775 const UUPairMap
&PairMap
) {
776 using namespace Hexagon
;
778 MachineOperand
&Op0
= MI
->getOperand(0);
779 MachineOperand
&Op1
= MI
->getOperand(1);
780 MachineOperand
&Op2
= MI
->getOperand(2);
781 assert(Op0
.isReg() && Op1
.isReg() && Op2
.isImm());
782 int64_t Sh64
= Op2
.getImm();
783 assert(Sh64
>= 0 && Sh64
< 64);
786 UUPairMap::const_iterator F
= PairMap
.find(Op0
.getReg());
787 assert(F
!= PairMap
.end());
788 const UUPair
&P
= F
->second
;
789 Register LoR
= P
.first
;
790 Register HiR
= P
.second
;
792 unsigned Opc
= MI
->getOpcode();
793 bool Right
= (Opc
== S2_lsr_i_p
|| Opc
== S2_asr_i_p
);
795 bool Signed
= (Opc
== S2_asr_i_p
);
797 MachineBasicBlock
&B
= *MI
->getParent();
798 DebugLoc DL
= MI
->getDebugLoc();
799 unsigned RS
= getRegState(Op1
);
800 unsigned ShiftOpc
= Left
? S2_asl_i_r
801 : (Signed
? S2_asr_i_r
: S2_lsr_i_r
);
802 unsigned LoSR
= isub_lo
;
803 unsigned HiSR
= isub_hi
;
806 // No shift, subregister copy.
807 BuildMI(B
, MI
, DL
, TII
->get(TargetOpcode::COPY
), LoR
)
808 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, LoSR
);
809 BuildMI(B
, MI
, DL
, TII
->get(TargetOpcode::COPY
), HiR
)
810 .addReg(Op1
.getReg(), RS
, HiSR
);
812 const TargetRegisterClass
*IntRC
= &IntRegsRegClass
;
813 Register TmpR
= MRI
->createVirtualRegister(IntRC
);
815 // Shift left: DR = shl R, #s
816 // LoR = shl R.lo, #s
817 // TmpR = extractu R.lo, #s, #32-s
818 // HiR = or (TmpR, asl(R.hi, #s))
819 // Shift right: DR = shr R, #s
820 // HiR = shr R.hi, #s
821 // TmpR = shr R.lo, #s
822 // LoR = insert TmpR, R.hi, #s, #32-s
825 // LoR = shl R.lo, #s
827 // TmpR = shr R.lo, #s
829 // Make a special case for A2_aslh and A2_asrh (they are predicable as
830 // opposed to S2_asl_i_r/S2_asr_i_r).
832 BuildMI(B
, MI
, DL
, TII
->get(A2_aslh
), LoR
)
833 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, LoSR
);
834 else if (S
== 16 && Signed
)
835 BuildMI(B
, MI
, DL
, TII
->get(A2_asrh
), TmpR
)
836 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, LoSR
);
838 BuildMI(B
, MI
, DL
, TII
->get(ShiftOpc
), (Left
? LoR
: TmpR
))
839 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, LoSR
)
843 // TmpR = extractu R.lo, #s, #32-s
844 BuildMI(B
, MI
, DL
, TII
->get(S2_extractu
), TmpR
)
845 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, LoSR
)
848 // HiR = or (TmpR, asl(R.hi, #s))
849 BuildMI(B
, MI
, DL
, TII
->get(S2_asl_i_r_or
), HiR
)
851 .addReg(Op1
.getReg(), RS
, HiSR
)
854 // HiR = shr R.hi, #s
855 BuildMI(B
, MI
, DL
, TII
->get(ShiftOpc
), HiR
)
856 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, HiSR
)
858 // LoR = insert TmpR, R.hi, #s, #32-s
859 BuildMI(B
, MI
, DL
, TII
->get(S2_insert
), LoR
)
861 .addReg(Op1
.getReg(), RS
, HiSR
)
865 } else if (S
== 32) {
866 BuildMI(B
, MI
, DL
, TII
->get(TargetOpcode::COPY
), (Left
? HiR
: LoR
))
867 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, (Left
? LoSR
: HiSR
));
869 BuildMI(B
, MI
, DL
, TII
->get(A2_tfrsi
), (Left
? LoR
: HiR
))
871 else // Must be right shift.
872 BuildMI(B
, MI
, DL
, TII
->get(S2_asr_i_r
), HiR
)
873 .addReg(Op1
.getReg(), RS
, HiSR
)
878 BuildMI(B
, MI
, DL
, TII
->get(A2_aslh
), HiR
)
879 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, LoSR
);
880 else if (S
== 16 && Signed
)
881 BuildMI(B
, MI
, DL
, TII
->get(A2_asrh
), LoR
)
882 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, HiSR
);
884 BuildMI(B
, MI
, DL
, TII
->get(ShiftOpc
), (Left
? HiR
: LoR
))
885 .addReg(Op1
.getReg(), RS
& ~RegState::Kill
, (Left
? LoSR
: HiSR
))
889 BuildMI(B
, MI
, DL
, TII
->get(S2_asr_i_r
), HiR
)
890 .addReg(Op1
.getReg(), RS
, HiSR
)
893 BuildMI(B
, MI
, DL
, TII
->get(A2_tfrsi
), (Left
? LoR
: HiR
))
898 void HexagonSplitDoubleRegs::splitAslOr(MachineInstr
*MI
,
899 const UUPairMap
&PairMap
) {
900 using namespace Hexagon
;
902 MachineOperand
&Op0
= MI
->getOperand(0);
903 MachineOperand
&Op1
= MI
->getOperand(1);
904 MachineOperand
&Op2
= MI
->getOperand(2);
905 MachineOperand
&Op3
= MI
->getOperand(3);
906 assert(Op0
.isReg() && Op1
.isReg() && Op2
.isReg() && Op3
.isImm());
907 int64_t Sh64
= Op3
.getImm();
908 assert(Sh64
>= 0 && Sh64
< 64);
911 UUPairMap::const_iterator F
= PairMap
.find(Op0
.getReg());
912 assert(F
!= PairMap
.end());
913 const UUPair
&P
= F
->second
;
914 unsigned LoR
= P
.first
;
915 unsigned HiR
= P
.second
;
917 MachineBasicBlock
&B
= *MI
->getParent();
918 DebugLoc DL
= MI
->getDebugLoc();
919 unsigned RS1
= getRegState(Op1
);
920 unsigned RS2
= getRegState(Op2
);
921 const TargetRegisterClass
*IntRC
= &IntRegsRegClass
;
923 unsigned LoSR
= isub_lo
;
924 unsigned HiSR
= isub_hi
;
926 // Op0 = S2_asl_i_p_or Op1, Op2, Op3
927 // means: Op0 = or (Op1, asl(Op2, Op3))
930 // DR = or (R1, asl(R2, #s))
932 // LoR = or (R1.lo, asl(R2.lo, #s))
933 // Tmp1 = extractu R2.lo, #s, #32-s
934 // Tmp2 = or R1.hi, Tmp1
935 // HiR = or (Tmp2, asl(R2.hi, #s))
938 // DR = or (R1, asl(R2, #0))
940 // i.e. LoR = or R1.lo, R2.lo
941 // HiR = or R1.hi, R2.hi
942 BuildMI(B
, MI
, DL
, TII
->get(A2_or
), LoR
)
943 .addReg(Op1
.getReg(), RS1
& ~RegState::Kill
, LoSR
)
944 .addReg(Op2
.getReg(), RS2
& ~RegState::Kill
, LoSR
);
945 BuildMI(B
, MI
, DL
, TII
->get(A2_or
), HiR
)
946 .addReg(Op1
.getReg(), RS1
, HiSR
)
947 .addReg(Op2
.getReg(), RS2
, HiSR
);
949 BuildMI(B
, MI
, DL
, TII
->get(S2_asl_i_r_or
), LoR
)
950 .addReg(Op1
.getReg(), RS1
& ~RegState::Kill
, LoSR
)
951 .addReg(Op2
.getReg(), RS2
& ~RegState::Kill
, LoSR
)
953 Register TmpR1
= MRI
->createVirtualRegister(IntRC
);
954 BuildMI(B
, MI
, DL
, TII
->get(S2_extractu
), TmpR1
)
955 .addReg(Op2
.getReg(), RS2
& ~RegState::Kill
, LoSR
)
958 Register TmpR2
= MRI
->createVirtualRegister(IntRC
);
959 BuildMI(B
, MI
, DL
, TII
->get(A2_or
), TmpR2
)
960 .addReg(Op1
.getReg(), RS1
, HiSR
)
962 BuildMI(B
, MI
, DL
, TII
->get(S2_asl_i_r_or
), HiR
)
964 .addReg(Op2
.getReg(), RS2
, HiSR
)
966 } else if (S
== 32) {
967 // DR = or (R1, asl(R2, #32))
970 // HiR = or R1.hi, R2.lo
971 BuildMI(B
, MI
, DL
, TII
->get(TargetOpcode::COPY
), LoR
)
972 .addReg(Op1
.getReg(), RS1
& ~RegState::Kill
, LoSR
);
973 BuildMI(B
, MI
, DL
, TII
->get(A2_or
), HiR
)
974 .addReg(Op1
.getReg(), RS1
, HiSR
)
975 .addReg(Op2
.getReg(), RS2
, LoSR
);
977 // DR = or (R1, asl(R2, #s))
980 // HiR = or (R1:hi, asl(R2:lo, #s-32))
982 BuildMI(B
, MI
, DL
, TII
->get(TargetOpcode::COPY
), LoR
)
983 .addReg(Op1
.getReg(), RS1
& ~RegState::Kill
, LoSR
);
984 BuildMI(B
, MI
, DL
, TII
->get(S2_asl_i_r_or
), HiR
)
985 .addReg(Op1
.getReg(), RS1
, HiSR
)
986 .addReg(Op2
.getReg(), RS2
, LoSR
)
991 bool HexagonSplitDoubleRegs::splitInstr(MachineInstr
*MI
,
992 const UUPairMap
&PairMap
) {
993 using namespace Hexagon
;
995 LLVM_DEBUG(dbgs() << "Splitting: " << *MI
);
997 unsigned Opc
= MI
->getOpcode();
1000 case TargetOpcode::PHI
:
1001 case TargetOpcode::COPY
: {
1002 Register DstR
= MI
->getOperand(0).getReg();
1003 if (MRI
->getRegClass(DstR
) == DoubleRC
) {
1004 createHalfInstr(Opc
, MI
, PairMap
, isub_lo
);
1005 createHalfInstr(Opc
, MI
, PairMap
, isub_hi
);
1011 createHalfInstr(A2_and
, MI
, PairMap
, isub_lo
);
1012 createHalfInstr(A2_and
, MI
, PairMap
, isub_hi
);
1016 createHalfInstr(A2_or
, MI
, PairMap
, isub_lo
);
1017 createHalfInstr(A2_or
, MI
, PairMap
, isub_hi
);
1021 createHalfInstr(A2_xor
, MI
, PairMap
, isub_lo
);
1022 createHalfInstr(A2_xor
, MI
, PairMap
, isub_hi
);
1030 splitMemRef(MI
, PairMap
);
1036 splitImmediate(MI
, PairMap
);
1045 splitCombine(MI
, PairMap
);
1050 splitExt(MI
, PairMap
);
1057 splitShift(MI
, PairMap
);
1062 splitAslOr(MI
, PairMap
);
1067 llvm_unreachable("Instruction not splitable");
1074 void HexagonSplitDoubleRegs::replaceSubregUses(MachineInstr
*MI
,
1075 const UUPairMap
&PairMap
) {
1076 for (auto &Op
: MI
->operands()) {
1077 if (!Op
.isReg() || !Op
.isUse() || !Op
.getSubReg())
1079 Register R
= Op
.getReg();
1080 UUPairMap::const_iterator F
= PairMap
.find(R
);
1081 if (F
== PairMap
.end())
1083 const UUPair
&P
= F
->second
;
1084 switch (Op
.getSubReg()) {
1085 case Hexagon::isub_lo
:
1088 case Hexagon::isub_hi
:
1089 Op
.setReg(P
.second
);
1096 void HexagonSplitDoubleRegs::collapseRegPairs(MachineInstr
*MI
,
1097 const UUPairMap
&PairMap
) {
1098 MachineBasicBlock
&B
= *MI
->getParent();
1099 DebugLoc DL
= MI
->getDebugLoc();
1101 for (auto &Op
: MI
->operands()) {
1102 if (!Op
.isReg() || !Op
.isUse())
1104 Register R
= Op
.getReg();
1107 if (MRI
->getRegClass(R
) != DoubleRC
|| Op
.getSubReg())
1109 UUPairMap::const_iterator F
= PairMap
.find(R
);
1110 if (F
== PairMap
.end())
1112 const UUPair
&Pr
= F
->second
;
1113 Register NewDR
= MRI
->createVirtualRegister(DoubleRC
);
1114 BuildMI(B
, MI
, DL
, TII
->get(TargetOpcode::REG_SEQUENCE
), NewDR
)
1116 .addImm(Hexagon::isub_lo
)
1118 .addImm(Hexagon::isub_hi
);
1123 bool HexagonSplitDoubleRegs::splitPartition(const USet
&Part
) {
1124 using MISet
= std::set
<MachineInstr
*>;
1126 const TargetRegisterClass
*IntRC
= &Hexagon::IntRegsRegClass
;
1127 bool Changed
= false;
1129 LLVM_DEBUG(dbgs() << "Splitting partition: ";
1130 dump_partition(dbgs(), Part
, *TRI
); dbgs() << '\n');
1135 for (unsigned DR
: Part
) {
1136 MachineInstr
*DefI
= MRI
->getVRegDef(DR
);
1137 SplitIns
.insert(DefI
);
1139 // Collect all instructions, including fixed ones. We won't split them,
1140 // but we need to visit them again to insert the REG_SEQUENCE instructions.
1141 for (auto U
= MRI
->use_nodbg_begin(DR
), W
= MRI
->use_nodbg_end();
1143 SplitIns
.insert(U
->getParent());
1145 Register LoR
= MRI
->createVirtualRegister(IntRC
);
1146 Register HiR
= MRI
->createVirtualRegister(IntRC
);
1147 LLVM_DEBUG(dbgs() << "Created mapping: " << printReg(DR
, TRI
) << " -> "
1148 << printReg(HiR
, TRI
) << ':' << printReg(LoR
, TRI
)
1150 PairMap
.insert(std::make_pair(DR
, UUPair(LoR
, HiR
)));
1154 for (auto MI
: SplitIns
) {
1155 if (isFixedInstr(MI
)) {
1156 collapseRegPairs(MI
, PairMap
);
1158 bool Done
= splitInstr(MI
, PairMap
);
1165 for (unsigned DR
: Part
) {
1166 // Before erasing "double" instructions, revisit all uses of the double
1167 // registers in this partition, and replace all uses of them with subre-
1168 // gisters, with the corresponding single registers.
1170 for (auto U
= MRI
->use_nodbg_begin(DR
), W
= MRI
->use_nodbg_end();
1172 Uses
.insert(U
->getParent());
1174 replaceSubregUses(M
, PairMap
);
1177 for (auto MI
: Erase
) {
1178 MachineBasicBlock
*B
= MI
->getParent();
1185 bool HexagonSplitDoubleRegs::runOnMachineFunction(MachineFunction
&MF
) {
1186 if (skipFunction(MF
.getFunction()))
1189 LLVM_DEBUG(dbgs() << "Splitting double registers in function: "
1190 << MF
.getName() << '\n');
1192 auto &ST
= MF
.getSubtarget
<HexagonSubtarget
>();
1193 TRI
= ST
.getRegisterInfo();
1194 TII
= ST
.getInstrInfo();
1195 MRI
= &MF
.getRegInfo();
1196 MLI
= &getAnalysis
<MachineLoopInfo
>();
1201 collectIndRegs(IRM
);
1202 partitionRegisters(P2Rs
);
1205 dbgs() << "Register partitioning: (partition #0 is fixed)\n";
1206 for (UUSetMap::iterator I
= P2Rs
.begin(), E
= P2Rs
.end(); I
!= E
; ++I
) {
1207 dbgs() << '#' << I
->first
<< " -> ";
1208 dump_partition(dbgs(), I
->second
, *TRI
);
1213 bool Changed
= false;
1214 int Limit
= MaxHSDR
;
1216 for (UUSetMap::iterator I
= P2Rs
.begin(), E
= P2Rs
.end(); I
!= E
; ++I
) {
1219 if (Limit
>= 0 && Counter
>= Limit
)
1221 USet
&Part
= I
->second
;
1222 LLVM_DEBUG(dbgs() << "Calculating profit for partition #" << I
->first
1224 if (!isProfitable(Part
, IRM
))
1227 Changed
|= splitPartition(Part
);
1233 FunctionPass
*llvm::createHexagonSplitDoubleRegs() {
1234 return new HexagonSplitDoubleRegs();