1 //===------- HexagonCopyToCombine.cpp - Hexagon Copy-To-Combine Pass ------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
8 // This pass replaces transfer instructions by combine instructions.
9 // We walk along a basic block and look for two combinable instructions and try
10 // to move them together. If we can move them next to each other we do so and
11 // replace them with a combine instruction.
12 //===----------------------------------------------------------------------===//
13 #include "HexagonInstrInfo.h"
14 #include "HexagonSubtarget.h"
15 #include "llvm/ADT/DenseMap.h"
16 #include "llvm/ADT/DenseSet.h"
17 #include "llvm/CodeGen/MachineBasicBlock.h"
18 #include "llvm/CodeGen/MachineFunction.h"
19 #include "llvm/CodeGen/MachineFunctionPass.h"
20 #include "llvm/CodeGen/MachineInstr.h"
21 #include "llvm/CodeGen/MachineInstrBuilder.h"
22 #include "llvm/CodeGen/Passes.h"
23 #include "llvm/CodeGen/TargetRegisterInfo.h"
24 #include "llvm/PassSupport.h"
25 #include "llvm/Support/CodeGen.h"
26 #include "llvm/Support/CommandLine.h"
27 #include "llvm/Support/Debug.h"
28 #include "llvm/Support/raw_ostream.h"
32 #define DEBUG_TYPE "hexagon-copy-combine"
35 cl::opt
<bool> IsCombinesDisabled("disable-merge-into-combines",
36 cl::Hidden
, cl::ZeroOrMore
,
38 cl::desc("Disable merging into combines"));
40 cl::opt
<bool> IsConst64Disabled("disable-const64",
41 cl::Hidden
, cl::ZeroOrMore
,
43 cl::desc("Disable generation of const64"));
46 MaxNumOfInstsBetweenNewValueStoreAndTFR("max-num-inst-between-tfr-and-nv-store",
47 cl::Hidden
, cl::init(4),
48 cl::desc("Maximum distance between a tfr feeding a store we "
49 "consider the store still to be newifiable"));
52 FunctionPass
*createHexagonCopyToCombine();
53 void initializeHexagonCopyToCombinePass(PassRegistry
&);
59 class HexagonCopyToCombine
: public MachineFunctionPass
{
60 const HexagonInstrInfo
*TII
;
61 const TargetRegisterInfo
*TRI
;
62 const HexagonSubtarget
*ST
;
63 bool ShouldCombineAggressively
;
65 DenseSet
<MachineInstr
*> PotentiallyNewifiableTFR
;
66 SmallVector
<MachineInstr
*, 8> DbgMItoMove
;
71 HexagonCopyToCombine() : MachineFunctionPass(ID
) {
72 initializeHexagonCopyToCombinePass(*PassRegistry::getPassRegistry());
75 void getAnalysisUsage(AnalysisUsage
&AU
) const override
{
76 MachineFunctionPass::getAnalysisUsage(AU
);
79 StringRef
getPassName() const override
{
80 return "Hexagon Copy-To-Combine Pass";
83 bool runOnMachineFunction(MachineFunction
&Fn
) override
;
85 MachineFunctionProperties
getRequiredProperties() const override
{
86 return MachineFunctionProperties().set(
87 MachineFunctionProperties::Property::NoVRegs
);
91 MachineInstr
*findPairable(MachineInstr
&I1
, bool &DoInsertAtI1
,
94 void findPotentialNewifiableTFRs(MachineBasicBlock
&);
96 void combine(MachineInstr
&I1
, MachineInstr
&I2
,
97 MachineBasicBlock::iterator
&MI
, bool DoInsertAtI1
,
100 bool isSafeToMoveTogether(MachineInstr
&I1
, MachineInstr
&I2
,
101 unsigned I1DestReg
, unsigned I2DestReg
,
104 void emitCombineRR(MachineBasicBlock::iterator
&Before
, unsigned DestReg
,
105 MachineOperand
&HiOperand
, MachineOperand
&LoOperand
);
107 void emitCombineRI(MachineBasicBlock::iterator
&Before
, unsigned DestReg
,
108 MachineOperand
&HiOperand
, MachineOperand
&LoOperand
);
110 void emitCombineIR(MachineBasicBlock::iterator
&Before
, unsigned DestReg
,
111 MachineOperand
&HiOperand
, MachineOperand
&LoOperand
);
113 void emitCombineII(MachineBasicBlock::iterator
&Before
, unsigned DestReg
,
114 MachineOperand
&HiOperand
, MachineOperand
&LoOperand
);
116 void emitConst64(MachineBasicBlock::iterator
&Before
, unsigned DestReg
,
117 MachineOperand
&HiOperand
, MachineOperand
&LoOperand
);
120 } // End anonymous namespace.
122 char HexagonCopyToCombine::ID
= 0;
124 INITIALIZE_PASS(HexagonCopyToCombine
, "hexagon-copy-combine",
125 "Hexagon Copy-To-Combine Pass", false, false)
127 static bool isCombinableInstType(MachineInstr
&MI
, const HexagonInstrInfo
*TII
,
128 bool ShouldCombineAggressively
) {
129 switch (MI
.getOpcode()) {
130 case Hexagon::A2_tfr
: {
131 // A COPY instruction can be combined if its arguments are IntRegs (32bit).
132 const MachineOperand
&Op0
= MI
.getOperand(0);
133 const MachineOperand
&Op1
= MI
.getOperand(1);
134 assert(Op0
.isReg() && Op1
.isReg());
136 unsigned DestReg
= Op0
.getReg();
137 unsigned SrcReg
= Op1
.getReg();
138 return Hexagon::IntRegsRegClass
.contains(DestReg
) &&
139 Hexagon::IntRegsRegClass
.contains(SrcReg
);
142 case Hexagon::A2_tfrsi
: {
143 // A transfer-immediate can be combined if its argument is a signed 8bit
145 const MachineOperand
&Op0
= MI
.getOperand(0);
146 const MachineOperand
&Op1
= MI
.getOperand(1);
149 unsigned DestReg
= Op0
.getReg();
150 // Ensure that TargetFlags are MO_NO_FLAG for a global. This is a
151 // workaround for an ABI bug that prevents GOT relocations on combine
153 if (!Op1
.isImm() && Op1
.getTargetFlags() != HexagonII::MO_NO_FLAG
)
156 // Only combine constant extended A2_tfrsi if we are in aggressive mode.
157 bool NotExt
= Op1
.isImm() && isInt
<8>(Op1
.getImm());
158 return Hexagon::IntRegsRegClass
.contains(DestReg
) &&
159 (ShouldCombineAggressively
|| NotExt
);
162 case Hexagon::V6_vassign
:
172 template <unsigned N
> static bool isGreaterThanNBitTFRI(const MachineInstr
&I
) {
173 if (I
.getOpcode() == Hexagon::TFRI64_V4
||
174 I
.getOpcode() == Hexagon::A2_tfrsi
) {
175 const MachineOperand
&Op
= I
.getOperand(1);
176 return !Op
.isImm() || !isInt
<N
>(Op
.getImm());
181 /// areCombinableOperations - Returns true if the two instruction can be merge
182 /// into a combine (ignoring register constraints).
183 static bool areCombinableOperations(const TargetRegisterInfo
*TRI
,
184 MachineInstr
&HighRegInst
,
185 MachineInstr
&LowRegInst
, bool AllowC64
) {
186 unsigned HiOpc
= HighRegInst
.getOpcode();
187 unsigned LoOpc
= LowRegInst
.getOpcode();
189 auto verifyOpc
= [](unsigned Opc
) -> void {
191 case Hexagon::A2_tfr
:
192 case Hexagon::A2_tfrsi
:
193 case Hexagon::V6_vassign
:
196 llvm_unreachable("Unexpected opcode");
202 if (HiOpc
== Hexagon::V6_vassign
|| LoOpc
== Hexagon::V6_vassign
)
203 return HiOpc
== LoOpc
;
206 // There is no combine of two constant extended values.
207 if (isGreaterThanNBitTFRI
<8>(HighRegInst
) &&
208 isGreaterThanNBitTFRI
<6>(LowRegInst
))
212 // There is a combine of two constant extended values into CONST64,
213 // provided both constants are true immediates.
214 if (isGreaterThanNBitTFRI
<16>(HighRegInst
) &&
215 isGreaterThanNBitTFRI
<16>(LowRegInst
))
216 return (HighRegInst
.getOperand(1).isImm() &&
217 LowRegInst
.getOperand(1).isImm());
219 // There is no combine of two constant extended values, unless handled above
220 // Make both 8-bit size checks to allow both combine (#,##) and combine(##,#)
221 if (isGreaterThanNBitTFRI
<8>(HighRegInst
) &&
222 isGreaterThanNBitTFRI
<8>(LowRegInst
))
228 static bool isEvenReg(unsigned Reg
) {
229 assert(TargetRegisterInfo::isPhysicalRegister(Reg
));
230 if (Hexagon::IntRegsRegClass
.contains(Reg
))
231 return (Reg
- Hexagon::R0
) % 2 == 0;
232 if (Hexagon::HvxVRRegClass
.contains(Reg
))
233 return (Reg
- Hexagon::V0
) % 2 == 0;
234 llvm_unreachable("Invalid register");
237 static void removeKillInfo(MachineInstr
&MI
, unsigned RegNotKilled
) {
238 for (unsigned I
= 0, E
= MI
.getNumOperands(); I
!= E
; ++I
) {
239 MachineOperand
&Op
= MI
.getOperand(I
);
240 if (!Op
.isReg() || Op
.getReg() != RegNotKilled
|| !Op
.isKill())
246 /// Returns true if it is unsafe to move a copy instruction from \p UseReg to
247 /// \p DestReg over the instruction \p MI.
248 static bool isUnsafeToMoveAcross(MachineInstr
&MI
, unsigned UseReg
,
250 const TargetRegisterInfo
*TRI
) {
251 return (UseReg
&& (MI
.modifiesRegister(UseReg
, TRI
))) ||
252 MI
.modifiesRegister(DestReg
, TRI
) || MI
.readsRegister(DestReg
, TRI
) ||
253 MI
.hasUnmodeledSideEffects() || MI
.isInlineAsm() ||
254 MI
.isMetaInstruction();
257 static unsigned UseReg(const MachineOperand
& MO
) {
258 return MO
.isReg() ? MO
.getReg() : 0;
261 /// isSafeToMoveTogether - Returns true if it is safe to move I1 next to I2 such
262 /// that the two instructions can be paired in a combine.
263 bool HexagonCopyToCombine::isSafeToMoveTogether(MachineInstr
&I1
,
267 bool &DoInsertAtI1
) {
268 unsigned I2UseReg
= UseReg(I2
.getOperand(1));
270 // It is not safe to move I1 and I2 into one combine if I2 has a true
272 if (I2UseReg
&& I1
.modifiesRegister(I2UseReg
, TRI
))
277 // First try to move I2 towards I1.
279 // A reverse_iterator instantiated like below starts before I2, and I1
281 // Look at instructions I in between I2 and (excluding) I1.
282 MachineBasicBlock::reverse_iterator
I(I2
),
283 End
= --(MachineBasicBlock::reverse_iterator(I1
));
284 // At 03 we got better results (dhrystone!) by being more conservative.
285 if (!ShouldCombineAggressively
)
286 End
= MachineBasicBlock::reverse_iterator(I1
);
287 // If I2 kills its operand and we move I2 over an instruction that also
288 // uses I2's use reg we need to modify that (first) instruction to now kill
290 unsigned KilledOperand
= 0;
291 if (I2
.killsRegister(I2UseReg
))
292 KilledOperand
= I2UseReg
;
293 MachineInstr
*KillingInstr
= nullptr;
295 for (; I
!= End
; ++I
) {
296 // If the intervening instruction I:
297 // * modifies I2's use reg
298 // * modifies I2's def reg
299 // * reads I2's def reg
300 // * or has unmodelled side effects
301 // we can't move I2 across it.
302 if (I
->isDebugInstr())
305 if (isUnsafeToMoveAcross(*I
, I2UseReg
, I2DestReg
, TRI
)) {
310 // Update first use of the killed operand.
311 if (!KillingInstr
&& KilledOperand
&&
312 I
->readsRegister(KilledOperand
, TRI
))
316 // Update the intermediate instruction to with the kill flag.
318 bool Added
= KillingInstr
->addRegisterKilled(KilledOperand
, TRI
, true);
319 (void)Added
; // suppress compiler warning
320 assert(Added
&& "Must successfully update kill flag");
321 removeKillInfo(I2
, KilledOperand
);
328 // Try to move I1 towards I2.
330 // Look at instructions I in between I1 and (excluding) I2.
331 MachineBasicBlock::iterator
I(I1
), End(I2
);
332 // At O3 we got better results (dhrystone) by being more conservative here.
333 if (!ShouldCombineAggressively
)
334 End
= std::next(MachineBasicBlock::iterator(I2
));
335 unsigned I1UseReg
= UseReg(I1
.getOperand(1));
336 // Track killed operands. If we move across an instruction that kills our
337 // operand, we need to update the kill information on the moved I1. It kills
339 MachineInstr
*KillingInstr
= nullptr;
340 unsigned KilledOperand
= 0;
343 MachineInstr
&MI
= *I
;
344 // If the intervening instruction MI:
345 // * modifies I1's use reg
346 // * modifies I1's def reg
347 // * reads I1's def reg
348 // * or has unmodelled side effects
349 // We introduce this special case because llvm has no api to remove a
350 // kill flag for a register (a removeRegisterKilled() analogous to
351 // addRegisterKilled) that handles aliased register correctly.
352 // * or has a killed aliased register use of I1's use reg
355 // %r8 = KILL %r8, implicit killed %d4
356 // If we want to move R6 = across the KILL instruction we would have
357 // to remove the implicit killed %d4 operand. For now, we are
358 // conservative and disallow the move.
359 // we can't move I1 across it.
360 if (MI
.isDebugInstr()) {
361 if (MI
.readsRegister(I1DestReg
, TRI
)) // Move this instruction after I2.
362 DbgMItoMove
.push_back(&MI
);
366 if (isUnsafeToMoveAcross(MI
, I1UseReg
, I1DestReg
, TRI
) ||
367 // Check for an aliased register kill. Bail out if we see one.
368 (!MI
.killsRegister(I1UseReg
) && MI
.killsRegister(I1UseReg
, TRI
)))
371 // Check for an exact kill (registers match).
372 if (I1UseReg
&& MI
.killsRegister(I1UseReg
)) {
373 assert(!KillingInstr
&& "Should only see one killing instruction");
374 KilledOperand
= I1UseReg
;
379 removeKillInfo(*KillingInstr
, KilledOperand
);
380 // Update I1 to set the kill flag. This flag will later be picked up by
381 // the new COMBINE instruction.
382 bool Added
= I1
.addRegisterKilled(KilledOperand
, TRI
);
383 (void)Added
; // suppress compiler warning
384 assert(Added
&& "Must successfully update kill flag");
386 DoInsertAtI1
= false;
392 /// findPotentialNewifiableTFRs - Finds tranfers that feed stores that could be
393 /// newified. (A use of a 64 bit register define can not be newified)
395 HexagonCopyToCombine::findPotentialNewifiableTFRs(MachineBasicBlock
&BB
) {
396 DenseMap
<unsigned, MachineInstr
*> LastDef
;
397 for (MachineInstr
&MI
: BB
) {
398 if (MI
.isDebugInstr())
401 // Mark TFRs that feed a potential new value store as such.
402 if (TII
->mayBeNewStore(MI
)) {
403 // Look for uses of TFR instructions.
404 for (unsigned OpdIdx
= 0, OpdE
= MI
.getNumOperands(); OpdIdx
!= OpdE
;
406 MachineOperand
&Op
= MI
.getOperand(OpdIdx
);
408 // Skip over anything except register uses.
409 if (!Op
.isReg() || !Op
.isUse() || !Op
.getReg())
412 // Look for the defining instruction.
413 unsigned Reg
= Op
.getReg();
414 MachineInstr
*DefInst
= LastDef
[Reg
];
417 if (!isCombinableInstType(*DefInst
, TII
, ShouldCombineAggressively
))
420 // Only close newifiable stores should influence the decision.
421 // Ignore the debug instructions in between.
422 MachineBasicBlock::iterator
It(DefInst
);
423 unsigned NumInstsToDef
= 0;
424 while (&*It
!= &MI
) {
425 if (!It
->isDebugInstr())
430 if (NumInstsToDef
> MaxNumOfInstsBetweenNewValueStoreAndTFR
)
433 PotentiallyNewifiableTFR
.insert(DefInst
);
435 // Skip to next instruction.
439 // Put instructions that last defined integer or double registers into the
441 for (MachineOperand
&Op
: MI
.operands()) {
443 if (!Op
.isDef() || !Op
.getReg())
445 unsigned Reg
= Op
.getReg();
446 if (Hexagon::DoubleRegsRegClass
.contains(Reg
)) {
447 for (MCSubRegIterator
SubRegs(Reg
, TRI
); SubRegs
.isValid(); ++SubRegs
)
448 LastDef
[*SubRegs
] = &MI
;
449 } else if (Hexagon::IntRegsRegClass
.contains(Reg
))
451 } else if (Op
.isRegMask()) {
452 for (unsigned Reg
: Hexagon::IntRegsRegClass
)
453 if (Op
.clobbersPhysReg(Reg
))
460 bool HexagonCopyToCombine::runOnMachineFunction(MachineFunction
&MF
) {
461 if (skipFunction(MF
.getFunction()))
464 if (IsCombinesDisabled
) return false;
466 bool HasChanged
= false;
469 ST
= &MF
.getSubtarget
<HexagonSubtarget
>();
470 TRI
= ST
->getRegisterInfo();
471 TII
= ST
->getInstrInfo();
473 const Function
&F
= MF
.getFunction();
474 bool OptForSize
= F
.hasFnAttribute(Attribute::OptimizeForSize
);
476 // Combine aggressively (for code size)
477 ShouldCombineAggressively
=
478 MF
.getTarget().getOptLevel() <= CodeGenOpt::Default
;
480 // Traverse basic blocks.
481 for (MachineFunction::iterator BI
= MF
.begin(), BE
= MF
.end(); BI
!= BE
;
483 PotentiallyNewifiableTFR
.clear();
484 findPotentialNewifiableTFRs(*BI
);
486 // Traverse instructions in basic block.
487 for(MachineBasicBlock::iterator MI
= BI
->begin(), End
= BI
->end();
489 MachineInstr
&I1
= *MI
++;
491 if (I1
.isDebugInstr())
494 // Don't combine a TFR whose user could be newified (instructions that
495 // define double registers can not be newified - Programmer's Ref Manual
496 // 5.4.2 New-value stores).
497 if (ShouldCombineAggressively
&& PotentiallyNewifiableTFR
.count(&I1
))
500 // Ignore instructions that are not combinable.
501 if (!isCombinableInstType(I1
, TII
, ShouldCombineAggressively
))
504 // Find a second instruction that can be merged into a combine
505 // instruction. In addition, also find all the debug instructions that
506 // need to be moved along with it.
507 bool DoInsertAtI1
= false;
509 MachineInstr
*I2
= findPairable(I1
, DoInsertAtI1
, OptForSize
);
512 combine(I1
, *I2
, MI
, DoInsertAtI1
, OptForSize
);
520 /// findPairable - Returns an instruction that can be merged with \p I1 into a
521 /// COMBINE instruction or 0 if no such instruction can be found. Returns true
522 /// in \p DoInsertAtI1 if the combine must be inserted at instruction \p I1
523 /// false if the combine must be inserted at the returned instruction.
524 MachineInstr
*HexagonCopyToCombine::findPairable(MachineInstr
&I1
,
527 MachineBasicBlock::iterator I2
= std::next(MachineBasicBlock::iterator(I1
));
528 while (I2
!= I1
.getParent()->end() && I2
->isDebugInstr())
531 unsigned I1DestReg
= I1
.getOperand(0).getReg();
533 for (MachineBasicBlock::iterator End
= I1
.getParent()->end(); I2
!= End
;
535 // Bail out early if we see a second definition of I1DestReg.
536 if (I2
->modifiesRegister(I1DestReg
, TRI
))
539 // Ignore non-combinable instructions.
540 if (!isCombinableInstType(*I2
, TII
, ShouldCombineAggressively
))
543 // Don't combine a TFR whose user could be newified.
544 if (ShouldCombineAggressively
&& PotentiallyNewifiableTFR
.count(&*I2
))
547 unsigned I2DestReg
= I2
->getOperand(0).getReg();
549 // Check that registers are adjacent and that the first destination register
551 bool IsI1LowReg
= (I2DestReg
- I1DestReg
) == 1;
552 bool IsI2LowReg
= (I1DestReg
- I2DestReg
) == 1;
553 unsigned FirstRegIndex
= IsI1LowReg
? I1DestReg
: I2DestReg
;
554 if ((!IsI1LowReg
&& !IsI2LowReg
) || !isEvenReg(FirstRegIndex
))
557 // Check that the two instructions are combinable.
558 // The order matters because in a A2_tfrsi we might can encode a int8 as
559 // the hi reg operand but only a uint6 as the low reg operand.
560 if ((IsI2LowReg
&& !areCombinableOperations(TRI
, I1
, *I2
, AllowC64
)) ||
561 (IsI1LowReg
&& !areCombinableOperations(TRI
, *I2
, I1
, AllowC64
)))
564 if (isSafeToMoveTogether(I1
, *I2
, I1DestReg
, I2DestReg
, DoInsertAtI1
))
567 // Not safe. Stop searching.
573 void HexagonCopyToCombine::combine(MachineInstr
&I1
, MachineInstr
&I2
,
574 MachineBasicBlock::iterator
&MI
,
575 bool DoInsertAtI1
, bool OptForSize
) {
576 // We are going to delete I2. If MI points to I2 advance it to the next
578 if (MI
== I2
.getIterator())
581 // Figure out whether I1 or I2 goes into the lowreg part.
582 unsigned I1DestReg
= I1
.getOperand(0).getReg();
583 unsigned I2DestReg
= I2
.getOperand(0).getReg();
584 bool IsI1Loreg
= (I2DestReg
- I1DestReg
) == 1;
585 unsigned LoRegDef
= IsI1Loreg
? I1DestReg
: I2DestReg
;
588 const TargetRegisterClass
*SuperRC
= nullptr;
589 if (Hexagon::IntRegsRegClass
.contains(LoRegDef
)) {
590 SuperRC
= &Hexagon::DoubleRegsRegClass
;
591 SubLo
= Hexagon::isub_lo
;
592 } else if (Hexagon::HvxVRRegClass
.contains(LoRegDef
)) {
593 assert(ST
->useHVXOps());
594 SuperRC
= &Hexagon::HvxWRRegClass
;
595 SubLo
= Hexagon::vsub_lo
;
597 llvm_unreachable("Unexpected register class");
599 // Get the double word register.
600 unsigned DoubleRegDest
= TRI
->getMatchingSuperReg(LoRegDef
, SubLo
, SuperRC
);
601 assert(DoubleRegDest
!= 0 && "Expect a valid register");
603 // Setup source operands.
604 MachineOperand
&LoOperand
= IsI1Loreg
? I1
.getOperand(1) : I2
.getOperand(1);
605 MachineOperand
&HiOperand
= IsI1Loreg
? I2
.getOperand(1) : I1
.getOperand(1);
607 // Figure out which source is a register and which a constant.
608 bool IsHiReg
= HiOperand
.isReg();
609 bool IsLoReg
= LoOperand
.isReg();
611 // There is a combine of two constant extended values into CONST64.
612 bool IsC64
= OptForSize
&& LoOperand
.isImm() && HiOperand
.isImm() &&
613 isGreaterThanNBitTFRI
<16>(I1
) && isGreaterThanNBitTFRI
<16>(I2
);
615 MachineBasicBlock::iterator
InsertPt(DoInsertAtI1
? I1
: I2
);
617 if (IsHiReg
&& IsLoReg
)
618 emitCombineRR(InsertPt
, DoubleRegDest
, HiOperand
, LoOperand
);
620 emitCombineRI(InsertPt
, DoubleRegDest
, HiOperand
, LoOperand
);
622 emitCombineIR(InsertPt
, DoubleRegDest
, HiOperand
, LoOperand
);
623 else if (IsC64
&& !IsConst64Disabled
)
624 emitConst64(InsertPt
, DoubleRegDest
, HiOperand
, LoOperand
);
626 emitCombineII(InsertPt
, DoubleRegDest
, HiOperand
, LoOperand
);
628 // Move debug instructions along with I1 if it's being
630 if (!DoInsertAtI1
&& DbgMItoMove
.size() != 0) {
631 // Insert debug instructions at the new location before I2.
632 MachineBasicBlock
*BB
= InsertPt
->getParent();
633 for (auto NewMI
: DbgMItoMove
) {
634 // If iterator MI is pointing to DEBUG_VAL, make sure
635 // MI now points to next relevant instruction.
638 BB
->splice(InsertPt
, BB
, NewMI
);
642 I1
.eraseFromParent();
643 I2
.eraseFromParent();
646 void HexagonCopyToCombine::emitConst64(MachineBasicBlock::iterator
&InsertPt
,
647 unsigned DoubleDestReg
,
648 MachineOperand
&HiOperand
,
649 MachineOperand
&LoOperand
) {
650 LLVM_DEBUG(dbgs() << "Found a CONST64\n");
652 DebugLoc DL
= InsertPt
->getDebugLoc();
653 MachineBasicBlock
*BB
= InsertPt
->getParent();
654 assert(LoOperand
.isImm() && HiOperand
.isImm() &&
655 "Both operands must be immediate");
657 int64_t V
= HiOperand
.getImm();
658 V
= (V
<< 32) | (0x0ffffffffLL
& LoOperand
.getImm());
659 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::CONST64
), DoubleDestReg
)
663 void HexagonCopyToCombine::emitCombineII(MachineBasicBlock::iterator
&InsertPt
,
664 unsigned DoubleDestReg
,
665 MachineOperand
&HiOperand
,
666 MachineOperand
&LoOperand
) {
667 DebugLoc DL
= InsertPt
->getDebugLoc();
668 MachineBasicBlock
*BB
= InsertPt
->getParent();
671 if (HiOperand
.isGlobal()) {
672 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A2_combineii
), DoubleDestReg
)
673 .addGlobalAddress(HiOperand
.getGlobal(), HiOperand
.getOffset(),
674 HiOperand
.getTargetFlags())
675 .addImm(LoOperand
.getImm());
678 if (LoOperand
.isGlobal()) {
679 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineii
), DoubleDestReg
)
680 .addImm(HiOperand
.getImm())
681 .addGlobalAddress(LoOperand
.getGlobal(), LoOperand
.getOffset(),
682 LoOperand
.getTargetFlags());
686 // Handle block addresses.
687 if (HiOperand
.isBlockAddress()) {
688 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A2_combineii
), DoubleDestReg
)
689 .addBlockAddress(HiOperand
.getBlockAddress(), HiOperand
.getOffset(),
690 HiOperand
.getTargetFlags())
691 .addImm(LoOperand
.getImm());
694 if (LoOperand
.isBlockAddress()) {
695 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineii
), DoubleDestReg
)
696 .addImm(HiOperand
.getImm())
697 .addBlockAddress(LoOperand
.getBlockAddress(), LoOperand
.getOffset(),
698 LoOperand
.getTargetFlags());
702 // Handle jump tables.
703 if (HiOperand
.isJTI()) {
704 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A2_combineii
), DoubleDestReg
)
705 .addJumpTableIndex(HiOperand
.getIndex(), HiOperand
.getTargetFlags())
706 .addImm(LoOperand
.getImm());
709 if (LoOperand
.isJTI()) {
710 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineii
), DoubleDestReg
)
711 .addImm(HiOperand
.getImm())
712 .addJumpTableIndex(LoOperand
.getIndex(), LoOperand
.getTargetFlags());
716 // Handle constant pools.
717 if (HiOperand
.isCPI()) {
718 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A2_combineii
), DoubleDestReg
)
719 .addConstantPoolIndex(HiOperand
.getIndex(), HiOperand
.getOffset(),
720 HiOperand
.getTargetFlags())
721 .addImm(LoOperand
.getImm());
724 if (LoOperand
.isCPI()) {
725 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineii
), DoubleDestReg
)
726 .addImm(HiOperand
.getImm())
727 .addConstantPoolIndex(LoOperand
.getIndex(), LoOperand
.getOffset(),
728 LoOperand
.getTargetFlags());
732 // First preference should be given to Hexagon::A2_combineii instruction
733 // as it can include U6 (in Hexagon::A4_combineii) as well.
734 // In this instruction, HiOperand is const extended, if required.
735 if (isInt
<8>(LoOperand
.getImm())) {
736 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A2_combineii
), DoubleDestReg
)
737 .addImm(HiOperand
.getImm())
738 .addImm(LoOperand
.getImm());
742 // In this instruction, LoOperand is const extended, if required.
743 if (isInt
<8>(HiOperand
.getImm())) {
744 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineii
), DoubleDestReg
)
745 .addImm(HiOperand
.getImm())
746 .addImm(LoOperand
.getImm());
750 // Insert new combine instruction.
751 // DoubleRegDest = combine #HiImm, #LoImm
752 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A2_combineii
), DoubleDestReg
)
753 .addImm(HiOperand
.getImm())
754 .addImm(LoOperand
.getImm());
757 void HexagonCopyToCombine::emitCombineIR(MachineBasicBlock::iterator
&InsertPt
,
758 unsigned DoubleDestReg
,
759 MachineOperand
&HiOperand
,
760 MachineOperand
&LoOperand
) {
761 unsigned LoReg
= LoOperand
.getReg();
762 unsigned LoRegKillFlag
= getKillRegState(LoOperand
.isKill());
764 DebugLoc DL
= InsertPt
->getDebugLoc();
765 MachineBasicBlock
*BB
= InsertPt
->getParent();
768 if (HiOperand
.isGlobal()) {
769 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineir
), DoubleDestReg
)
770 .addGlobalAddress(HiOperand
.getGlobal(), HiOperand
.getOffset(),
771 HiOperand
.getTargetFlags())
772 .addReg(LoReg
, LoRegKillFlag
);
775 // Handle block addresses.
776 if (HiOperand
.isBlockAddress()) {
777 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineir
), DoubleDestReg
)
778 .addBlockAddress(HiOperand
.getBlockAddress(), HiOperand
.getOffset(),
779 HiOperand
.getTargetFlags())
780 .addReg(LoReg
, LoRegKillFlag
);
783 // Handle jump tables.
784 if (HiOperand
.isJTI()) {
785 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineir
), DoubleDestReg
)
786 .addJumpTableIndex(HiOperand
.getIndex(), HiOperand
.getTargetFlags())
787 .addReg(LoReg
, LoRegKillFlag
);
790 // Handle constant pools.
791 if (HiOperand
.isCPI()) {
792 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineir
), DoubleDestReg
)
793 .addConstantPoolIndex(HiOperand
.getIndex(), HiOperand
.getOffset(),
794 HiOperand
.getTargetFlags())
795 .addReg(LoReg
, LoRegKillFlag
);
798 // Insert new combine instruction.
799 // DoubleRegDest = combine #HiImm, LoReg
800 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineir
), DoubleDestReg
)
801 .addImm(HiOperand
.getImm())
802 .addReg(LoReg
, LoRegKillFlag
);
805 void HexagonCopyToCombine::emitCombineRI(MachineBasicBlock::iterator
&InsertPt
,
806 unsigned DoubleDestReg
,
807 MachineOperand
&HiOperand
,
808 MachineOperand
&LoOperand
) {
809 unsigned HiRegKillFlag
= getKillRegState(HiOperand
.isKill());
810 unsigned HiReg
= HiOperand
.getReg();
812 DebugLoc DL
= InsertPt
->getDebugLoc();
813 MachineBasicBlock
*BB
= InsertPt
->getParent();
816 if (LoOperand
.isGlobal()) {
817 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineri
), DoubleDestReg
)
818 .addReg(HiReg
, HiRegKillFlag
)
819 .addGlobalAddress(LoOperand
.getGlobal(), LoOperand
.getOffset(),
820 LoOperand
.getTargetFlags());
823 // Handle block addresses.
824 if (LoOperand
.isBlockAddress()) {
825 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineri
), DoubleDestReg
)
826 .addReg(HiReg
, HiRegKillFlag
)
827 .addBlockAddress(LoOperand
.getBlockAddress(), LoOperand
.getOffset(),
828 LoOperand
.getTargetFlags());
831 // Handle jump tables.
832 if (LoOperand
.isJTI()) {
833 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineri
), DoubleDestReg
)
834 .addReg(HiOperand
.getReg(), HiRegKillFlag
)
835 .addJumpTableIndex(LoOperand
.getIndex(), LoOperand
.getTargetFlags());
838 // Handle constant pools.
839 if (LoOperand
.isCPI()) {
840 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineri
), DoubleDestReg
)
841 .addReg(HiOperand
.getReg(), HiRegKillFlag
)
842 .addConstantPoolIndex(LoOperand
.getIndex(), LoOperand
.getOffset(),
843 LoOperand
.getTargetFlags());
847 // Insert new combine instruction.
848 // DoubleRegDest = combine HiReg, #LoImm
849 BuildMI(*BB
, InsertPt
, DL
, TII
->get(Hexagon::A4_combineri
), DoubleDestReg
)
850 .addReg(HiReg
, HiRegKillFlag
)
851 .addImm(LoOperand
.getImm());
854 void HexagonCopyToCombine::emitCombineRR(MachineBasicBlock::iterator
&InsertPt
,
855 unsigned DoubleDestReg
,
856 MachineOperand
&HiOperand
,
857 MachineOperand
&LoOperand
) {
858 unsigned LoRegKillFlag
= getKillRegState(LoOperand
.isKill());
859 unsigned HiRegKillFlag
= getKillRegState(HiOperand
.isKill());
860 unsigned LoReg
= LoOperand
.getReg();
861 unsigned HiReg
= HiOperand
.getReg();
863 DebugLoc DL
= InsertPt
->getDebugLoc();
864 MachineBasicBlock
*BB
= InsertPt
->getParent();
866 // Insert new combine instruction.
867 // DoubleRegDest = combine HiReg, LoReg
869 if (Hexagon::DoubleRegsRegClass
.contains(DoubleDestReg
)) {
870 NewOpc
= Hexagon::A2_combinew
;
871 } else if (Hexagon::HvxWRRegClass
.contains(DoubleDestReg
)) {
872 assert(ST
->useHVXOps());
873 NewOpc
= Hexagon::V6_vcombine
;
875 llvm_unreachable("Unexpected register");
877 BuildMI(*BB
, InsertPt
, DL
, TII
->get(NewOpc
), DoubleDestReg
)
878 .addReg(HiReg
, HiRegKillFlag
)
879 .addReg(LoReg
, LoRegKillFlag
);
882 FunctionPass
*llvm::createHexagonCopyToCombine() {
883 return new HexagonCopyToCombine();