[ORC] Add std::tuple support to SimplePackedSerialization.
[llvm-project.git] / llvm / lib / Target / Hexagon / HexagonCopyToCombine.cpp
blob23d0cc829e52aefbb05bd4243ba709eed27194b4
1 //===------- HexagonCopyToCombine.cpp - Hexagon Copy-To-Combine Pass ------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 // This pass replaces transfer instructions by combine instructions.
9 // We walk along a basic block and look for two combinable instructions and try
10 // to move them together. If we can move them next to each other we do so and
11 // replace them with a combine instruction.
12 //===----------------------------------------------------------------------===//
14 #include "HexagonInstrInfo.h"
15 #include "HexagonSubtarget.h"
16 #include "llvm/ADT/DenseMap.h"
17 #include "llvm/ADT/DenseSet.h"
18 #include "llvm/CodeGen/MachineBasicBlock.h"
19 #include "llvm/CodeGen/MachineFunction.h"
20 #include "llvm/CodeGen/MachineFunctionPass.h"
21 #include "llvm/CodeGen/MachineInstr.h"
22 #include "llvm/CodeGen/MachineInstrBuilder.h"
23 #include "llvm/CodeGen/Passes.h"
24 #include "llvm/CodeGen/TargetRegisterInfo.h"
25 #include "llvm/Pass.h"
26 #include "llvm/Support/CodeGen.h"
27 #include "llvm/Support/CommandLine.h"
28 #include "llvm/Support/Debug.h"
29 #include "llvm/Support/raw_ostream.h"
30 #include "llvm/Target/TargetMachine.h"
32 using namespace llvm;
34 #define DEBUG_TYPE "hexagon-copy-combine"
36 static
37 cl::opt<bool> IsCombinesDisabled("disable-merge-into-combines",
38 cl::Hidden, cl::ZeroOrMore,
39 cl::init(false),
40 cl::desc("Disable merging into combines"));
41 static
42 cl::opt<bool> IsConst64Disabled("disable-const64",
43 cl::Hidden, cl::ZeroOrMore,
44 cl::init(false),
45 cl::desc("Disable generation of const64"));
46 static
47 cl::opt<unsigned>
48 MaxNumOfInstsBetweenNewValueStoreAndTFR("max-num-inst-between-tfr-and-nv-store",
49 cl::Hidden, cl::init(4),
50 cl::desc("Maximum distance between a tfr feeding a store we "
51 "consider the store still to be newifiable"));
53 namespace llvm {
54 FunctionPass *createHexagonCopyToCombine();
55 void initializeHexagonCopyToCombinePass(PassRegistry&);
59 namespace {
61 class HexagonCopyToCombine : public MachineFunctionPass {
62 const HexagonInstrInfo *TII;
63 const TargetRegisterInfo *TRI;
64 const HexagonSubtarget *ST;
65 bool ShouldCombineAggressively;
67 DenseSet<MachineInstr *> PotentiallyNewifiableTFR;
68 SmallVector<MachineInstr *, 8> DbgMItoMove;
70 public:
71 static char ID;
73 HexagonCopyToCombine() : MachineFunctionPass(ID) {
74 initializeHexagonCopyToCombinePass(*PassRegistry::getPassRegistry());
77 void getAnalysisUsage(AnalysisUsage &AU) const override {
78 MachineFunctionPass::getAnalysisUsage(AU);
81 StringRef getPassName() const override {
82 return "Hexagon Copy-To-Combine Pass";
85 bool runOnMachineFunction(MachineFunction &Fn) override;
87 MachineFunctionProperties getRequiredProperties() const override {
88 return MachineFunctionProperties().set(
89 MachineFunctionProperties::Property::NoVRegs);
92 private:
93 MachineInstr *findPairable(MachineInstr &I1, bool &DoInsertAtI1,
94 bool AllowC64);
96 void findPotentialNewifiableTFRs(MachineBasicBlock &);
98 void combine(MachineInstr &I1, MachineInstr &I2,
99 MachineBasicBlock::iterator &MI, bool DoInsertAtI1,
100 bool OptForSize);
102 bool isSafeToMoveTogether(MachineInstr &I1, MachineInstr &I2,
103 unsigned I1DestReg, unsigned I2DestReg,
104 bool &DoInsertAtI1);
106 void emitCombineRR(MachineBasicBlock::iterator &Before, unsigned DestReg,
107 MachineOperand &HiOperand, MachineOperand &LoOperand);
109 void emitCombineRI(MachineBasicBlock::iterator &Before, unsigned DestReg,
110 MachineOperand &HiOperand, MachineOperand &LoOperand);
112 void emitCombineIR(MachineBasicBlock::iterator &Before, unsigned DestReg,
113 MachineOperand &HiOperand, MachineOperand &LoOperand);
115 void emitCombineII(MachineBasicBlock::iterator &Before, unsigned DestReg,
116 MachineOperand &HiOperand, MachineOperand &LoOperand);
118 void emitConst64(MachineBasicBlock::iterator &Before, unsigned DestReg,
119 MachineOperand &HiOperand, MachineOperand &LoOperand);
122 } // End anonymous namespace.
124 char HexagonCopyToCombine::ID = 0;
126 INITIALIZE_PASS(HexagonCopyToCombine, "hexagon-copy-combine",
127 "Hexagon Copy-To-Combine Pass", false, false)
129 static bool isCombinableInstType(MachineInstr &MI, const HexagonInstrInfo *TII,
130 bool ShouldCombineAggressively) {
131 switch (MI.getOpcode()) {
132 case Hexagon::A2_tfr: {
133 // A COPY instruction can be combined if its arguments are IntRegs (32bit).
134 const MachineOperand &Op0 = MI.getOperand(0);
135 const MachineOperand &Op1 = MI.getOperand(1);
136 assert(Op0.isReg() && Op1.isReg());
138 Register DestReg = Op0.getReg();
139 Register SrcReg = Op1.getReg();
140 return Hexagon::IntRegsRegClass.contains(DestReg) &&
141 Hexagon::IntRegsRegClass.contains(SrcReg);
144 case Hexagon::A2_tfrsi: {
145 // A transfer-immediate can be combined if its argument is a signed 8bit
146 // value.
147 const MachineOperand &Op0 = MI.getOperand(0);
148 const MachineOperand &Op1 = MI.getOperand(1);
149 assert(Op0.isReg());
151 Register DestReg = Op0.getReg();
152 // Ensure that TargetFlags are MO_NO_FLAG for a global. This is a
153 // workaround for an ABI bug that prevents GOT relocations on combine
154 // instructions
155 if (!Op1.isImm() && Op1.getTargetFlags() != HexagonII::MO_NO_FLAG)
156 return false;
158 // Only combine constant extended A2_tfrsi if we are in aggressive mode.
159 bool NotExt = Op1.isImm() && isInt<8>(Op1.getImm());
160 return Hexagon::IntRegsRegClass.contains(DestReg) &&
161 (ShouldCombineAggressively || NotExt);
164 case Hexagon::V6_vassign:
165 return true;
167 default:
168 break;
171 return false;
174 template <unsigned N> static bool isGreaterThanNBitTFRI(const MachineInstr &I) {
175 if (I.getOpcode() == Hexagon::TFRI64_V4 ||
176 I.getOpcode() == Hexagon::A2_tfrsi) {
177 const MachineOperand &Op = I.getOperand(1);
178 return !Op.isImm() || !isInt<N>(Op.getImm());
180 return false;
183 /// areCombinableOperations - Returns true if the two instruction can be merge
184 /// into a combine (ignoring register constraints).
185 static bool areCombinableOperations(const TargetRegisterInfo *TRI,
186 MachineInstr &HighRegInst,
187 MachineInstr &LowRegInst, bool AllowC64) {
188 unsigned HiOpc = HighRegInst.getOpcode();
189 unsigned LoOpc = LowRegInst.getOpcode();
191 auto verifyOpc = [](unsigned Opc) -> void {
192 switch (Opc) {
193 case Hexagon::A2_tfr:
194 case Hexagon::A2_tfrsi:
195 case Hexagon::V6_vassign:
196 break;
197 default:
198 llvm_unreachable("Unexpected opcode");
201 verifyOpc(HiOpc);
202 verifyOpc(LoOpc);
204 if (HiOpc == Hexagon::V6_vassign || LoOpc == Hexagon::V6_vassign)
205 return HiOpc == LoOpc;
207 if (!AllowC64) {
208 // There is no combine of two constant extended values.
209 if (isGreaterThanNBitTFRI<8>(HighRegInst) &&
210 isGreaterThanNBitTFRI<6>(LowRegInst))
211 return false;
214 // There is a combine of two constant extended values into CONST64,
215 // provided both constants are true immediates.
216 if (isGreaterThanNBitTFRI<16>(HighRegInst) &&
217 isGreaterThanNBitTFRI<16>(LowRegInst) && !IsConst64Disabled)
218 return (HighRegInst.getOperand(1).isImm() &&
219 LowRegInst.getOperand(1).isImm());
221 // There is no combine of two constant extended values, unless handled above
222 // Make both 8-bit size checks to allow both combine (#,##) and combine(##,#)
223 if (isGreaterThanNBitTFRI<8>(HighRegInst) &&
224 isGreaterThanNBitTFRI<8>(LowRegInst))
225 return false;
227 return true;
230 static bool isEvenReg(unsigned Reg) {
231 assert(Register::isPhysicalRegister(Reg));
232 if (Hexagon::IntRegsRegClass.contains(Reg))
233 return (Reg - Hexagon::R0) % 2 == 0;
234 if (Hexagon::HvxVRRegClass.contains(Reg))
235 return (Reg - Hexagon::V0) % 2 == 0;
236 llvm_unreachable("Invalid register");
239 static void removeKillInfo(MachineInstr &MI, unsigned RegNotKilled) {
240 for (unsigned I = 0, E = MI.getNumOperands(); I != E; ++I) {
241 MachineOperand &Op = MI.getOperand(I);
242 if (!Op.isReg() || Op.getReg() != RegNotKilled || !Op.isKill())
243 continue;
244 Op.setIsKill(false);
248 /// Returns true if it is unsafe to move a copy instruction from \p UseReg to
249 /// \p DestReg over the instruction \p MI.
250 static bool isUnsafeToMoveAcross(MachineInstr &MI, unsigned UseReg,
251 unsigned DestReg,
252 const TargetRegisterInfo *TRI) {
253 return (UseReg && (MI.modifiesRegister(UseReg, TRI))) ||
254 MI.modifiesRegister(DestReg, TRI) || MI.readsRegister(DestReg, TRI) ||
255 MI.hasUnmodeledSideEffects() || MI.isInlineAsm() ||
256 MI.isMetaInstruction();
259 static Register UseReg(const MachineOperand& MO) {
260 return MO.isReg() ? MO.getReg() : Register();
263 /// isSafeToMoveTogether - Returns true if it is safe to move I1 next to I2 such
264 /// that the two instructions can be paired in a combine.
265 bool HexagonCopyToCombine::isSafeToMoveTogether(MachineInstr &I1,
266 MachineInstr &I2,
267 unsigned I1DestReg,
268 unsigned I2DestReg,
269 bool &DoInsertAtI1) {
270 Register I2UseReg = UseReg(I2.getOperand(1));
272 // It is not safe to move I1 and I2 into one combine if I2 has a true
273 // dependence on I1.
274 if (I2UseReg && I1.modifiesRegister(I2UseReg, TRI))
275 return false;
277 bool isSafe = true;
279 // First try to move I2 towards I1.
281 // A reverse_iterator instantiated like below starts before I2, and I1
282 // respectively.
283 // Look at instructions I in between I2 and (excluding) I1.
284 MachineBasicBlock::reverse_iterator I = ++I2.getIterator().getReverse();
285 MachineBasicBlock::reverse_iterator End = I1.getIterator().getReverse();
286 // At 03 we got better results (dhrystone!) by being more conservative.
287 if (!ShouldCombineAggressively)
288 End = ++I1.getIterator().getReverse();
289 // If I2 kills its operand and we move I2 over an instruction that also
290 // uses I2's use reg we need to modify that (first) instruction to now kill
291 // this reg.
292 unsigned KilledOperand = 0;
293 if (I2.killsRegister(I2UseReg))
294 KilledOperand = I2UseReg;
295 MachineInstr *KillingInstr = nullptr;
297 for (; I != End; ++I) {
298 // If the intervening instruction I:
299 // * modifies I2's use reg
300 // * modifies I2's def reg
301 // * reads I2's def reg
302 // * or has unmodelled side effects
303 // we can't move I2 across it.
304 if (I->isDebugInstr())
305 continue;
307 if (isUnsafeToMoveAcross(*I, I2UseReg, I2DestReg, TRI)) {
308 isSafe = false;
309 break;
312 // Update first use of the killed operand.
313 if (!KillingInstr && KilledOperand &&
314 I->readsRegister(KilledOperand, TRI))
315 KillingInstr = &*I;
317 if (isSafe) {
318 // Update the intermediate instruction to with the kill flag.
319 if (KillingInstr) {
320 bool Added = KillingInstr->addRegisterKilled(KilledOperand, TRI, true);
321 (void)Added; // suppress compiler warning
322 assert(Added && "Must successfully update kill flag");
323 removeKillInfo(I2, KilledOperand);
325 DoInsertAtI1 = true;
326 return true;
330 // Try to move I1 towards I2.
332 // Look at instructions I in between I1 and (excluding) I2.
333 MachineBasicBlock::iterator I(I1), End(I2);
334 // At O3 we got better results (dhrystone) by being more conservative here.
335 if (!ShouldCombineAggressively)
336 End = std::next(MachineBasicBlock::iterator(I2));
337 Register I1UseReg = UseReg(I1.getOperand(1));
338 // Track killed operands. If we move across an instruction that kills our
339 // operand, we need to update the kill information on the moved I1. It kills
340 // the operand now.
341 MachineInstr *KillingInstr = nullptr;
342 unsigned KilledOperand = 0;
344 while(++I != End) {
345 MachineInstr &MI = *I;
346 // If the intervening instruction MI:
347 // * modifies I1's use reg
348 // * modifies I1's def reg
349 // * reads I1's def reg
350 // * or has unmodelled side effects
351 // We introduce this special case because llvm has no api to remove a
352 // kill flag for a register (a removeRegisterKilled() analogous to
353 // addRegisterKilled) that handles aliased register correctly.
354 // * or has a killed aliased register use of I1's use reg
355 // %d4 = A2_tfrpi 16
356 // %r6 = A2_tfr %r9
357 // %r8 = KILL %r8, implicit killed %d4
358 // If we want to move R6 = across the KILL instruction we would have
359 // to remove the implicit killed %d4 operand. For now, we are
360 // conservative and disallow the move.
361 // we can't move I1 across it.
362 if (MI.isDebugInstr()) {
363 if (MI.readsRegister(I1DestReg, TRI)) // Move this instruction after I2.
364 DbgMItoMove.push_back(&MI);
365 continue;
368 if (isUnsafeToMoveAcross(MI, I1UseReg, I1DestReg, TRI) ||
369 // Check for an aliased register kill. Bail out if we see one.
370 (!MI.killsRegister(I1UseReg) && MI.killsRegister(I1UseReg, TRI)))
371 return false;
373 // Check for an exact kill (registers match).
374 if (I1UseReg && MI.killsRegister(I1UseReg)) {
375 assert(!KillingInstr && "Should only see one killing instruction");
376 KilledOperand = I1UseReg;
377 KillingInstr = &MI;
380 if (KillingInstr) {
381 removeKillInfo(*KillingInstr, KilledOperand);
382 // Update I1 to set the kill flag. This flag will later be picked up by
383 // the new COMBINE instruction.
384 bool Added = I1.addRegisterKilled(KilledOperand, TRI);
385 (void)Added; // suppress compiler warning
386 assert(Added && "Must successfully update kill flag");
388 DoInsertAtI1 = false;
391 return true;
394 /// findPotentialNewifiableTFRs - Finds tranfers that feed stores that could be
395 /// newified. (A use of a 64 bit register define can not be newified)
396 void
397 HexagonCopyToCombine::findPotentialNewifiableTFRs(MachineBasicBlock &BB) {
398 DenseMap<unsigned, MachineInstr *> LastDef;
399 for (MachineInstr &MI : BB) {
400 if (MI.isDebugInstr())
401 continue;
403 // Mark TFRs that feed a potential new value store as such.
404 if (TII->mayBeNewStore(MI)) {
405 // Look for uses of TFR instructions.
406 for (unsigned OpdIdx = 0, OpdE = MI.getNumOperands(); OpdIdx != OpdE;
407 ++OpdIdx) {
408 MachineOperand &Op = MI.getOperand(OpdIdx);
410 // Skip over anything except register uses.
411 if (!Op.isReg() || !Op.isUse() || !Op.getReg())
412 continue;
414 // Look for the defining instruction.
415 Register Reg = Op.getReg();
416 MachineInstr *DefInst = LastDef[Reg];
417 if (!DefInst)
418 continue;
419 if (!isCombinableInstType(*DefInst, TII, ShouldCombineAggressively))
420 continue;
422 // Only close newifiable stores should influence the decision.
423 // Ignore the debug instructions in between.
424 MachineBasicBlock::iterator It(DefInst);
425 unsigned NumInstsToDef = 0;
426 while (&*It != &MI) {
427 if (!It->isDebugInstr())
428 ++NumInstsToDef;
429 ++It;
432 if (NumInstsToDef > MaxNumOfInstsBetweenNewValueStoreAndTFR)
433 continue;
435 PotentiallyNewifiableTFR.insert(DefInst);
437 // Skip to next instruction.
438 continue;
441 // Put instructions that last defined integer or double registers into the
442 // map.
443 for (MachineOperand &Op : MI.operands()) {
444 if (Op.isReg()) {
445 if (!Op.isDef() || !Op.getReg())
446 continue;
447 Register Reg = Op.getReg();
448 if (Hexagon::DoubleRegsRegClass.contains(Reg)) {
449 for (MCSubRegIterator SubRegs(Reg, TRI); SubRegs.isValid(); ++SubRegs)
450 LastDef[*SubRegs] = &MI;
451 } else if (Hexagon::IntRegsRegClass.contains(Reg))
452 LastDef[Reg] = &MI;
453 } else if (Op.isRegMask()) {
454 for (unsigned Reg : Hexagon::IntRegsRegClass)
455 if (Op.clobbersPhysReg(Reg))
456 LastDef[Reg] = &MI;
462 bool HexagonCopyToCombine::runOnMachineFunction(MachineFunction &MF) {
463 if (skipFunction(MF.getFunction()))
464 return false;
466 if (IsCombinesDisabled) return false;
468 bool HasChanged = false;
470 // Get target info.
471 ST = &MF.getSubtarget<HexagonSubtarget>();
472 TRI = ST->getRegisterInfo();
473 TII = ST->getInstrInfo();
475 const Function &F = MF.getFunction();
476 bool OptForSize = F.hasFnAttribute(Attribute::OptimizeForSize);
478 // Combine aggressively (for code size)
479 ShouldCombineAggressively =
480 MF.getTarget().getOptLevel() <= CodeGenOpt::Default;
482 // Disable CONST64 for tiny core since it takes a LD resource.
483 if (!OptForSize && ST->isTinyCore())
484 IsConst64Disabled = true;
486 // Traverse basic blocks.
487 for (MachineFunction::iterator BI = MF.begin(), BE = MF.end(); BI != BE;
488 ++BI) {
489 PotentiallyNewifiableTFR.clear();
490 findPotentialNewifiableTFRs(*BI);
492 // Traverse instructions in basic block.
493 for(MachineBasicBlock::iterator MI = BI->begin(), End = BI->end();
494 MI != End;) {
495 MachineInstr &I1 = *MI++;
497 if (I1.isDebugInstr())
498 continue;
500 // Don't combine a TFR whose user could be newified (instructions that
501 // define double registers can not be newified - Programmer's Ref Manual
502 // 5.4.2 New-value stores).
503 if (ShouldCombineAggressively && PotentiallyNewifiableTFR.count(&I1))
504 continue;
506 // Ignore instructions that are not combinable.
507 if (!isCombinableInstType(I1, TII, ShouldCombineAggressively))
508 continue;
510 // Find a second instruction that can be merged into a combine
511 // instruction. In addition, also find all the debug instructions that
512 // need to be moved along with it.
513 bool DoInsertAtI1 = false;
514 DbgMItoMove.clear();
515 MachineInstr *I2 = findPairable(I1, DoInsertAtI1, OptForSize);
516 if (I2) {
517 HasChanged = true;
518 combine(I1, *I2, MI, DoInsertAtI1, OptForSize);
523 return HasChanged;
526 /// findPairable - Returns an instruction that can be merged with \p I1 into a
527 /// COMBINE instruction or 0 if no such instruction can be found. Returns true
528 /// in \p DoInsertAtI1 if the combine must be inserted at instruction \p I1
529 /// false if the combine must be inserted at the returned instruction.
530 MachineInstr *HexagonCopyToCombine::findPairable(MachineInstr &I1,
531 bool &DoInsertAtI1,
532 bool AllowC64) {
533 MachineBasicBlock::iterator I2 = std::next(MachineBasicBlock::iterator(I1));
534 while (I2 != I1.getParent()->end() && I2->isDebugInstr())
535 ++I2;
537 Register I1DestReg = I1.getOperand(0).getReg();
539 for (MachineBasicBlock::iterator End = I1.getParent()->end(); I2 != End;
540 ++I2) {
541 // Bail out early if we see a second definition of I1DestReg.
542 if (I2->modifiesRegister(I1DestReg, TRI))
543 break;
545 // Ignore non-combinable instructions.
546 if (!isCombinableInstType(*I2, TII, ShouldCombineAggressively))
547 continue;
549 // Don't combine a TFR whose user could be newified.
550 if (ShouldCombineAggressively && PotentiallyNewifiableTFR.count(&*I2))
551 continue;
553 Register I2DestReg = I2->getOperand(0).getReg();
555 // Check that registers are adjacent and that the first destination register
556 // is even.
557 bool IsI1LowReg = (I2DestReg - I1DestReg) == 1;
558 bool IsI2LowReg = (I1DestReg - I2DestReg) == 1;
559 unsigned FirstRegIndex = IsI1LowReg ? I1DestReg : I2DestReg;
560 if ((!IsI1LowReg && !IsI2LowReg) || !isEvenReg(FirstRegIndex))
561 continue;
563 // Check that the two instructions are combinable.
564 // The order matters because in a A2_tfrsi we might can encode a int8 as
565 // the hi reg operand but only a uint6 as the low reg operand.
566 if ((IsI2LowReg && !areCombinableOperations(TRI, I1, *I2, AllowC64)) ||
567 (IsI1LowReg && !areCombinableOperations(TRI, *I2, I1, AllowC64)))
568 break;
570 if (isSafeToMoveTogether(I1, *I2, I1DestReg, I2DestReg, DoInsertAtI1))
571 return &*I2;
573 // Not safe. Stop searching.
574 break;
576 return nullptr;
579 void HexagonCopyToCombine::combine(MachineInstr &I1, MachineInstr &I2,
580 MachineBasicBlock::iterator &MI,
581 bool DoInsertAtI1, bool OptForSize) {
582 // We are going to delete I2. If MI points to I2 advance it to the next
583 // instruction.
584 if (MI == I2.getIterator())
585 ++MI;
587 // Figure out whether I1 or I2 goes into the lowreg part.
588 Register I1DestReg = I1.getOperand(0).getReg();
589 Register I2DestReg = I2.getOperand(0).getReg();
590 bool IsI1Loreg = (I2DestReg - I1DestReg) == 1;
591 unsigned LoRegDef = IsI1Loreg ? I1DestReg : I2DestReg;
592 unsigned SubLo;
594 const TargetRegisterClass *SuperRC = nullptr;
595 if (Hexagon::IntRegsRegClass.contains(LoRegDef)) {
596 SuperRC = &Hexagon::DoubleRegsRegClass;
597 SubLo = Hexagon::isub_lo;
598 } else if (Hexagon::HvxVRRegClass.contains(LoRegDef)) {
599 assert(ST->useHVXOps());
600 SuperRC = &Hexagon::HvxWRRegClass;
601 SubLo = Hexagon::vsub_lo;
602 } else
603 llvm_unreachable("Unexpected register class");
605 // Get the double word register.
606 unsigned DoubleRegDest = TRI->getMatchingSuperReg(LoRegDef, SubLo, SuperRC);
607 assert(DoubleRegDest != 0 && "Expect a valid register");
609 // Setup source operands.
610 MachineOperand &LoOperand = IsI1Loreg ? I1.getOperand(1) : I2.getOperand(1);
611 MachineOperand &HiOperand = IsI1Loreg ? I2.getOperand(1) : I1.getOperand(1);
613 // Figure out which source is a register and which a constant.
614 bool IsHiReg = HiOperand.isReg();
615 bool IsLoReg = LoOperand.isReg();
617 // There is a combine of two constant extended values into CONST64.
618 bool IsC64 = OptForSize && LoOperand.isImm() && HiOperand.isImm() &&
619 isGreaterThanNBitTFRI<16>(I1) && isGreaterThanNBitTFRI<16>(I2);
621 MachineBasicBlock::iterator InsertPt(DoInsertAtI1 ? I1 : I2);
622 // Emit combine.
623 if (IsHiReg && IsLoReg)
624 emitCombineRR(InsertPt, DoubleRegDest, HiOperand, LoOperand);
625 else if (IsHiReg)
626 emitCombineRI(InsertPt, DoubleRegDest, HiOperand, LoOperand);
627 else if (IsLoReg)
628 emitCombineIR(InsertPt, DoubleRegDest, HiOperand, LoOperand);
629 else if (IsC64 && !IsConst64Disabled)
630 emitConst64(InsertPt, DoubleRegDest, HiOperand, LoOperand);
631 else
632 emitCombineII(InsertPt, DoubleRegDest, HiOperand, LoOperand);
634 // Move debug instructions along with I1 if it's being
635 // moved towards I2.
636 if (!DoInsertAtI1 && DbgMItoMove.size() != 0) {
637 // Insert debug instructions at the new location before I2.
638 MachineBasicBlock *BB = InsertPt->getParent();
639 for (auto NewMI : DbgMItoMove) {
640 // If iterator MI is pointing to DEBUG_VAL, make sure
641 // MI now points to next relevant instruction.
642 if (NewMI == MI)
643 ++MI;
644 BB->splice(InsertPt, BB, NewMI);
648 I1.eraseFromParent();
649 I2.eraseFromParent();
652 void HexagonCopyToCombine::emitConst64(MachineBasicBlock::iterator &InsertPt,
653 unsigned DoubleDestReg,
654 MachineOperand &HiOperand,
655 MachineOperand &LoOperand) {
656 LLVM_DEBUG(dbgs() << "Found a CONST64\n");
658 DebugLoc DL = InsertPt->getDebugLoc();
659 MachineBasicBlock *BB = InsertPt->getParent();
660 assert(LoOperand.isImm() && HiOperand.isImm() &&
661 "Both operands must be immediate");
663 int64_t V = HiOperand.getImm();
664 V = (V << 32) | (0x0ffffffffLL & LoOperand.getImm());
665 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::CONST64), DoubleDestReg)
666 .addImm(V);
669 void HexagonCopyToCombine::emitCombineII(MachineBasicBlock::iterator &InsertPt,
670 unsigned DoubleDestReg,
671 MachineOperand &HiOperand,
672 MachineOperand &LoOperand) {
673 DebugLoc DL = InsertPt->getDebugLoc();
674 MachineBasicBlock *BB = InsertPt->getParent();
676 // Handle globals.
677 if (HiOperand.isGlobal()) {
678 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
679 .addGlobalAddress(HiOperand.getGlobal(), HiOperand.getOffset(),
680 HiOperand.getTargetFlags())
681 .addImm(LoOperand.getImm());
682 return;
684 if (LoOperand.isGlobal()) {
685 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
686 .addImm(HiOperand.getImm())
687 .addGlobalAddress(LoOperand.getGlobal(), LoOperand.getOffset(),
688 LoOperand.getTargetFlags());
689 return;
692 // Handle block addresses.
693 if (HiOperand.isBlockAddress()) {
694 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
695 .addBlockAddress(HiOperand.getBlockAddress(), HiOperand.getOffset(),
696 HiOperand.getTargetFlags())
697 .addImm(LoOperand.getImm());
698 return;
700 if (LoOperand.isBlockAddress()) {
701 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
702 .addImm(HiOperand.getImm())
703 .addBlockAddress(LoOperand.getBlockAddress(), LoOperand.getOffset(),
704 LoOperand.getTargetFlags());
705 return;
708 // Handle jump tables.
709 if (HiOperand.isJTI()) {
710 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
711 .addJumpTableIndex(HiOperand.getIndex(), HiOperand.getTargetFlags())
712 .addImm(LoOperand.getImm());
713 return;
715 if (LoOperand.isJTI()) {
716 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
717 .addImm(HiOperand.getImm())
718 .addJumpTableIndex(LoOperand.getIndex(), LoOperand.getTargetFlags());
719 return;
722 // Handle constant pools.
723 if (HiOperand.isCPI()) {
724 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
725 .addConstantPoolIndex(HiOperand.getIndex(), HiOperand.getOffset(),
726 HiOperand.getTargetFlags())
727 .addImm(LoOperand.getImm());
728 return;
730 if (LoOperand.isCPI()) {
731 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
732 .addImm(HiOperand.getImm())
733 .addConstantPoolIndex(LoOperand.getIndex(), LoOperand.getOffset(),
734 LoOperand.getTargetFlags());
735 return;
738 // First preference should be given to Hexagon::A2_combineii instruction
739 // as it can include U6 (in Hexagon::A4_combineii) as well.
740 // In this instruction, HiOperand is const extended, if required.
741 if (isInt<8>(LoOperand.getImm())) {
742 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
743 .addImm(HiOperand.getImm())
744 .addImm(LoOperand.getImm());
745 return;
748 // In this instruction, LoOperand is const extended, if required.
749 if (isInt<8>(HiOperand.getImm())) {
750 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
751 .addImm(HiOperand.getImm())
752 .addImm(LoOperand.getImm());
753 return;
756 // Insert new combine instruction.
757 // DoubleRegDest = combine #HiImm, #LoImm
758 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
759 .addImm(HiOperand.getImm())
760 .addImm(LoOperand.getImm());
763 void HexagonCopyToCombine::emitCombineIR(MachineBasicBlock::iterator &InsertPt,
764 unsigned DoubleDestReg,
765 MachineOperand &HiOperand,
766 MachineOperand &LoOperand) {
767 Register LoReg = LoOperand.getReg();
768 unsigned LoRegKillFlag = getKillRegState(LoOperand.isKill());
770 DebugLoc DL = InsertPt->getDebugLoc();
771 MachineBasicBlock *BB = InsertPt->getParent();
773 // Handle globals.
774 if (HiOperand.isGlobal()) {
775 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
776 .addGlobalAddress(HiOperand.getGlobal(), HiOperand.getOffset(),
777 HiOperand.getTargetFlags())
778 .addReg(LoReg, LoRegKillFlag);
779 return;
781 // Handle block addresses.
782 if (HiOperand.isBlockAddress()) {
783 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
784 .addBlockAddress(HiOperand.getBlockAddress(), HiOperand.getOffset(),
785 HiOperand.getTargetFlags())
786 .addReg(LoReg, LoRegKillFlag);
787 return;
789 // Handle jump tables.
790 if (HiOperand.isJTI()) {
791 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
792 .addJumpTableIndex(HiOperand.getIndex(), HiOperand.getTargetFlags())
793 .addReg(LoReg, LoRegKillFlag);
794 return;
796 // Handle constant pools.
797 if (HiOperand.isCPI()) {
798 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
799 .addConstantPoolIndex(HiOperand.getIndex(), HiOperand.getOffset(),
800 HiOperand.getTargetFlags())
801 .addReg(LoReg, LoRegKillFlag);
802 return;
804 // Insert new combine instruction.
805 // DoubleRegDest = combine #HiImm, LoReg
806 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
807 .addImm(HiOperand.getImm())
808 .addReg(LoReg, LoRegKillFlag);
811 void HexagonCopyToCombine::emitCombineRI(MachineBasicBlock::iterator &InsertPt,
812 unsigned DoubleDestReg,
813 MachineOperand &HiOperand,
814 MachineOperand &LoOperand) {
815 unsigned HiRegKillFlag = getKillRegState(HiOperand.isKill());
816 Register HiReg = HiOperand.getReg();
818 DebugLoc DL = InsertPt->getDebugLoc();
819 MachineBasicBlock *BB = InsertPt->getParent();
821 // Handle global.
822 if (LoOperand.isGlobal()) {
823 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
824 .addReg(HiReg, HiRegKillFlag)
825 .addGlobalAddress(LoOperand.getGlobal(), LoOperand.getOffset(),
826 LoOperand.getTargetFlags());
827 return;
829 // Handle block addresses.
830 if (LoOperand.isBlockAddress()) {
831 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
832 .addReg(HiReg, HiRegKillFlag)
833 .addBlockAddress(LoOperand.getBlockAddress(), LoOperand.getOffset(),
834 LoOperand.getTargetFlags());
835 return;
837 // Handle jump tables.
838 if (LoOperand.isJTI()) {
839 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
840 .addReg(HiOperand.getReg(), HiRegKillFlag)
841 .addJumpTableIndex(LoOperand.getIndex(), LoOperand.getTargetFlags());
842 return;
844 // Handle constant pools.
845 if (LoOperand.isCPI()) {
846 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
847 .addReg(HiOperand.getReg(), HiRegKillFlag)
848 .addConstantPoolIndex(LoOperand.getIndex(), LoOperand.getOffset(),
849 LoOperand.getTargetFlags());
850 return;
853 // Insert new combine instruction.
854 // DoubleRegDest = combine HiReg, #LoImm
855 BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
856 .addReg(HiReg, HiRegKillFlag)
857 .addImm(LoOperand.getImm());
860 void HexagonCopyToCombine::emitCombineRR(MachineBasicBlock::iterator &InsertPt,
861 unsigned DoubleDestReg,
862 MachineOperand &HiOperand,
863 MachineOperand &LoOperand) {
864 unsigned LoRegKillFlag = getKillRegState(LoOperand.isKill());
865 unsigned HiRegKillFlag = getKillRegState(HiOperand.isKill());
866 Register LoReg = LoOperand.getReg();
867 Register HiReg = HiOperand.getReg();
869 DebugLoc DL = InsertPt->getDebugLoc();
870 MachineBasicBlock *BB = InsertPt->getParent();
872 // Insert new combine instruction.
873 // DoubleRegDest = combine HiReg, LoReg
874 unsigned NewOpc;
875 if (Hexagon::DoubleRegsRegClass.contains(DoubleDestReg)) {
876 NewOpc = Hexagon::A2_combinew;
877 } else if (Hexagon::HvxWRRegClass.contains(DoubleDestReg)) {
878 assert(ST->useHVXOps());
879 NewOpc = Hexagon::V6_vcombine;
880 } else
881 llvm_unreachable("Unexpected register");
883 BuildMI(*BB, InsertPt, DL, TII->get(NewOpc), DoubleDestReg)
884 .addReg(HiReg, HiRegKillFlag)
885 .addReg(LoReg, LoRegKillFlag);
888 FunctionPass *llvm::createHexagonCopyToCombine() {
889 return new HexagonCopyToCombine();