1 //===-- SimpleRegisterCoalescing.cpp - Register Coalescing ----------------===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file implements a simple register coalescing pass that attempts to
11 // aggressively coalesce every register copy that it can.
13 //===----------------------------------------------------------------------===//
15 #define DEBUG_TYPE "regcoalescing"
16 #include "SimpleRegisterCoalescing.h"
17 #include "VirtRegMap.h"
18 #include "llvm/CodeGen/LiveIntervalAnalysis.h"
19 #include "llvm/Value.h"
20 #include "llvm/CodeGen/MachineFrameInfo.h"
21 #include "llvm/CodeGen/MachineInstr.h"
22 #include "llvm/CodeGen/MachineLoopInfo.h"
23 #include "llvm/CodeGen/MachineRegisterInfo.h"
24 #include "llvm/CodeGen/Passes.h"
25 #include "llvm/CodeGen/RegisterCoalescer.h"
26 #include "llvm/Target/TargetInstrInfo.h"
27 #include "llvm/Target/TargetMachine.h"
28 #include "llvm/Target/TargetOptions.h"
29 #include "llvm/Support/CommandLine.h"
30 #include "llvm/Support/Debug.h"
31 #include "llvm/ADT/SmallSet.h"
32 #include "llvm/ADT/Statistic.h"
33 #include "llvm/ADT/STLExtras.h"
38 STATISTIC(numJoins
, "Number of interval joins performed");
39 STATISTIC(numCrossRCs
, "Number of cross class joins performed");
40 STATISTIC(numCommutes
, "Number of instruction commuting performed");
41 STATISTIC(numExtends
, "Number of copies extended");
42 STATISTIC(NumReMats
, "Number of instructions re-materialized");
43 STATISTIC(numPeep
, "Number of identity moves eliminated after coalescing");
44 STATISTIC(numAborts
, "Number of times interval joining aborted");
45 STATISTIC(numDeadValNo
, "Number of valno def marked dead");
47 char SimpleRegisterCoalescing::ID
= 0;
49 EnableJoining("join-liveintervals",
50 cl::desc("Coalesce copies (default=true)"),
54 NewHeuristic("new-coalescer-heuristic",
55 cl::desc("Use new coalescer heuristic"),
56 cl::init(false), cl::Hidden
);
59 CrossClassJoin("join-cross-class-copies",
60 cl::desc("Coalesce cross register class copies"),
61 cl::init(false), cl::Hidden
);
63 static RegisterPass
<SimpleRegisterCoalescing
>
64 X("simple-register-coalescing", "Simple Register Coalescing");
66 // Declare that we implement the RegisterCoalescer interface
67 static RegisterAnalysisGroup
<RegisterCoalescer
, true/*The Default*/> V(X
);
69 const PassInfo
*const llvm::SimpleRegisterCoalescingID
= &X
;
71 void SimpleRegisterCoalescing::getAnalysisUsage(AnalysisUsage
&AU
) const {
72 AU
.addRequired
<LiveIntervals
>();
73 AU
.addPreserved
<LiveIntervals
>();
74 AU
.addRequired
<MachineLoopInfo
>();
75 AU
.addPreserved
<MachineLoopInfo
>();
76 AU
.addPreservedID(MachineDominatorsID
);
78 AU
.addPreservedID(StrongPHIEliminationID
);
80 AU
.addPreservedID(PHIEliminationID
);
81 AU
.addPreservedID(TwoAddressInstructionPassID
);
82 MachineFunctionPass::getAnalysisUsage(AU
);
85 /// AdjustCopiesBackFrom - We found a non-trivially-coalescable copy with IntA
86 /// being the source and IntB being the dest, thus this defines a value number
87 /// in IntB. If the source value number (in IntA) is defined by a copy from B,
88 /// see if we can merge these two pieces of B into a single value number,
89 /// eliminating a copy. For example:
93 /// B1 = A3 <- this copy
95 /// In this case, B0 can be extended to where the B1 copy lives, allowing the B1
96 /// value number to be replaced with B0 (which simplifies the B liveinterval).
98 /// This returns true if an interval was modified.
100 bool SimpleRegisterCoalescing::AdjustCopiesBackFrom(LiveInterval
&IntA
,
102 MachineInstr
*CopyMI
) {
103 unsigned CopyIdx
= li_
->getDefIndex(li_
->getInstructionIndex(CopyMI
));
105 // BValNo is a value number in B that is defined by a copy from A. 'B3' in
106 // the example above.
107 LiveInterval::iterator BLR
= IntB
.FindLiveRangeContaining(CopyIdx
);
108 assert(BLR
!= IntB
.end() && "Live range not found!");
109 VNInfo
*BValNo
= BLR
->valno
;
111 // Get the location that B is defined at. Two options: either this value has
112 // an unknown definition point or it is defined at CopyIdx. If unknown, we
114 if (!BValNo
->copy
) return false;
115 assert(BValNo
->def
== CopyIdx
&& "Copy doesn't define the value?");
117 // AValNo is the value number in A that defines the copy, A3 in the example.
118 LiveInterval::iterator ALR
= IntA
.FindLiveRangeContaining(CopyIdx
-1);
119 assert(ALR
!= IntA
.end() && "Live range not found!");
120 VNInfo
*AValNo
= ALR
->valno
;
121 // If it's re-defined by an early clobber somewhere in the live range, then
122 // it's not safe to eliminate the copy. FIXME: This is a temporary workaround.
124 // 172 %ECX<def> = MOV32rr %reg1039<kill>
125 // 180 INLINEASM <es:subl $5,$1
126 // sbbl $3,$0>, 10, %EAX<def>, 14, %ECX<earlyclobber,def>, 9, %EAX<kill>,
127 // 36, <fi#0>, 1, %reg0, 0, 9, %ECX<kill>, 36, <fi#1>, 1, %reg0, 0
128 // 188 %EAX<def> = MOV32rr %EAX<kill>
129 // 196 %ECX<def> = MOV32rr %ECX<kill>
130 // 204 %ECX<def> = MOV32rr %ECX<kill>
131 // 212 %EAX<def> = MOV32rr %EAX<kill>
132 // 220 %EAX<def> = MOV32rr %EAX
133 // 228 %reg1039<def> = MOV32rr %ECX<kill>
134 // The early clobber operand ties ECX input to the ECX def.
136 // The live interval of ECX is represented as this:
137 // %reg20,inf = [46,47:1)[174,230:0) 0@174-(230) 1@46-(47)
138 // The coalescer has no idea there was a def in the middle of [174,230].
139 if (AValNo
->redefByEC
)
142 // If AValNo is defined as a copy from IntB, we can potentially process this.
143 // Get the instruction that defines this value number.
144 unsigned SrcReg
= li_
->getVNInfoSourceReg(AValNo
);
145 if (!SrcReg
) return false; // Not defined by a copy.
147 // If the value number is not defined by a copy instruction, ignore it.
149 // If the source register comes from an interval other than IntB, we can't
151 if (SrcReg
!= IntB
.reg
) return false;
153 // Get the LiveRange in IntB that this value number starts with.
154 LiveInterval::iterator ValLR
= IntB
.FindLiveRangeContaining(AValNo
->def
-1);
155 assert(ValLR
!= IntB
.end() && "Live range not found!");
157 // Make sure that the end of the live range is inside the same block as
159 MachineInstr
*ValLREndInst
= li_
->getInstructionFromIndex(ValLR
->end
-1);
161 ValLREndInst
->getParent() != CopyMI
->getParent()) return false;
163 // Okay, we now know that ValLR ends in the same block that the CopyMI
164 // live-range starts. If there are no intervening live ranges between them in
165 // IntB, we can merge them.
166 if (ValLR
+1 != BLR
) return false;
168 // If a live interval is a physical register, conservatively check if any
169 // of its sub-registers is overlapping the live interval of the virtual
170 // register. If so, do not coalesce.
171 if (TargetRegisterInfo::isPhysicalRegister(IntB
.reg
) &&
172 *tri_
->getSubRegisters(IntB
.reg
)) {
173 for (const unsigned* SR
= tri_
->getSubRegisters(IntB
.reg
); *SR
; ++SR
)
174 if (li_
->hasInterval(*SR
) && IntA
.overlaps(li_
->getInterval(*SR
))) {
175 DOUT
<< "Interfere with sub-register ";
176 DEBUG(li_
->getInterval(*SR
).print(DOUT
, tri_
));
181 DOUT
<< "\nExtending: "; IntB
.print(DOUT
, tri_
);
183 unsigned FillerStart
= ValLR
->end
, FillerEnd
= BLR
->start
;
184 // We are about to delete CopyMI, so need to remove it as the 'instruction
185 // that defines this value #'. Update the the valnum with the new defining
187 BValNo
->def
= FillerStart
;
190 // Okay, we can merge them. We need to insert a new liverange:
191 // [ValLR.end, BLR.begin) of either value number, then we merge the
192 // two value numbers.
193 IntB
.addRange(LiveRange(FillerStart
, FillerEnd
, BValNo
));
195 // If the IntB live range is assigned to a physical register, and if that
196 // physreg has sub-registers, update their live intervals as well.
197 if (TargetRegisterInfo::isPhysicalRegister(IntB
.reg
)) {
198 for (const unsigned *SR
= tri_
->getSubRegisters(IntB
.reg
); *SR
; ++SR
) {
199 LiveInterval
&SRLI
= li_
->getInterval(*SR
);
200 SRLI
.addRange(LiveRange(FillerStart
, FillerEnd
,
201 SRLI
.getNextValue(FillerStart
, 0, li_
->getVNInfoAllocator())));
205 // Okay, merge "B1" into the same value number as "B0".
206 if (BValNo
!= ValLR
->valno
) {
207 IntB
.addKills(ValLR
->valno
, BValNo
->kills
);
208 IntB
.MergeValueNumberInto(BValNo
, ValLR
->valno
);
210 DOUT
<< " result = "; IntB
.print(DOUT
, tri_
);
213 // If the source instruction was killing the source register before the
214 // merge, unset the isKill marker given the live range has been extended.
215 int UIdx
= ValLREndInst
->findRegisterUseOperandIdx(IntB
.reg
, true);
217 ValLREndInst
->getOperand(UIdx
).setIsKill(false);
218 IntB
.removeKill(ValLR
->valno
, FillerStart
);
225 /// HasOtherReachingDefs - Return true if there are definitions of IntB
226 /// other than BValNo val# that can reach uses of AValno val# of IntA.
227 bool SimpleRegisterCoalescing::HasOtherReachingDefs(LiveInterval
&IntA
,
231 for (LiveInterval::iterator AI
= IntA
.begin(), AE
= IntA
.end();
233 if (AI
->valno
!= AValNo
) continue;
234 LiveInterval::Ranges::iterator BI
=
235 std::upper_bound(IntB
.ranges
.begin(), IntB
.ranges
.end(), AI
->start
);
236 if (BI
!= IntB
.ranges
.begin())
238 for (; BI
!= IntB
.ranges
.end() && AI
->end
>= BI
->start
; ++BI
) {
239 if (BI
->valno
== BValNo
)
241 if (BI
->start
<= AI
->start
&& BI
->end
> AI
->start
)
243 if (BI
->start
> AI
->start
&& BI
->start
< AI
->end
)
250 /// RemoveCopyByCommutingDef - We found a non-trivially-coalescable copy with IntA
251 /// being the source and IntB being the dest, thus this defines a value number
252 /// in IntB. If the source value number (in IntA) is defined by a commutable
253 /// instruction and its other operand is coalesced to the copy dest register,
254 /// see if we can transform the copy into a noop by commuting the definition. For
257 /// A3 = op A2 B0<kill>
259 /// B1 = A3 <- this copy
261 /// = op A3 <- more uses
265 /// B2 = op B0 A2<kill>
267 /// B1 = B2 <- now an identify copy
269 /// = op B2 <- more uses
271 /// This returns true if an interval was modified.
273 bool SimpleRegisterCoalescing::RemoveCopyByCommutingDef(LiveInterval
&IntA
,
275 MachineInstr
*CopyMI
) {
276 unsigned CopyIdx
= li_
->getDefIndex(li_
->getInstructionIndex(CopyMI
));
278 // FIXME: For now, only eliminate the copy by commuting its def when the
279 // source register is a virtual register. We want to guard against cases
280 // where the copy is a back edge copy and commuting the def lengthen the
281 // live interval of the source register to the entire loop.
282 if (TargetRegisterInfo::isPhysicalRegister(IntA
.reg
))
285 // BValNo is a value number in B that is defined by a copy from A. 'B3' in
286 // the example above.
287 LiveInterval::iterator BLR
= IntB
.FindLiveRangeContaining(CopyIdx
);
288 assert(BLR
!= IntB
.end() && "Live range not found!");
289 VNInfo
*BValNo
= BLR
->valno
;
291 // Get the location that B is defined at. Two options: either this value has
292 // an unknown definition point or it is defined at CopyIdx. If unknown, we
294 if (!BValNo
->copy
) return false;
295 assert(BValNo
->def
== CopyIdx
&& "Copy doesn't define the value?");
297 // AValNo is the value number in A that defines the copy, A3 in the example.
298 LiveInterval::iterator ALR
= IntA
.FindLiveRangeContaining(CopyIdx
-1);
299 assert(ALR
!= IntA
.end() && "Live range not found!");
300 VNInfo
*AValNo
= ALR
->valno
;
301 // If other defs can reach uses of this def, then it's not safe to perform
303 if (AValNo
->def
== ~0U || AValNo
->def
== ~1U || AValNo
->hasPHIKill
)
305 MachineInstr
*DefMI
= li_
->getInstructionFromIndex(AValNo
->def
);
306 const TargetInstrDesc
&TID
= DefMI
->getDesc();
308 if (!TID
.isCommutable() ||
309 !tii_
->CommuteChangesDestination(DefMI
, NewDstIdx
))
312 MachineOperand
&NewDstMO
= DefMI
->getOperand(NewDstIdx
);
313 unsigned NewReg
= NewDstMO
.getReg();
314 if (NewReg
!= IntB
.reg
|| !NewDstMO
.isKill())
317 // Make sure there are no other definitions of IntB that would reach the
318 // uses which the new definition can reach.
319 if (HasOtherReachingDefs(IntA
, IntB
, AValNo
, BValNo
))
322 // If some of the uses of IntA.reg is already coalesced away, return false.
323 // It's not possible to determine whether it's safe to perform the coalescing.
324 for (MachineRegisterInfo::use_iterator UI
= mri_
->use_begin(IntA
.reg
),
325 UE
= mri_
->use_end(); UI
!= UE
; ++UI
) {
326 MachineInstr
*UseMI
= &*UI
;
327 unsigned UseIdx
= li_
->getInstructionIndex(UseMI
);
328 LiveInterval::iterator ULR
= IntA
.FindLiveRangeContaining(UseIdx
);
329 if (ULR
== IntA
.end())
331 if (ULR
->valno
== AValNo
&& JoinedCopies
.count(UseMI
))
335 // At this point we have decided that it is legal to do this
336 // transformation. Start by commuting the instruction.
337 MachineBasicBlock
*MBB
= DefMI
->getParent();
338 MachineInstr
*NewMI
= tii_
->commuteInstruction(DefMI
);
341 if (NewMI
!= DefMI
) {
342 li_
->ReplaceMachineInstrInMaps(DefMI
, NewMI
);
343 MBB
->insert(DefMI
, NewMI
);
346 unsigned OpIdx
= NewMI
->findRegisterUseOperandIdx(IntA
.reg
, false);
347 NewMI
->getOperand(OpIdx
).setIsKill();
349 bool BHasPHIKill
= BValNo
->hasPHIKill
;
350 SmallVector
<VNInfo
*, 4> BDeadValNos
;
351 SmallVector
<unsigned, 4> BKills
;
352 std::map
<unsigned, unsigned> BExtend
;
354 // If ALR and BLR overlaps and end of BLR extends beyond end of ALR, e.g.
363 // then do not add kills of A to the newly created B interval.
364 bool Extended
= BLR
->end
> ALR
->end
&& ALR
->end
!= ALR
->start
;
366 BExtend
[ALR
->end
] = BLR
->end
;
368 // Update uses of IntA of the specific Val# with IntB.
369 bool BHasSubRegs
= false;
370 if (TargetRegisterInfo::isPhysicalRegister(IntB
.reg
))
371 BHasSubRegs
= *tri_
->getSubRegisters(IntB
.reg
);
372 for (MachineRegisterInfo::use_iterator UI
= mri_
->use_begin(IntA
.reg
),
373 UE
= mri_
->use_end(); UI
!= UE
;) {
374 MachineOperand
&UseMO
= UI
.getOperand();
375 MachineInstr
*UseMI
= &*UI
;
377 if (JoinedCopies
.count(UseMI
))
379 unsigned UseIdx
= li_
->getInstructionIndex(UseMI
);
380 LiveInterval::iterator ULR
= IntA
.FindLiveRangeContaining(UseIdx
);
381 if (ULR
== IntA
.end() || ULR
->valno
!= AValNo
)
383 UseMO
.setReg(NewReg
);
386 if (UseMO
.isKill()) {
388 UseMO
.setIsKill(false);
390 BKills
.push_back(li_
->getUseIndex(UseIdx
)+1);
392 unsigned SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
;
393 if (!tii_
->isMoveInstr(*UseMI
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
))
395 if (DstReg
== IntB
.reg
) {
396 // This copy will become a noop. If it's defining a new val#,
397 // remove that val# as well. However this live range is being
398 // extended to the end of the existing live range defined by the copy.
399 unsigned DefIdx
= li_
->getDefIndex(UseIdx
);
400 const LiveRange
*DLR
= IntB
.getLiveRangeContaining(DefIdx
);
401 BHasPHIKill
|= DLR
->valno
->hasPHIKill
;
402 assert(DLR
->valno
->def
== DefIdx
);
403 BDeadValNos
.push_back(DLR
->valno
);
404 BExtend
[DLR
->start
] = DLR
->end
;
405 JoinedCopies
.insert(UseMI
);
406 // If this is a kill but it's going to be removed, the last use
407 // of the same val# is the new kill.
413 // We need to insert a new liverange: [ALR.start, LastUse). It may be we can
414 // simply extend BLR if CopyMI doesn't end the range.
415 DOUT
<< "\nExtending: "; IntB
.print(DOUT
, tri_
);
417 // Remove val#'s defined by copies that will be coalesced away.
418 for (unsigned i
= 0, e
= BDeadValNos
.size(); i
!= e
; ++i
) {
419 VNInfo
*DeadVNI
= BDeadValNos
[i
];
421 for (const unsigned *SR
= tri_
->getSubRegisters(IntB
.reg
); *SR
; ++SR
) {
422 LiveInterval
&SRLI
= li_
->getInterval(*SR
);
423 const LiveRange
*SRLR
= SRLI
.getLiveRangeContaining(DeadVNI
->def
);
424 SRLI
.removeValNo(SRLR
->valno
);
427 IntB
.removeValNo(BDeadValNos
[i
]);
430 // Extend BValNo by merging in IntA live ranges of AValNo. Val# definition
431 // is updated. Kills are also updated.
432 VNInfo
*ValNo
= BValNo
;
433 ValNo
->def
= AValNo
->def
;
435 for (unsigned j
= 0, ee
= ValNo
->kills
.size(); j
!= ee
; ++j
) {
436 unsigned Kill
= ValNo
->kills
[j
];
437 if (Kill
!= BLR
->end
)
438 BKills
.push_back(Kill
);
440 ValNo
->kills
.clear();
441 for (LiveInterval::iterator AI
= IntA
.begin(), AE
= IntA
.end();
443 if (AI
->valno
!= AValNo
) continue;
444 unsigned End
= AI
->end
;
445 std::map
<unsigned, unsigned>::iterator EI
= BExtend
.find(End
);
446 if (EI
!= BExtend
.end())
448 IntB
.addRange(LiveRange(AI
->start
, End
, ValNo
));
450 // If the IntB live range is assigned to a physical register, and if that
451 // physreg has sub-registers, update their live intervals as well.
453 for (const unsigned *SR
= tri_
->getSubRegisters(IntB
.reg
); *SR
; ++SR
) {
454 LiveInterval
&SRLI
= li_
->getInterval(*SR
);
455 SRLI
.MergeInClobberRange(AI
->start
, End
, li_
->getVNInfoAllocator());
459 IntB
.addKills(ValNo
, BKills
);
460 ValNo
->hasPHIKill
= BHasPHIKill
;
462 DOUT
<< " result = "; IntB
.print(DOUT
, tri_
);
465 DOUT
<< "\nShortening: "; IntA
.print(DOUT
, tri_
);
466 IntA
.removeValNo(AValNo
);
467 DOUT
<< " result = "; IntA
.print(DOUT
, tri_
);
474 /// isSameOrFallThroughBB - Return true if MBB == SuccMBB or MBB simply
475 /// fallthoughs to SuccMBB.
476 static bool isSameOrFallThroughBB(MachineBasicBlock
*MBB
,
477 MachineBasicBlock
*SuccMBB
,
478 const TargetInstrInfo
*tii_
) {
481 MachineBasicBlock
*TBB
= 0, *FBB
= 0;
482 SmallVector
<MachineOperand
, 4> Cond
;
483 return !tii_
->AnalyzeBranch(*MBB
, TBB
, FBB
, Cond
) && !TBB
&& !FBB
&&
484 MBB
->isSuccessor(SuccMBB
);
487 /// removeRange - Wrapper for LiveInterval::removeRange. This removes a range
488 /// from a physical register live interval as well as from the live intervals
489 /// of its sub-registers.
490 static void removeRange(LiveInterval
&li
, unsigned Start
, unsigned End
,
491 LiveIntervals
*li_
, const TargetRegisterInfo
*tri_
) {
492 li
.removeRange(Start
, End
, true);
493 if (TargetRegisterInfo::isPhysicalRegister(li
.reg
)) {
494 for (const unsigned* SR
= tri_
->getSubRegisters(li
.reg
); *SR
; ++SR
) {
495 if (!li_
->hasInterval(*SR
))
497 LiveInterval
&sli
= li_
->getInterval(*SR
);
498 unsigned RemoveEnd
= Start
;
499 while (RemoveEnd
!= End
) {
500 LiveInterval::iterator LR
= sli
.FindLiveRangeContaining(Start
);
503 RemoveEnd
= (LR
->end
< End
) ? LR
->end
: End
;
504 sli
.removeRange(Start
, RemoveEnd
, true);
511 /// TrimLiveIntervalToLastUse - If there is a last use in the same basic block
512 /// as the copy instruction, trim the live interval to the last use and return
515 SimpleRegisterCoalescing::TrimLiveIntervalToLastUse(unsigned CopyIdx
,
516 MachineBasicBlock
*CopyMBB
,
518 const LiveRange
*LR
) {
519 unsigned MBBStart
= li_
->getMBBStartIdx(CopyMBB
);
521 MachineOperand
*LastUse
= lastRegisterUse(LR
->start
, CopyIdx
-1, li
.reg
,
524 MachineInstr
*LastUseMI
= LastUse
->getParent();
525 if (!isSameOrFallThroughBB(LastUseMI
->getParent(), CopyMBB
, tii_
)) {
532 // r1025<dead> = r1024<kill>
533 if (MBBStart
< LR
->end
)
534 removeRange(li
, MBBStart
, LR
->end
, li_
, tri_
);
538 // There are uses before the copy, just shorten the live range to the end
540 LastUse
->setIsKill();
541 removeRange(li
, li_
->getDefIndex(LastUseIdx
), LR
->end
, li_
, tri_
);
542 li
.addKill(LR
->valno
, LastUseIdx
+1);
543 unsigned SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
;
544 if (tii_
->isMoveInstr(*LastUseMI
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
) &&
546 // Last use is itself an identity code.
547 int DeadIdx
= LastUseMI
->findRegisterDefOperandIdx(li
.reg
, false, tri_
);
548 LastUseMI
->getOperand(DeadIdx
).setIsDead();
554 if (LR
->start
<= MBBStart
&& LR
->end
> MBBStart
) {
555 if (LR
->start
== 0) {
556 assert(TargetRegisterInfo::isPhysicalRegister(li
.reg
));
557 // Live-in to the function but dead. Remove it from entry live-in set.
558 mf_
->begin()->removeLiveIn(li
.reg
);
560 // FIXME: Shorten intervals in BBs that reaches this BB.
566 /// ReMaterializeTrivialDef - If the source of a copy is defined by a trivial
567 /// computation, replace the copy by rematerialize the definition.
568 bool SimpleRegisterCoalescing::ReMaterializeTrivialDef(LiveInterval
&SrcInt
,
570 MachineInstr
*CopyMI
) {
571 unsigned CopyIdx
= li_
->getUseIndex(li_
->getInstructionIndex(CopyMI
));
572 LiveInterval::iterator SrcLR
= SrcInt
.FindLiveRangeContaining(CopyIdx
);
573 assert(SrcLR
!= SrcInt
.end() && "Live range not found!");
574 VNInfo
*ValNo
= SrcLR
->valno
;
575 // If other defs can reach uses of this def, then it's not safe to perform
577 if (ValNo
->def
== ~0U || ValNo
->def
== ~1U || ValNo
->hasPHIKill
)
579 MachineInstr
*DefMI
= li_
->getInstructionFromIndex(ValNo
->def
);
580 const TargetInstrDesc
&TID
= DefMI
->getDesc();
581 if (!TID
.isAsCheapAsAMove())
583 if (!DefMI
->getDesc().isRematerializable() ||
584 !tii_
->isTriviallyReMaterializable(DefMI
))
586 bool SawStore
= false;
587 if (!DefMI
->isSafeToMove(tii_
, SawStore
))
590 unsigned DefIdx
= li_
->getDefIndex(CopyIdx
);
591 const LiveRange
*DLR
= li_
->getInterval(DstReg
).getLiveRangeContaining(DefIdx
);
592 DLR
->valno
->copy
= NULL
;
593 // Don't forget to update sub-register intervals.
594 if (TargetRegisterInfo::isPhysicalRegister(DstReg
)) {
595 for (const unsigned* SR
= tri_
->getSubRegisters(DstReg
); *SR
; ++SR
) {
596 if (!li_
->hasInterval(*SR
))
598 DLR
= li_
->getInterval(*SR
).getLiveRangeContaining(DefIdx
);
599 if (DLR
&& DLR
->valno
->copy
== CopyMI
)
600 DLR
->valno
->copy
= NULL
;
604 // If copy kills the source register, find the last use and propagate
606 MachineBasicBlock
*MBB
= CopyMI
->getParent();
607 if (CopyMI
->killsRegister(SrcInt
.reg
))
608 TrimLiveIntervalToLastUse(CopyIdx
, MBB
, SrcInt
, SrcLR
);
610 MachineBasicBlock::iterator MII
= next(MachineBasicBlock::iterator(CopyMI
));
611 CopyMI
->removeFromParent();
612 tii_
->reMaterialize(*MBB
, MII
, DstReg
, DefMI
);
613 MachineInstr
*NewMI
= prior(MII
);
614 // CopyMI may have implicit operands, transfer them over to the newly
615 // rematerialized instruction. And update implicit def interval valnos.
616 for (unsigned i
= CopyMI
->getDesc().getNumOperands(),
617 e
= CopyMI
->getNumOperands(); i
!= e
; ++i
) {
618 MachineOperand
&MO
= CopyMI
->getOperand(i
);
619 if (MO
.isReg() && MO
.isImplicit())
620 NewMI
->addOperand(MO
);
621 if (MO
.isDef() && li_
->hasInterval(MO
.getReg())) {
622 unsigned Reg
= MO
.getReg();
623 DLR
= li_
->getInterval(Reg
).getLiveRangeContaining(DefIdx
);
624 if (DLR
&& DLR
->valno
->copy
== CopyMI
)
625 DLR
->valno
->copy
= NULL
;
629 li_
->ReplaceMachineInstrInMaps(CopyMI
, NewMI
);
630 MBB
->getParent()->DeleteMachineInstr(CopyMI
);
631 ReMatCopies
.insert(CopyMI
);
632 ReMatDefs
.insert(DefMI
);
637 /// isBackEdgeCopy - Returns true if CopyMI is a back edge copy.
639 bool SimpleRegisterCoalescing::isBackEdgeCopy(MachineInstr
*CopyMI
,
640 unsigned DstReg
) const {
641 MachineBasicBlock
*MBB
= CopyMI
->getParent();
642 const MachineLoop
*L
= loopInfo
->getLoopFor(MBB
);
645 if (MBB
!= L
->getLoopLatch())
648 LiveInterval
&LI
= li_
->getInterval(DstReg
);
649 unsigned DefIdx
= li_
->getInstructionIndex(CopyMI
);
650 LiveInterval::const_iterator DstLR
=
651 LI
.FindLiveRangeContaining(li_
->getDefIndex(DefIdx
));
652 if (DstLR
== LI
.end())
654 unsigned KillIdx
= li_
->getMBBEndIdx(MBB
) + 1;
655 if (DstLR
->valno
->kills
.size() == 1 &&
656 DstLR
->valno
->kills
[0] == KillIdx
&& DstLR
->valno
->hasPHIKill
)
661 /// UpdateRegDefsUses - Replace all defs and uses of SrcReg to DstReg and
662 /// update the subregister number if it is not zero. If DstReg is a
663 /// physical register and the existing subregister number of the def / use
664 /// being updated is not zero, make sure to set it to the correct physical
667 SimpleRegisterCoalescing::UpdateRegDefsUses(unsigned SrcReg
, unsigned DstReg
,
669 bool DstIsPhys
= TargetRegisterInfo::isPhysicalRegister(DstReg
);
670 if (DstIsPhys
&& SubIdx
) {
671 // Figure out the real physical register we are updating with.
672 DstReg
= tri_
->getSubReg(DstReg
, SubIdx
);
676 for (MachineRegisterInfo::reg_iterator I
= mri_
->reg_begin(SrcReg
),
677 E
= mri_
->reg_end(); I
!= E
; ) {
678 MachineOperand
&O
= I
.getOperand();
679 MachineInstr
*UseMI
= &*I
;
681 unsigned OldSubIdx
= O
.getSubReg();
683 unsigned UseDstReg
= DstReg
;
685 UseDstReg
= tri_
->getSubReg(DstReg
, OldSubIdx
);
687 unsigned CopySrcReg
, CopyDstReg
, CopySrcSubIdx
, CopyDstSubIdx
;
688 if (tii_
->isMoveInstr(*UseMI
, CopySrcReg
, CopyDstReg
,
689 CopySrcSubIdx
, CopyDstSubIdx
) &&
690 CopySrcReg
!= CopyDstReg
&&
691 CopySrcReg
== SrcReg
&& CopyDstReg
!= UseDstReg
) {
692 // If the use is a copy and it won't be coalesced away, and its source
693 // is defined by a trivial computation, try to rematerialize it instead.
694 if (ReMaterializeTrivialDef(li_
->getInterval(SrcReg
), CopyDstReg
,UseMI
))
703 // Sub-register indexes goes from small to large. e.g.
704 // RAX: 1 -> AL, 2 -> AX, 3 -> EAX
705 // EAX: 1 -> AL, 2 -> AX
706 // So RAX's sub-register 2 is AX, RAX's sub-regsiter 3 is EAX, whose
707 // sub-register 2 is also AX.
708 if (SubIdx
&& OldSubIdx
&& SubIdx
!= OldSubIdx
)
709 assert(OldSubIdx
< SubIdx
&& "Conflicting sub-register index!");
712 // Remove would-be duplicated kill marker.
713 if (O
.isKill() && UseMI
->killsRegister(DstReg
))
717 // After updating the operand, check if the machine instruction has
718 // become a copy. If so, update its val# information.
719 const TargetInstrDesc
&TID
= UseMI
->getDesc();
720 unsigned CopySrcReg
, CopyDstReg
, CopySrcSubIdx
, CopyDstSubIdx
;
721 if (TID
.getNumDefs() == 1 && TID
.getNumOperands() > 2 &&
722 tii_
->isMoveInstr(*UseMI
, CopySrcReg
, CopyDstReg
,
723 CopySrcSubIdx
, CopyDstSubIdx
) &&
724 CopySrcReg
!= CopyDstReg
&&
725 (TargetRegisterInfo::isVirtualRegister(CopyDstReg
) ||
726 allocatableRegs_
[CopyDstReg
])) {
727 LiveInterval
&LI
= li_
->getInterval(CopyDstReg
);
728 unsigned DefIdx
= li_
->getDefIndex(li_
->getInstructionIndex(UseMI
));
729 const LiveRange
*DLR
= LI
.getLiveRangeContaining(DefIdx
);
730 if (DLR
->valno
->def
== DefIdx
)
731 DLR
->valno
->copy
= UseMI
;
736 /// RemoveDeadImpDef - Remove implicit_def instructions which are "re-defining"
737 /// registers due to insert_subreg coalescing. e.g.
739 /// r1025 = implicit_def
740 /// r1025 = insert_subreg r1025, r1024
744 /// r1025 = implicit_def
745 /// r1025 = insert_subreg r1025, r1025
748 SimpleRegisterCoalescing::RemoveDeadImpDef(unsigned Reg
, LiveInterval
&LI
) {
749 for (MachineRegisterInfo::reg_iterator I
= mri_
->reg_begin(Reg
),
750 E
= mri_
->reg_end(); I
!= E
; ) {
751 MachineOperand
&O
= I
.getOperand();
752 MachineInstr
*DefMI
= &*I
;
756 if (DefMI
->getOpcode() != TargetInstrInfo::IMPLICIT_DEF
)
758 if (!LI
.liveBeforeAndAt(li_
->getInstructionIndex(DefMI
)))
760 li_
->RemoveMachineInstrFromMaps(DefMI
);
761 DefMI
->eraseFromParent();
765 /// RemoveUnnecessaryKills - Remove kill markers that are no longer accurate
766 /// due to live range lengthening as the result of coalescing.
767 void SimpleRegisterCoalescing::RemoveUnnecessaryKills(unsigned Reg
,
769 for (MachineRegisterInfo::use_iterator UI
= mri_
->use_begin(Reg
),
770 UE
= mri_
->use_end(); UI
!= UE
; ++UI
) {
771 MachineOperand
&UseMO
= UI
.getOperand();
772 if (UseMO
.isKill()) {
773 MachineInstr
*UseMI
= UseMO
.getParent();
774 unsigned UseIdx
= li_
->getUseIndex(li_
->getInstructionIndex(UseMI
));
775 if (JoinedCopies
.count(UseMI
))
777 const LiveRange
*UI
= LI
.getLiveRangeContaining(UseIdx
);
778 if (!UI
|| !LI
.isKill(UI
->valno
, UseIdx
+1))
779 UseMO
.setIsKill(false);
784 /// removeIntervalIfEmpty - Check if the live interval of a physical register
785 /// is empty, if so remove it and also remove the empty intervals of its
786 /// sub-registers. Return true if live interval is removed.
787 static bool removeIntervalIfEmpty(LiveInterval
&li
, LiveIntervals
*li_
,
788 const TargetRegisterInfo
*tri_
) {
790 if (TargetRegisterInfo::isPhysicalRegister(li
.reg
))
791 for (const unsigned* SR
= tri_
->getSubRegisters(li
.reg
); *SR
; ++SR
) {
792 if (!li_
->hasInterval(*SR
))
794 LiveInterval
&sli
= li_
->getInterval(*SR
);
796 li_
->removeInterval(*SR
);
798 li_
->removeInterval(li
.reg
);
804 /// ShortenDeadCopyLiveRange - Shorten a live range defined by a dead copy.
805 /// Return true if live interval is removed.
806 bool SimpleRegisterCoalescing::ShortenDeadCopyLiveRange(LiveInterval
&li
,
807 MachineInstr
*CopyMI
) {
808 unsigned CopyIdx
= li_
->getInstructionIndex(CopyMI
);
809 LiveInterval::iterator MLR
=
810 li
.FindLiveRangeContaining(li_
->getDefIndex(CopyIdx
));
812 return false; // Already removed by ShortenDeadCopySrcLiveRange.
813 unsigned RemoveStart
= MLR
->start
;
814 unsigned RemoveEnd
= MLR
->end
;
815 // Remove the liverange that's defined by this.
816 if (RemoveEnd
== li_
->getDefIndex(CopyIdx
)+1) {
817 removeRange(li
, RemoveStart
, RemoveEnd
, li_
, tri_
);
818 return removeIntervalIfEmpty(li
, li_
, tri_
);
823 /// RemoveDeadDef - If a def of a live interval is now determined dead, remove
824 /// the val# it defines. If the live interval becomes empty, remove it as well.
825 bool SimpleRegisterCoalescing::RemoveDeadDef(LiveInterval
&li
,
826 MachineInstr
*DefMI
) {
827 unsigned DefIdx
= li_
->getDefIndex(li_
->getInstructionIndex(DefMI
));
828 LiveInterval::iterator MLR
= li
.FindLiveRangeContaining(DefIdx
);
829 if (DefIdx
!= MLR
->valno
->def
)
831 li
.removeValNo(MLR
->valno
);
832 return removeIntervalIfEmpty(li
, li_
, tri_
);
835 /// PropagateDeadness - Propagate the dead marker to the instruction which
836 /// defines the val#.
837 static void PropagateDeadness(LiveInterval
&li
, MachineInstr
*CopyMI
,
838 unsigned &LRStart
, LiveIntervals
*li_
,
839 const TargetRegisterInfo
* tri_
) {
840 MachineInstr
*DefMI
=
841 li_
->getInstructionFromIndex(li_
->getDefIndex(LRStart
));
842 if (DefMI
&& DefMI
!= CopyMI
) {
843 int DeadIdx
= DefMI
->findRegisterDefOperandIdx(li
.reg
, false, tri_
);
845 DefMI
->getOperand(DeadIdx
).setIsDead();
846 // A dead def should have a single cycle interval.
852 /// ShortenDeadCopySrcLiveRange - Shorten a live range as it's artificially
853 /// extended by a dead copy. Mark the last use (if any) of the val# as kill as
854 /// ends the live range there. If there isn't another use, then this live range
855 /// is dead. Return true if live interval is removed.
857 SimpleRegisterCoalescing::ShortenDeadCopySrcLiveRange(LiveInterval
&li
,
858 MachineInstr
*CopyMI
) {
859 unsigned CopyIdx
= li_
->getInstructionIndex(CopyMI
);
861 // FIXME: special case: function live in. It can be a general case if the
862 // first instruction index starts at > 0 value.
863 assert(TargetRegisterInfo::isPhysicalRegister(li
.reg
));
864 // Live-in to the function but dead. Remove it from entry live-in set.
865 if (mf_
->begin()->isLiveIn(li
.reg
))
866 mf_
->begin()->removeLiveIn(li
.reg
);
867 const LiveRange
*LR
= li
.getLiveRangeContaining(CopyIdx
);
868 removeRange(li
, LR
->start
, LR
->end
, li_
, tri_
);
869 return removeIntervalIfEmpty(li
, li_
, tri_
);
872 LiveInterval::iterator LR
= li
.FindLiveRangeContaining(CopyIdx
-1);
874 // Livein but defined by a phi.
877 unsigned RemoveStart
= LR
->start
;
878 unsigned RemoveEnd
= li_
->getDefIndex(CopyIdx
)+1;
879 if (LR
->end
> RemoveEnd
)
880 // More uses past this copy? Nothing to do.
883 // If there is a last use in the same bb, we can't remove the live range.
884 // Shorten the live interval and return.
885 MachineBasicBlock
*CopyMBB
= CopyMI
->getParent();
886 if (TrimLiveIntervalToLastUse(CopyIdx
, CopyMBB
, li
, LR
))
889 MachineBasicBlock
*StartMBB
= li_
->getMBBFromIndex(RemoveStart
);
890 if (!isSameOrFallThroughBB(StartMBB
, CopyMBB
, tii_
))
891 // If the live range starts in another mbb and the copy mbb is not a fall
892 // through mbb, then we can only cut the range from the beginning of the
894 RemoveStart
= li_
->getMBBStartIdx(CopyMBB
) + 1;
896 if (LR
->valno
->def
== RemoveStart
) {
897 // If the def MI defines the val# and this copy is the only kill of the
898 // val#, then propagate the dead marker.
899 if (li
.isOnlyLROfValNo(LR
)) {
900 PropagateDeadness(li
, CopyMI
, RemoveStart
, li_
, tri_
);
903 if (li
.isKill(LR
->valno
, RemoveEnd
))
904 li
.removeKill(LR
->valno
, RemoveEnd
);
907 removeRange(li
, RemoveStart
, RemoveEnd
, li_
, tri_
);
908 return removeIntervalIfEmpty(li
, li_
, tri_
);
911 /// CanCoalesceWithImpDef - Returns true if the specified copy instruction
912 /// from an implicit def to another register can be coalesced away.
913 bool SimpleRegisterCoalescing::CanCoalesceWithImpDef(MachineInstr
*CopyMI
,
915 LiveInterval
&ImpLi
) const{
916 if (!CopyMI
->killsRegister(ImpLi
.reg
))
918 unsigned CopyIdx
= li_
->getDefIndex(li_
->getInstructionIndex(CopyMI
));
919 LiveInterval::iterator LR
= li
.FindLiveRangeContaining(CopyIdx
);
922 if (LR
->valno
->hasPHIKill
)
924 if (LR
->valno
->def
!= CopyIdx
)
926 // Make sure all of val# uses are copies.
927 for (MachineRegisterInfo::use_iterator UI
= mri_
->use_begin(li
.reg
),
928 UE
= mri_
->use_end(); UI
!= UE
;) {
929 MachineInstr
*UseMI
= &*UI
;
931 if (JoinedCopies
.count(UseMI
))
933 unsigned UseIdx
= li_
->getUseIndex(li_
->getInstructionIndex(UseMI
));
934 LiveInterval::iterator ULR
= li
.FindLiveRangeContaining(UseIdx
);
935 if (ULR
== li
.end() || ULR
->valno
!= LR
->valno
)
937 // If the use is not a use, then it's not safe to coalesce the move.
938 unsigned SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
;
939 if (!tii_
->isMoveInstr(*UseMI
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
)) {
940 if (UseMI
->getOpcode() == TargetInstrInfo::INSERT_SUBREG
&&
941 UseMI
->getOperand(1).getReg() == li
.reg
)
950 /// RemoveCopiesFromValNo - The specified value# is defined by an implicit
951 /// def and it is being removed. Turn all copies from this value# into
952 /// identity copies so they will be removed.
953 void SimpleRegisterCoalescing::RemoveCopiesFromValNo(LiveInterval
&li
,
955 SmallVector
<MachineInstr
*, 4> ImpDefs
;
956 MachineOperand
*LastUse
= NULL
;
957 unsigned LastUseIdx
= li_
->getUseIndex(VNI
->def
);
958 for (MachineRegisterInfo::reg_iterator RI
= mri_
->reg_begin(li
.reg
),
959 RE
= mri_
->reg_end(); RI
!= RE
;) {
960 MachineOperand
*MO
= &RI
.getOperand();
961 MachineInstr
*MI
= &*RI
;
964 if (MI
->getOpcode() == TargetInstrInfo::IMPLICIT_DEF
) {
965 ImpDefs
.push_back(MI
);
969 if (JoinedCopies
.count(MI
))
971 unsigned UseIdx
= li_
->getUseIndex(li_
->getInstructionIndex(MI
));
972 LiveInterval::iterator ULR
= li
.FindLiveRangeContaining(UseIdx
);
973 if (ULR
== li
.end() || ULR
->valno
!= VNI
)
975 // If the use is a copy, turn it into an identity copy.
976 unsigned SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
;
977 if (tii_
->isMoveInstr(*MI
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
) &&
979 // Each use MI may have multiple uses of this register. Change them all.
980 for (unsigned i
= 0, e
= MI
->getNumOperands(); i
!= e
; ++i
) {
981 MachineOperand
&MO
= MI
->getOperand(i
);
982 if (MO
.isReg() && MO
.getReg() == li
.reg
)
985 JoinedCopies
.insert(MI
);
986 } else if (UseIdx
> LastUseIdx
) {
992 LastUse
->setIsKill();
993 li
.addKill(VNI
, LastUseIdx
+1);
995 // Remove dead implicit_def's.
996 while (!ImpDefs
.empty()) {
997 MachineInstr
*ImpDef
= ImpDefs
.back();
999 li_
->RemoveMachineInstrFromMaps(ImpDef
);
1000 ImpDef
->eraseFromParent();
1005 /// getMatchingSuperReg - Return a super-register of the specified register
1006 /// Reg so its sub-register of index SubIdx is Reg.
1007 static unsigned getMatchingSuperReg(unsigned Reg
, unsigned SubIdx
,
1008 const TargetRegisterClass
*RC
,
1009 const TargetRegisterInfo
* TRI
) {
1010 for (const unsigned *SRs
= TRI
->getSuperRegisters(Reg
);
1011 unsigned SR
= *SRs
; ++SRs
)
1012 if (Reg
== TRI
->getSubReg(SR
, SubIdx
) && RC
->contains(SR
))
1017 /// isWinToJoinCrossClass - Return true if it's profitable to coalesce
1018 /// two virtual registers from different register classes.
1020 SimpleRegisterCoalescing::isWinToJoinCrossClass(unsigned LargeReg
,
1022 unsigned Threshold
) {
1023 // Then make sure the intervals are *short*.
1024 LiveInterval
&LargeInt
= li_
->getInterval(LargeReg
);
1025 LiveInterval
&SmallInt
= li_
->getInterval(SmallReg
);
1026 unsigned LargeSize
= li_
->getApproximateInstructionCount(LargeInt
);
1027 unsigned SmallSize
= li_
->getApproximateInstructionCount(SmallInt
);
1028 if (SmallSize
> Threshold
|| LargeSize
> Threshold
)
1029 if ((float)std::distance(mri_
->use_begin(SmallReg
),
1030 mri_
->use_end()) / SmallSize
<
1031 (float)std::distance(mri_
->use_begin(LargeReg
),
1032 mri_
->use_end()) / LargeSize
)
1037 /// HasIncompatibleSubRegDefUse - If we are trying to coalesce a virtual
1038 /// register with a physical register, check if any of the virtual register
1039 /// operand is a sub-register use or def. If so, make sure it won't result
1040 /// in an illegal extract_subreg or insert_subreg instruction. e.g.
1041 /// vr1024 = extract_subreg vr1025, 1
1043 /// vr1024 = mov8rr AH
1044 /// If vr1024 is coalesced with AH, the extract_subreg is now illegal since
1045 /// AH does not have a super-reg whose sub-register 1 is AH.
1047 SimpleRegisterCoalescing::HasIncompatibleSubRegDefUse(MachineInstr
*CopyMI
,
1050 for (MachineRegisterInfo::reg_iterator I
= mri_
->reg_begin(VirtReg
),
1051 E
= mri_
->reg_end(); I
!= E
; ++I
) {
1052 MachineOperand
&O
= I
.getOperand();
1053 MachineInstr
*MI
= &*I
;
1054 if (MI
== CopyMI
|| JoinedCopies
.count(MI
))
1056 unsigned SubIdx
= O
.getSubReg();
1057 if (SubIdx
&& !tri_
->getSubReg(PhysReg
, SubIdx
))
1059 if (MI
->getOpcode() == TargetInstrInfo::EXTRACT_SUBREG
) {
1060 SubIdx
= MI
->getOperand(2).getImm();
1061 if (O
.isUse() && !tri_
->getSubReg(PhysReg
, SubIdx
))
1064 unsigned SrcReg
= MI
->getOperand(1).getReg();
1065 const TargetRegisterClass
*RC
=
1066 TargetRegisterInfo::isPhysicalRegister(SrcReg
)
1067 ? tri_
->getPhysicalRegisterRegClass(SrcReg
)
1068 : mri_
->getRegClass(SrcReg
);
1069 if (!getMatchingSuperReg(PhysReg
, SubIdx
, RC
, tri_
))
1073 if (MI
->getOpcode() == TargetInstrInfo::INSERT_SUBREG
||
1074 MI
->getOpcode() == TargetInstrInfo::SUBREG_TO_REG
) {
1075 SubIdx
= MI
->getOperand(3).getImm();
1076 if (VirtReg
== MI
->getOperand(0).getReg()) {
1077 if (!tri_
->getSubReg(PhysReg
, SubIdx
))
1080 unsigned DstReg
= MI
->getOperand(0).getReg();
1081 const TargetRegisterClass
*RC
=
1082 TargetRegisterInfo::isPhysicalRegister(DstReg
)
1083 ? tri_
->getPhysicalRegisterRegClass(DstReg
)
1084 : mri_
->getRegClass(DstReg
);
1085 if (!getMatchingSuperReg(PhysReg
, SubIdx
, RC
, tri_
))
1094 /// CanJoinExtractSubRegToPhysReg - Return true if it's possible to coalesce
1095 /// an extract_subreg where dst is a physical register, e.g.
1096 /// cl = EXTRACT_SUBREG reg1024, 1
1098 SimpleRegisterCoalescing::CanJoinExtractSubRegToPhysReg(unsigned DstReg
,
1099 unsigned SrcReg
, unsigned SubIdx
,
1100 unsigned &RealDstReg
) {
1101 const TargetRegisterClass
*RC
= mri_
->getRegClass(SrcReg
);
1102 RealDstReg
= getMatchingSuperReg(DstReg
, SubIdx
, RC
, tri_
);
1103 assert(RealDstReg
&& "Invalid extract_subreg instruction!");
1105 // For this type of EXTRACT_SUBREG, conservatively
1106 // check if the live interval of the source register interfere with the
1107 // actual super physical register we are trying to coalesce with.
1108 LiveInterval
&RHS
= li_
->getInterval(SrcReg
);
1109 if (li_
->hasInterval(RealDstReg
) &&
1110 RHS
.overlaps(li_
->getInterval(RealDstReg
))) {
1111 DOUT
<< "Interfere with register ";
1112 DEBUG(li_
->getInterval(RealDstReg
).print(DOUT
, tri_
));
1113 return false; // Not coalescable
1115 for (const unsigned* SR
= tri_
->getSubRegisters(RealDstReg
); *SR
; ++SR
)
1116 if (li_
->hasInterval(*SR
) && RHS
.overlaps(li_
->getInterval(*SR
))) {
1117 DOUT
<< "Interfere with sub-register ";
1118 DEBUG(li_
->getInterval(*SR
).print(DOUT
, tri_
));
1119 return false; // Not coalescable
1124 /// CanJoinInsertSubRegToPhysReg - Return true if it's possible to coalesce
1125 /// an insert_subreg where src is a physical register, e.g.
1126 /// reg1024 = INSERT_SUBREG reg1024, c1, 0
1128 SimpleRegisterCoalescing::CanJoinInsertSubRegToPhysReg(unsigned DstReg
,
1129 unsigned SrcReg
, unsigned SubIdx
,
1130 unsigned &RealSrcReg
) {
1131 const TargetRegisterClass
*RC
= mri_
->getRegClass(DstReg
);
1132 RealSrcReg
= getMatchingSuperReg(SrcReg
, SubIdx
, RC
, tri_
);
1133 assert(RealSrcReg
&& "Invalid extract_subreg instruction!");
1135 LiveInterval
&RHS
= li_
->getInterval(DstReg
);
1136 if (li_
->hasInterval(RealSrcReg
) &&
1137 RHS
.overlaps(li_
->getInterval(RealSrcReg
))) {
1138 DOUT
<< "Interfere with register ";
1139 DEBUG(li_
->getInterval(RealSrcReg
).print(DOUT
, tri_
));
1140 return false; // Not coalescable
1142 for (const unsigned* SR
= tri_
->getSubRegisters(RealSrcReg
); *SR
; ++SR
)
1143 if (li_
->hasInterval(*SR
) && RHS
.overlaps(li_
->getInterval(*SR
))) {
1144 DOUT
<< "Interfere with sub-register ";
1145 DEBUG(li_
->getInterval(*SR
).print(DOUT
, tri_
));
1146 return false; // Not coalescable
1151 /// JoinCopy - Attempt to join intervals corresponding to SrcReg/DstReg,
1152 /// which are the src/dst of the copy instruction CopyMI. This returns true
1153 /// if the copy was successfully coalesced away. If it is not currently
1154 /// possible to coalesce this interval, but it may be possible if other
1155 /// things get coalesced, then it returns true by reference in 'Again'.
1156 bool SimpleRegisterCoalescing::JoinCopy(CopyRec
&TheCopy
, bool &Again
) {
1157 MachineInstr
*CopyMI
= TheCopy
.MI
;
1160 if (JoinedCopies
.count(CopyMI
) || ReMatCopies
.count(CopyMI
))
1161 return false; // Already done.
1163 DOUT
<< li_
->getInstructionIndex(CopyMI
) << '\t' << *CopyMI
;
1165 unsigned SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
;
1166 bool isExtSubReg
= CopyMI
->getOpcode() == TargetInstrInfo::EXTRACT_SUBREG
;
1167 bool isInsSubReg
= CopyMI
->getOpcode() == TargetInstrInfo::INSERT_SUBREG
;
1168 bool isSubRegToReg
= CopyMI
->getOpcode() == TargetInstrInfo::SUBREG_TO_REG
;
1169 unsigned SubIdx
= 0;
1171 DstReg
= CopyMI
->getOperand(0).getReg();
1172 SrcReg
= CopyMI
->getOperand(1).getReg();
1173 } else if (isInsSubReg
|| isSubRegToReg
) {
1174 if (CopyMI
->getOperand(2).getSubReg()) {
1175 DOUT
<< "\tSource of insert_subreg is already coalesced "
1176 << "to another register.\n";
1177 return false; // Not coalescable.
1179 DstReg
= CopyMI
->getOperand(0).getReg();
1180 SrcReg
= CopyMI
->getOperand(2).getReg();
1181 } else if (!tii_
->isMoveInstr(*CopyMI
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
)){
1182 assert(0 && "Unrecognized copy instruction!");
1186 // If they are already joined we continue.
1187 if (SrcReg
== DstReg
) {
1188 DOUT
<< "\tCopy already coalesced.\n";
1189 return false; // Not coalescable.
1192 bool SrcIsPhys
= TargetRegisterInfo::isPhysicalRegister(SrcReg
);
1193 bool DstIsPhys
= TargetRegisterInfo::isPhysicalRegister(DstReg
);
1195 // If they are both physical registers, we cannot join them.
1196 if (SrcIsPhys
&& DstIsPhys
) {
1197 DOUT
<< "\tCan not coalesce physregs.\n";
1198 return false; // Not coalescable.
1201 // We only join virtual registers with allocatable physical registers.
1202 if (SrcIsPhys
&& !allocatableRegs_
[SrcReg
]) {
1203 DOUT
<< "\tSrc reg is unallocatable physreg.\n";
1204 return false; // Not coalescable.
1206 if (DstIsPhys
&& !allocatableRegs_
[DstReg
]) {
1207 DOUT
<< "\tDst reg is unallocatable physreg.\n";
1208 return false; // Not coalescable.
1211 // Should be non-null only when coalescing to a sub-register class.
1212 bool CrossRC
= false;
1213 const TargetRegisterClass
*NewRC
= NULL
;
1214 MachineBasicBlock
*CopyMBB
= CopyMI
->getParent();
1215 unsigned RealDstReg
= 0;
1216 unsigned RealSrcReg
= 0;
1217 if (isExtSubReg
|| isInsSubReg
|| isSubRegToReg
) {
1218 SubIdx
= CopyMI
->getOperand(isExtSubReg
? 2 : 3).getImm();
1219 if (SrcIsPhys
&& isExtSubReg
) {
1220 // r1024 = EXTRACT_SUBREG EAX, 0 then r1024 is really going to be
1221 // coalesced with AX.
1222 unsigned DstSubIdx
= CopyMI
->getOperand(0).getSubReg();
1224 // r1024<2> = EXTRACT_SUBREG EAX, 2. Then r1024 has already been
1225 // coalesced to a larger register so the subreg indices cancel out.
1226 if (DstSubIdx
!= SubIdx
) {
1227 DOUT
<< "\t Sub-register indices mismatch.\n";
1228 return false; // Not coalescable.
1231 SrcReg
= tri_
->getSubReg(SrcReg
, SubIdx
);
1233 } else if (DstIsPhys
&& (isInsSubReg
|| isSubRegToReg
)) {
1234 // EAX = INSERT_SUBREG EAX, r1024, 0
1235 unsigned SrcSubIdx
= CopyMI
->getOperand(2).getSubReg();
1237 // EAX = INSERT_SUBREG EAX, r1024<2>, 2 Then r1024 has already been
1238 // coalesced to a larger register so the subreg indices cancel out.
1239 if (SrcSubIdx
!= SubIdx
) {
1240 DOUT
<< "\t Sub-register indices mismatch.\n";
1241 return false; // Not coalescable.
1244 DstReg
= tri_
->getSubReg(DstReg
, SubIdx
);
1246 } else if ((DstIsPhys
&& isExtSubReg
) ||
1247 (SrcIsPhys
&& (isInsSubReg
|| isSubRegToReg
))) {
1248 if (!isSubRegToReg
&& CopyMI
->getOperand(1).getSubReg()) {
1249 DOUT
<< "\tSrc of extract_subreg already coalesced with reg"
1250 << " of a super-class.\n";
1251 return false; // Not coalescable.
1255 if (!CanJoinExtractSubRegToPhysReg(DstReg
, SrcReg
, SubIdx
, RealDstReg
))
1256 return false; // Not coalescable
1258 if (!CanJoinInsertSubRegToPhysReg(DstReg
, SrcReg
, SubIdx
, RealSrcReg
))
1259 return false; // Not coalescable
1263 unsigned OldSubIdx
= isExtSubReg
? CopyMI
->getOperand(0).getSubReg()
1264 : CopyMI
->getOperand(2).getSubReg();
1266 if (OldSubIdx
== SubIdx
&& !differingRegisterClasses(SrcReg
, DstReg
))
1267 // r1024<2> = EXTRACT_SUBREG r1025, 2. Then r1024 has already been
1268 // coalesced to a larger register so the subreg indices cancel out.
1269 // Also check if the other larger register is of the same register
1270 // class as the would be resulting register.
1273 DOUT
<< "\t Sub-register indices mismatch.\n";
1274 return false; // Not coalescable.
1278 unsigned LargeReg
= isExtSubReg
? SrcReg
: DstReg
;
1279 unsigned SmallReg
= isExtSubReg
? DstReg
: SrcReg
;
1280 unsigned Limit
= allocatableRCRegs_
[mri_
->getRegClass(SmallReg
)].count();
1281 if (!isWinToJoinCrossClass(LargeReg
, SmallReg
, Limit
)) {
1282 Again
= true; // May be possible to coalesce later.
1287 } else if (differingRegisterClasses(SrcReg
, DstReg
)) {
1288 if (!CrossClassJoin
)
1292 // FIXME: What if the result of a EXTRACT_SUBREG is then coalesced
1293 // with another? If it's the resulting destination register, then
1294 // the subidx must be propagated to uses (but only those defined
1295 // by the EXTRACT_SUBREG). If it's being coalesced into another
1296 // register, it should be safe because register is assumed to have
1297 // the register class of the super-register.
1299 // Process moves where one of the registers have a sub-register index.
1300 MachineOperand
*DstMO
= CopyMI
->findRegisterDefOperand(DstReg
);
1301 MachineOperand
*SrcMO
= CopyMI
->findRegisterUseOperand(SrcReg
);
1302 SubIdx
= DstMO
->getSubReg();
1304 if (SrcMO
->getSubReg())
1305 // FIXME: can we handle this?
1307 // This is not an insert_subreg but it looks like one.
1308 // e.g. %reg1024:4 = MOV32rr %EAX
1311 if (!CanJoinInsertSubRegToPhysReg(DstReg
, SrcReg
, SubIdx
, RealSrcReg
))
1312 return false; // Not coalescable
1316 SubIdx
= SrcMO
->getSubReg();
1318 // This is not a extract_subreg but it looks like one.
1319 // e.g. %cl = MOV16rr %reg1024:1
1322 if (!CanJoinExtractSubRegToPhysReg(DstReg
, SrcReg
, SubIdx
,RealDstReg
))
1323 return false; // Not coalescable
1329 const TargetRegisterClass
*SrcRC
= SrcIsPhys
? 0 : mri_
->getRegClass(SrcReg
);
1330 const TargetRegisterClass
*DstRC
= DstIsPhys
? 0 : mri_
->getRegClass(DstReg
);
1331 unsigned LargeReg
= SrcReg
;
1332 unsigned SmallReg
= DstReg
;
1335 // Now determine the register class of the joined register.
1337 if (SubIdx
&& DstRC
&& DstRC
->isASubClass()) {
1338 // This is a move to a sub-register class. However, the source is a
1339 // sub-register of a larger register class. We don't know what should
1340 // the register class be. FIXME.
1344 Limit
= allocatableRCRegs_
[DstRC
].count();
1345 } else if (!SrcIsPhys
&& !DstIsPhys
) {
1346 unsigned SrcSize
= SrcRC
->getSize();
1347 unsigned DstSize
= DstRC
->getSize();
1348 if (SrcSize
< DstSize
)
1349 // For example X86::MOVSD2PDrr copies from FR64 to VR128.
1351 else if (DstSize
> SrcSize
) {
1353 std::swap(LargeReg
, SmallReg
);
1355 unsigned SrcNumRegs
= SrcRC
->getNumRegs();
1356 unsigned DstNumRegs
= DstRC
->getNumRegs();
1357 if (DstNumRegs
< SrcNumRegs
)
1358 // Sub-register class?
1360 else if (SrcNumRegs
< DstNumRegs
) {
1362 std::swap(LargeReg
, SmallReg
);
1364 // No idea what's the right register class to use.
1369 // If we are joining two virtual registers and the resulting register
1370 // class is more restrictive (fewer register, smaller size). Check if it's
1371 // worth doing the merge.
1372 if (!SrcIsPhys
&& !DstIsPhys
&&
1373 (isExtSubReg
|| DstRC
->isASubClass()) &&
1374 !isWinToJoinCrossClass(LargeReg
, SmallReg
,
1375 allocatableRCRegs_
[NewRC
].count())) {
1376 DOUT
<< "\tSrc/Dest are different register classes.\n";
1377 // Allow the coalescer to try again in case either side gets coalesced to
1378 // a physical register that's compatible with the other side. e.g.
1379 // r1024 = MOV32to32_ r1025
1380 // But later r1024 is assigned EAX then r1025 may be coalesced with EAX.
1381 Again
= true; // May be possible to coalesce later.
1386 // Will it create illegal extract_subreg / insert_subreg?
1387 if (SrcIsPhys
&& HasIncompatibleSubRegDefUse(CopyMI
, DstReg
, SrcReg
))
1389 if (DstIsPhys
&& HasIncompatibleSubRegDefUse(CopyMI
, SrcReg
, DstReg
))
1392 LiveInterval
&SrcInt
= li_
->getInterval(SrcReg
);
1393 LiveInterval
&DstInt
= li_
->getInterval(DstReg
);
1394 assert(SrcInt
.reg
== SrcReg
&& DstInt
.reg
== DstReg
&&
1395 "Register mapping is horribly broken!");
1397 DOUT
<< "\t\tInspecting "; SrcInt
.print(DOUT
, tri_
);
1398 DOUT
<< " and "; DstInt
.print(DOUT
, tri_
);
1401 // Save a copy of the virtual register live interval. We'll manually
1402 // merge this into the "real" physical register live interval this is
1404 LiveInterval
*SavedLI
= 0;
1406 SavedLI
= li_
->dupInterval(&SrcInt
);
1407 else if (RealSrcReg
)
1408 SavedLI
= li_
->dupInterval(&DstInt
);
1410 // Check if it is necessary to propagate "isDead" property.
1411 if (!isExtSubReg
&& !isInsSubReg
&& !isSubRegToReg
) {
1412 MachineOperand
*mopd
= CopyMI
->findRegisterDefOperand(DstReg
, false);
1413 bool isDead
= mopd
->isDead();
1415 // We need to be careful about coalescing a source physical register with a
1416 // virtual register. Once the coalescing is done, it cannot be broken and
1417 // these are not spillable! If the destination interval uses are far away,
1418 // think twice about coalescing them!
1419 if (!isDead
&& (SrcIsPhys
|| DstIsPhys
)) {
1420 LiveInterval
&JoinVInt
= SrcIsPhys
? DstInt
: SrcInt
;
1421 unsigned JoinVReg
= SrcIsPhys
? DstReg
: SrcReg
;
1422 unsigned JoinPReg
= SrcIsPhys
? SrcReg
: DstReg
;
1423 const TargetRegisterClass
*RC
= mri_
->getRegClass(JoinVReg
);
1424 unsigned Threshold
= allocatableRCRegs_
[RC
].count() * 2;
1425 if (TheCopy
.isBackEdge
)
1426 Threshold
*= 2; // Favors back edge copies.
1428 // If the virtual register live interval is long but it has low use desity,
1429 // do not join them, instead mark the physical register as its allocation
1431 unsigned Length
= li_
->getApproximateInstructionCount(JoinVInt
);
1432 if (Length
> Threshold
&&
1433 (((float)std::distance(mri_
->use_begin(JoinVReg
), mri_
->use_end())
1434 / Length
) < (1.0 / Threshold
))) {
1435 JoinVInt
.preference
= JoinPReg
;
1437 DOUT
<< "\tMay tie down a physical register, abort!\n";
1438 Again
= true; // May be possible to coalesce later.
1444 // Okay, attempt to join these two intervals. On failure, this returns false.
1445 // Otherwise, if one of the intervals being joined is a physreg, this method
1446 // always canonicalizes DstInt to be it. The output "SrcInt" will not have
1447 // been modified, so we can use this information below to update aliases.
1448 bool Swapped
= false;
1449 // If SrcInt is implicitly defined, it's safe to coalesce.
1450 bool isEmpty
= SrcInt
.empty();
1451 if (isEmpty
&& !CanCoalesceWithImpDef(CopyMI
, DstInt
, SrcInt
)) {
1452 // Only coalesce an empty interval (defined by implicit_def) with
1453 // another interval which has a valno defined by the CopyMI and the CopyMI
1454 // is a kill of the implicit def.
1455 DOUT
<< "Not profitable!\n";
1459 if (!isEmpty
&& !JoinIntervals(DstInt
, SrcInt
, Swapped
)) {
1460 // Coalescing failed.
1462 // If definition of source is defined by trivial computation, try
1463 // rematerializing it.
1464 if (!isExtSubReg
&& !isInsSubReg
&& !isSubRegToReg
&&
1465 ReMaterializeTrivialDef(SrcInt
, DstInt
.reg
, CopyMI
))
1468 // If we can eliminate the copy without merging the live ranges, do so now.
1469 if (!isExtSubReg
&& !isInsSubReg
&& !isSubRegToReg
&&
1470 (AdjustCopiesBackFrom(SrcInt
, DstInt
, CopyMI
) ||
1471 RemoveCopyByCommutingDef(SrcInt
, DstInt
, CopyMI
))) {
1472 JoinedCopies
.insert(CopyMI
);
1476 // Otherwise, we are unable to join the intervals.
1477 DOUT
<< "Interference!\n";
1478 Again
= true; // May be possible to coalesce later.
1482 LiveInterval
*ResSrcInt
= &SrcInt
;
1483 LiveInterval
*ResDstInt
= &DstInt
;
1485 std::swap(SrcReg
, DstReg
);
1486 std::swap(ResSrcInt
, ResDstInt
);
1488 assert(TargetRegisterInfo::isVirtualRegister(SrcReg
) &&
1489 "LiveInterval::join didn't work right!");
1491 // If we're about to merge live ranges into a physical register live interval,
1492 // we have to update any aliased register's live ranges to indicate that they
1493 // have clobbered values for this range.
1494 if (TargetRegisterInfo::isPhysicalRegister(DstReg
)) {
1495 // If this is a extract_subreg where dst is a physical register, e.g.
1496 // cl = EXTRACT_SUBREG reg1024, 1
1497 // then create and update the actual physical register allocated to RHS.
1498 if (RealDstReg
|| RealSrcReg
) {
1499 LiveInterval
&RealInt
=
1500 li_
->getOrCreateInterval(RealDstReg
? RealDstReg
: RealSrcReg
);
1501 for (LiveInterval::const_vni_iterator I
= SavedLI
->vni_begin(),
1502 E
= SavedLI
->vni_end(); I
!= E
; ++I
) {
1503 const VNInfo
*ValNo
= *I
;
1504 VNInfo
*NewValNo
= RealInt
.getNextValue(ValNo
->def
, ValNo
->copy
,
1505 li_
->getVNInfoAllocator());
1506 NewValNo
->hasPHIKill
= ValNo
->hasPHIKill
;
1507 NewValNo
->redefByEC
= ValNo
->redefByEC
;
1508 RealInt
.addKills(NewValNo
, ValNo
->kills
);
1509 RealInt
.MergeValueInAsValue(*SavedLI
, ValNo
, NewValNo
);
1511 RealInt
.weight
+= SavedLI
->weight
;
1512 DstReg
= RealDstReg
? RealDstReg
: RealSrcReg
;
1515 // Update the liveintervals of sub-registers.
1516 for (const unsigned *AS
= tri_
->getSubRegisters(DstReg
); *AS
; ++AS
)
1517 li_
->getOrCreateInterval(*AS
).MergeInClobberRanges(*ResSrcInt
,
1518 li_
->getVNInfoAllocator());
1521 // If this is a EXTRACT_SUBREG, make sure the result of coalescing is the
1522 // larger super-register.
1523 if ((isExtSubReg
|| isInsSubReg
|| isSubRegToReg
) &&
1524 !SrcIsPhys
&& !DstIsPhys
) {
1525 if ((isExtSubReg
&& !Swapped
) ||
1526 ((isInsSubReg
|| isSubRegToReg
) && Swapped
)) {
1527 ResSrcInt
->Copy(*ResDstInt
, li_
->getVNInfoAllocator());
1528 std::swap(SrcReg
, DstReg
);
1529 std::swap(ResSrcInt
, ResDstInt
);
1533 // Coalescing to a virtual register that is of a sub-register class of the
1534 // other. Make sure the resulting register is set to the right register class.
1538 mri_
->setRegClass(DstReg
, NewRC
);
1542 // Add all copies that define val# in the source interval into the queue.
1543 for (LiveInterval::const_vni_iterator i
= ResSrcInt
->vni_begin(),
1544 e
= ResSrcInt
->vni_end(); i
!= e
; ++i
) {
1545 const VNInfo
*vni
= *i
;
1546 if (!vni
->def
|| vni
->def
== ~1U || vni
->def
== ~0U)
1548 MachineInstr
*CopyMI
= li_
->getInstructionFromIndex(vni
->def
);
1549 unsigned NewSrcReg
, NewDstReg
, NewSrcSubIdx
, NewDstSubIdx
;
1551 JoinedCopies
.count(CopyMI
) == 0 &&
1552 tii_
->isMoveInstr(*CopyMI
, NewSrcReg
, NewDstReg
,
1553 NewSrcSubIdx
, NewDstSubIdx
)) {
1554 unsigned LoopDepth
= loopInfo
->getLoopDepth(CopyMBB
);
1555 JoinQueue
->push(CopyRec(CopyMI
, LoopDepth
,
1556 isBackEdgeCopy(CopyMI
, DstReg
)));
1561 // Remember to delete the copy instruction.
1562 JoinedCopies
.insert(CopyMI
);
1564 // Some live range has been lengthened due to colaescing, eliminate the
1565 // unnecessary kills.
1566 RemoveUnnecessaryKills(SrcReg
, *ResDstInt
);
1567 if (TargetRegisterInfo::isVirtualRegister(DstReg
))
1568 RemoveUnnecessaryKills(DstReg
, *ResDstInt
);
1573 // r1024 = implicit_def
1576 RemoveDeadImpDef(DstReg
, *ResDstInt
);
1577 UpdateRegDefsUses(SrcReg
, DstReg
, SubIdx
);
1579 // SrcReg is guarateed to be the register whose live interval that is
1581 li_
->removeInterval(SrcReg
);
1583 // Manually deleted the live interval copy.
1590 // Now the copy is being coalesced away, the val# previously defined
1591 // by the copy is being defined by an IMPLICIT_DEF which defines a zero
1592 // length interval. Remove the val#.
1593 unsigned CopyIdx
= li_
->getDefIndex(li_
->getInstructionIndex(CopyMI
));
1594 const LiveRange
*LR
= ResDstInt
->getLiveRangeContaining(CopyIdx
);
1595 VNInfo
*ImpVal
= LR
->valno
;
1596 assert(ImpVal
->def
== CopyIdx
);
1597 unsigned NextDef
= LR
->end
;
1598 RemoveCopiesFromValNo(*ResDstInt
, ImpVal
);
1599 ResDstInt
->removeValNo(ImpVal
);
1600 LR
= ResDstInt
->FindLiveRangeContaining(NextDef
);
1601 if (LR
!= ResDstInt
->end() && LR
->valno
->def
== NextDef
) {
1602 // Special case: vr1024 = implicit_def
1603 // vr1024 = insert_subreg vr1024, vr1025, c
1604 // The insert_subreg becomes a "copy" that defines a val# which can itself
1605 // be coalesced away.
1606 MachineInstr
*DefMI
= li_
->getInstructionFromIndex(NextDef
);
1607 if (DefMI
->getOpcode() == TargetInstrInfo::INSERT_SUBREG
)
1608 LR
->valno
->copy
= DefMI
;
1612 // If resulting interval has a preference that no longer fits because of subreg
1613 // coalescing, just clear the preference.
1614 if (ResDstInt
->preference
&& (isExtSubReg
|| isInsSubReg
|| isSubRegToReg
) &&
1615 TargetRegisterInfo::isVirtualRegister(ResDstInt
->reg
)) {
1616 const TargetRegisterClass
*RC
= mri_
->getRegClass(ResDstInt
->reg
);
1617 if (!RC
->contains(ResDstInt
->preference
))
1618 ResDstInt
->preference
= 0;
1621 DOUT
<< "\n\t\tJoined. Result = "; ResDstInt
->print(DOUT
, tri_
);
1628 /// ComputeUltimateVN - Assuming we are going to join two live intervals,
1629 /// compute what the resultant value numbers for each value in the input two
1630 /// ranges will be. This is complicated by copies between the two which can
1631 /// and will commonly cause multiple value numbers to be merged into one.
1633 /// VN is the value number that we're trying to resolve. InstDefiningValue
1634 /// keeps track of the new InstDefiningValue assignment for the result
1635 /// LiveInterval. ThisFromOther/OtherFromThis are sets that keep track of
1636 /// whether a value in this or other is a copy from the opposite set.
1637 /// ThisValNoAssignments/OtherValNoAssignments keep track of value #'s that have
1638 /// already been assigned.
1640 /// ThisFromOther[x] - If x is defined as a copy from the other interval, this
1641 /// contains the value number the copy is from.
1643 static unsigned ComputeUltimateVN(VNInfo
*VNI
,
1644 SmallVector
<VNInfo
*, 16> &NewVNInfo
,
1645 DenseMap
<VNInfo
*, VNInfo
*> &ThisFromOther
,
1646 DenseMap
<VNInfo
*, VNInfo
*> &OtherFromThis
,
1647 SmallVector
<int, 16> &ThisValNoAssignments
,
1648 SmallVector
<int, 16> &OtherValNoAssignments
) {
1649 unsigned VN
= VNI
->id
;
1651 // If the VN has already been computed, just return it.
1652 if (ThisValNoAssignments
[VN
] >= 0)
1653 return ThisValNoAssignments
[VN
];
1654 // assert(ThisValNoAssignments[VN] != -2 && "Cyclic case?");
1656 // If this val is not a copy from the other val, then it must be a new value
1657 // number in the destination.
1658 DenseMap
<VNInfo
*, VNInfo
*>::iterator I
= ThisFromOther
.find(VNI
);
1659 if (I
== ThisFromOther
.end()) {
1660 NewVNInfo
.push_back(VNI
);
1661 return ThisValNoAssignments
[VN
] = NewVNInfo
.size()-1;
1663 VNInfo
*OtherValNo
= I
->second
;
1665 // Otherwise, this *is* a copy from the RHS. If the other side has already
1666 // been computed, return it.
1667 if (OtherValNoAssignments
[OtherValNo
->id
] >= 0)
1668 return ThisValNoAssignments
[VN
] = OtherValNoAssignments
[OtherValNo
->id
];
1670 // Mark this value number as currently being computed, then ask what the
1671 // ultimate value # of the other value is.
1672 ThisValNoAssignments
[VN
] = -2;
1673 unsigned UltimateVN
=
1674 ComputeUltimateVN(OtherValNo
, NewVNInfo
, OtherFromThis
, ThisFromOther
,
1675 OtherValNoAssignments
, ThisValNoAssignments
);
1676 return ThisValNoAssignments
[VN
] = UltimateVN
;
1679 static bool InVector(VNInfo
*Val
, const SmallVector
<VNInfo
*, 8> &V
) {
1680 return std::find(V
.begin(), V
.end(), Val
) != V
.end();
1683 /// RangeIsDefinedByCopyFromReg - Return true if the specified live range of
1684 /// the specified live interval is defined by a copy from the specified
1686 bool SimpleRegisterCoalescing::RangeIsDefinedByCopyFromReg(LiveInterval
&li
,
1689 unsigned SrcReg
= li_
->getVNInfoSourceReg(LR
->valno
);
1692 if (LR
->valno
->def
== ~0U &&
1693 TargetRegisterInfo::isPhysicalRegister(li
.reg
) &&
1694 *tri_
->getSuperRegisters(li
.reg
)) {
1695 // It's a sub-register live interval, we may not have precise information.
1697 MachineInstr
*DefMI
= li_
->getInstructionFromIndex(LR
->start
);
1698 unsigned SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
;
1700 tii_
->isMoveInstr(*DefMI
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
) &&
1701 DstReg
== li
.reg
&& SrcReg
== Reg
) {
1702 // Cache computed info.
1703 LR
->valno
->def
= LR
->start
;
1704 LR
->valno
->copy
= DefMI
;
1711 /// SimpleJoin - Attempt to joint the specified interval into this one. The
1712 /// caller of this method must guarantee that the RHS only contains a single
1713 /// value number and that the RHS is not defined by a copy from this
1714 /// interval. This returns false if the intervals are not joinable, or it
1715 /// joins them and returns true.
1716 bool SimpleRegisterCoalescing::SimpleJoin(LiveInterval
&LHS
, LiveInterval
&RHS
){
1717 assert(RHS
.containsOneValue());
1719 // Some number (potentially more than one) value numbers in the current
1720 // interval may be defined as copies from the RHS. Scan the overlapping
1721 // portions of the LHS and RHS, keeping track of this and looking for
1722 // overlapping live ranges that are NOT defined as copies. If these exist, we
1725 LiveInterval::iterator LHSIt
= LHS
.begin(), LHSEnd
= LHS
.end();
1726 LiveInterval::iterator RHSIt
= RHS
.begin(), RHSEnd
= RHS
.end();
1728 if (LHSIt
->start
< RHSIt
->start
) {
1729 LHSIt
= std::upper_bound(LHSIt
, LHSEnd
, RHSIt
->start
);
1730 if (LHSIt
!= LHS
.begin()) --LHSIt
;
1731 } else if (RHSIt
->start
< LHSIt
->start
) {
1732 RHSIt
= std::upper_bound(RHSIt
, RHSEnd
, LHSIt
->start
);
1733 if (RHSIt
!= RHS
.begin()) --RHSIt
;
1736 SmallVector
<VNInfo
*, 8> EliminatedLHSVals
;
1739 // Determine if these live intervals overlap.
1740 bool Overlaps
= false;
1741 if (LHSIt
->start
<= RHSIt
->start
)
1742 Overlaps
= LHSIt
->end
> RHSIt
->start
;
1744 Overlaps
= RHSIt
->end
> LHSIt
->start
;
1746 // If the live intervals overlap, there are two interesting cases: if the
1747 // LHS interval is defined by a copy from the RHS, it's ok and we record
1748 // that the LHS value # is the same as the RHS. If it's not, then we cannot
1749 // coalesce these live ranges and we bail out.
1751 // If we haven't already recorded that this value # is safe, check it.
1752 if (!InVector(LHSIt
->valno
, EliminatedLHSVals
)) {
1753 // Copy from the RHS?
1754 if (!RangeIsDefinedByCopyFromReg(LHS
, LHSIt
, RHS
.reg
))
1755 return false; // Nope, bail out.
1757 if (LHSIt
->contains(RHSIt
->valno
->def
))
1758 // Here is an interesting situation:
1760 // vr1025 = copy vr1024
1765 // Even though vr1025 is copied from vr1024, it's not safe to
1766 // coalesce them since the live range of vr1025 intersects the
1767 // def of vr1024. This happens because vr1025 is assigned the
1768 // value of the previous iteration of vr1024.
1770 EliminatedLHSVals
.push_back(LHSIt
->valno
);
1773 // We know this entire LHS live range is okay, so skip it now.
1774 if (++LHSIt
== LHSEnd
) break;
1778 if (LHSIt
->end
< RHSIt
->end
) {
1779 if (++LHSIt
== LHSEnd
) break;
1781 // One interesting case to check here. It's possible that we have
1782 // something like "X3 = Y" which defines a new value number in the LHS,
1783 // and is the last use of this liverange of the RHS. In this case, we
1784 // want to notice this copy (so that it gets coalesced away) even though
1785 // the live ranges don't actually overlap.
1786 if (LHSIt
->start
== RHSIt
->end
) {
1787 if (InVector(LHSIt
->valno
, EliminatedLHSVals
)) {
1788 // We already know that this value number is going to be merged in
1789 // if coalescing succeeds. Just skip the liverange.
1790 if (++LHSIt
== LHSEnd
) break;
1792 // Otherwise, if this is a copy from the RHS, mark it as being merged
1794 if (RangeIsDefinedByCopyFromReg(LHS
, LHSIt
, RHS
.reg
)) {
1795 if (LHSIt
->contains(RHSIt
->valno
->def
))
1796 // Here is an interesting situation:
1798 // vr1025 = copy vr1024
1803 // Even though vr1025 is copied from vr1024, it's not safe to
1804 // coalesced them since live range of vr1025 intersects the
1805 // def of vr1024. This happens because vr1025 is assigned the
1806 // value of the previous iteration of vr1024.
1808 EliminatedLHSVals
.push_back(LHSIt
->valno
);
1810 // We know this entire LHS live range is okay, so skip it now.
1811 if (++LHSIt
== LHSEnd
) break;
1816 if (++RHSIt
== RHSEnd
) break;
1820 // If we got here, we know that the coalescing will be successful and that
1821 // the value numbers in EliminatedLHSVals will all be merged together. Since
1822 // the most common case is that EliminatedLHSVals has a single number, we
1823 // optimize for it: if there is more than one value, we merge them all into
1824 // the lowest numbered one, then handle the interval as if we were merging
1825 // with one value number.
1826 VNInfo
*LHSValNo
= NULL
;
1827 if (EliminatedLHSVals
.size() > 1) {
1828 // Loop through all the equal value numbers merging them into the smallest
1830 VNInfo
*Smallest
= EliminatedLHSVals
[0];
1831 for (unsigned i
= 1, e
= EliminatedLHSVals
.size(); i
!= e
; ++i
) {
1832 if (EliminatedLHSVals
[i
]->id
< Smallest
->id
) {
1833 // Merge the current notion of the smallest into the smaller one.
1834 LHS
.MergeValueNumberInto(Smallest
, EliminatedLHSVals
[i
]);
1835 Smallest
= EliminatedLHSVals
[i
];
1837 // Merge into the smallest.
1838 LHS
.MergeValueNumberInto(EliminatedLHSVals
[i
], Smallest
);
1841 LHSValNo
= Smallest
;
1842 } else if (EliminatedLHSVals
.empty()) {
1843 if (TargetRegisterInfo::isPhysicalRegister(LHS
.reg
) &&
1844 *tri_
->getSuperRegisters(LHS
.reg
))
1845 // Imprecise sub-register information. Can't handle it.
1847 assert(0 && "No copies from the RHS?");
1849 LHSValNo
= EliminatedLHSVals
[0];
1852 // Okay, now that there is a single LHS value number that we're merging the
1853 // RHS into, update the value number info for the LHS to indicate that the
1854 // value number is defined where the RHS value number was.
1855 const VNInfo
*VNI
= RHS
.getValNumInfo(0);
1856 LHSValNo
->def
= VNI
->def
;
1857 LHSValNo
->copy
= VNI
->copy
;
1859 // Okay, the final step is to loop over the RHS live intervals, adding them to
1861 LHSValNo
->hasPHIKill
|= VNI
->hasPHIKill
;
1862 LHS
.addKills(LHSValNo
, VNI
->kills
);
1863 LHS
.MergeRangesInAsValue(RHS
, LHSValNo
);
1864 LHS
.weight
+= RHS
.weight
;
1865 if (RHS
.preference
&& !LHS
.preference
)
1866 LHS
.preference
= RHS
.preference
;
1868 // Update the liveintervals of sub-registers.
1869 if (TargetRegisterInfo::isPhysicalRegister(LHS
.reg
))
1870 for (const unsigned *AS
= tri_
->getSubRegisters(LHS
.reg
); *AS
; ++AS
)
1871 li_
->getOrCreateInterval(*AS
).MergeInClobberRanges(LHS
,
1872 li_
->getVNInfoAllocator());
1877 /// JoinIntervals - Attempt to join these two intervals. On failure, this
1878 /// returns false. Otherwise, if one of the intervals being joined is a
1879 /// physreg, this method always canonicalizes LHS to be it. The output
1880 /// "RHS" will not have been modified, so we can use this information
1881 /// below to update aliases.
1883 SimpleRegisterCoalescing::JoinIntervals(LiveInterval
&LHS
, LiveInterval
&RHS
,
1885 // Compute the final value assignment, assuming that the live ranges can be
1887 SmallVector
<int, 16> LHSValNoAssignments
;
1888 SmallVector
<int, 16> RHSValNoAssignments
;
1889 DenseMap
<VNInfo
*, VNInfo
*> LHSValsDefinedFromRHS
;
1890 DenseMap
<VNInfo
*, VNInfo
*> RHSValsDefinedFromLHS
;
1891 SmallVector
<VNInfo
*, 16> NewVNInfo
;
1893 // If a live interval is a physical register, conservatively check if any
1894 // of its sub-registers is overlapping the live interval of the virtual
1895 // register. If so, do not coalesce.
1896 if (TargetRegisterInfo::isPhysicalRegister(LHS
.reg
) &&
1897 *tri_
->getSubRegisters(LHS
.reg
)) {
1898 // If it's coalescing a virtual register to a physical register, estimate
1899 // its live interval length. This is the *cost* of scanning an entire live
1900 // interval. If the cost is low, we'll do an exhaustive check instead.
1902 // If this is something like this:
1910 // That is, the live interval of v1024 crosses a bb. Then we can't rely on
1911 // less conservative check. It's possible a sub-register is defined before
1912 // v1024 (or live in) and live out of BB1.
1913 if (RHS
.containsOneValue() &&
1914 li_
->intervalIsInOneMBB(RHS
) &&
1915 li_
->getApproximateInstructionCount(RHS
) <= 10) {
1916 // Perform a more exhaustive check for some common cases.
1917 if (li_
->conflictsWithPhysRegRef(RHS
, LHS
.reg
, true, JoinedCopies
))
1920 for (const unsigned* SR
= tri_
->getSubRegisters(LHS
.reg
); *SR
; ++SR
)
1921 if (li_
->hasInterval(*SR
) && RHS
.overlaps(li_
->getInterval(*SR
))) {
1922 DOUT
<< "Interfere with sub-register ";
1923 DEBUG(li_
->getInterval(*SR
).print(DOUT
, tri_
));
1927 } else if (TargetRegisterInfo::isPhysicalRegister(RHS
.reg
) &&
1928 *tri_
->getSubRegisters(RHS
.reg
)) {
1929 if (LHS
.containsOneValue() &&
1930 li_
->getApproximateInstructionCount(LHS
) <= 10) {
1931 // Perform a more exhaustive check for some common cases.
1932 if (li_
->conflictsWithPhysRegRef(LHS
, RHS
.reg
, false, JoinedCopies
))
1935 for (const unsigned* SR
= tri_
->getSubRegisters(RHS
.reg
); *SR
; ++SR
)
1936 if (li_
->hasInterval(*SR
) && LHS
.overlaps(li_
->getInterval(*SR
))) {
1937 DOUT
<< "Interfere with sub-register ";
1938 DEBUG(li_
->getInterval(*SR
).print(DOUT
, tri_
));
1944 // Compute ultimate value numbers for the LHS and RHS values.
1945 if (RHS
.containsOneValue()) {
1946 // Copies from a liveinterval with a single value are simple to handle and
1947 // very common, handle the special case here. This is important, because
1948 // often RHS is small and LHS is large (e.g. a physreg).
1950 // Find out if the RHS is defined as a copy from some value in the LHS.
1951 int RHSVal0DefinedFromLHS
= -1;
1953 VNInfo
*RHSValNoInfo
= NULL
;
1954 VNInfo
*RHSValNoInfo0
= RHS
.getValNumInfo(0);
1955 unsigned RHSSrcReg
= li_
->getVNInfoSourceReg(RHSValNoInfo0
);
1956 if (RHSSrcReg
== 0 || RHSSrcReg
!= LHS
.reg
) {
1957 // If RHS is not defined as a copy from the LHS, we can use simpler and
1958 // faster checks to see if the live ranges are coalescable. This joiner
1959 // can't swap the LHS/RHS intervals though.
1960 if (!TargetRegisterInfo::isPhysicalRegister(RHS
.reg
)) {
1961 return SimpleJoin(LHS
, RHS
);
1963 RHSValNoInfo
= RHSValNoInfo0
;
1966 // It was defined as a copy from the LHS, find out what value # it is.
1967 RHSValNoInfo
= LHS
.getLiveRangeContaining(RHSValNoInfo0
->def
-1)->valno
;
1968 RHSValID
= RHSValNoInfo
->id
;
1969 RHSVal0DefinedFromLHS
= RHSValID
;
1972 LHSValNoAssignments
.resize(LHS
.getNumValNums(), -1);
1973 RHSValNoAssignments
.resize(RHS
.getNumValNums(), -1);
1974 NewVNInfo
.resize(LHS
.getNumValNums(), NULL
);
1976 // Okay, *all* of the values in LHS that are defined as a copy from RHS
1977 // should now get updated.
1978 for (LiveInterval::vni_iterator i
= LHS
.vni_begin(), e
= LHS
.vni_end();
1981 unsigned VN
= VNI
->id
;
1982 if (unsigned LHSSrcReg
= li_
->getVNInfoSourceReg(VNI
)) {
1983 if (LHSSrcReg
!= RHS
.reg
) {
1984 // If this is not a copy from the RHS, its value number will be
1985 // unmodified by the coalescing.
1986 NewVNInfo
[VN
] = VNI
;
1987 LHSValNoAssignments
[VN
] = VN
;
1988 } else if (RHSValID
== -1) {
1989 // Otherwise, it is a copy from the RHS, and we don't already have a
1990 // value# for it. Keep the current value number, but remember it.
1991 LHSValNoAssignments
[VN
] = RHSValID
= VN
;
1992 NewVNInfo
[VN
] = RHSValNoInfo
;
1993 LHSValsDefinedFromRHS
[VNI
] = RHSValNoInfo0
;
1995 // Otherwise, use the specified value #.
1996 LHSValNoAssignments
[VN
] = RHSValID
;
1997 if (VN
== (unsigned)RHSValID
) { // Else this val# is dead.
1998 NewVNInfo
[VN
] = RHSValNoInfo
;
1999 LHSValsDefinedFromRHS
[VNI
] = RHSValNoInfo0
;
2003 NewVNInfo
[VN
] = VNI
;
2004 LHSValNoAssignments
[VN
] = VN
;
2008 assert(RHSValID
!= -1 && "Didn't find value #?");
2009 RHSValNoAssignments
[0] = RHSValID
;
2010 if (RHSVal0DefinedFromLHS
!= -1) {
2011 // This path doesn't go through ComputeUltimateVN so just set
2013 RHSValsDefinedFromLHS
[RHSValNoInfo0
] = (VNInfo
*)1;
2016 // Loop over the value numbers of the LHS, seeing if any are defined from
2018 for (LiveInterval::vni_iterator i
= LHS
.vni_begin(), e
= LHS
.vni_end();
2021 if (VNI
->def
== ~1U || VNI
->copy
== 0) // Src not defined by a copy?
2024 // DstReg is known to be a register in the LHS interval. If the src is
2025 // from the RHS interval, we can use its value #.
2026 if (li_
->getVNInfoSourceReg(VNI
) != RHS
.reg
)
2029 // Figure out the value # from the RHS.
2030 LHSValsDefinedFromRHS
[VNI
]=RHS
.getLiveRangeContaining(VNI
->def
-1)->valno
;
2033 // Loop over the value numbers of the RHS, seeing if any are defined from
2035 for (LiveInterval::vni_iterator i
= RHS
.vni_begin(), e
= RHS
.vni_end();
2038 if (VNI
->def
== ~1U || VNI
->copy
== 0) // Src not defined by a copy?
2041 // DstReg is known to be a register in the RHS interval. If the src is
2042 // from the LHS interval, we can use its value #.
2043 if (li_
->getVNInfoSourceReg(VNI
) != LHS
.reg
)
2046 // Figure out the value # from the LHS.
2047 RHSValsDefinedFromLHS
[VNI
]=LHS
.getLiveRangeContaining(VNI
->def
-1)->valno
;
2050 LHSValNoAssignments
.resize(LHS
.getNumValNums(), -1);
2051 RHSValNoAssignments
.resize(RHS
.getNumValNums(), -1);
2052 NewVNInfo
.reserve(LHS
.getNumValNums() + RHS
.getNumValNums());
2054 for (LiveInterval::vni_iterator i
= LHS
.vni_begin(), e
= LHS
.vni_end();
2057 unsigned VN
= VNI
->id
;
2058 if (LHSValNoAssignments
[VN
] >= 0 || VNI
->def
== ~1U)
2060 ComputeUltimateVN(VNI
, NewVNInfo
,
2061 LHSValsDefinedFromRHS
, RHSValsDefinedFromLHS
,
2062 LHSValNoAssignments
, RHSValNoAssignments
);
2064 for (LiveInterval::vni_iterator i
= RHS
.vni_begin(), e
= RHS
.vni_end();
2067 unsigned VN
= VNI
->id
;
2068 if (RHSValNoAssignments
[VN
] >= 0 || VNI
->def
== ~1U)
2070 // If this value number isn't a copy from the LHS, it's a new number.
2071 if (RHSValsDefinedFromLHS
.find(VNI
) == RHSValsDefinedFromLHS
.end()) {
2072 NewVNInfo
.push_back(VNI
);
2073 RHSValNoAssignments
[VN
] = NewVNInfo
.size()-1;
2077 ComputeUltimateVN(VNI
, NewVNInfo
,
2078 RHSValsDefinedFromLHS
, LHSValsDefinedFromRHS
,
2079 RHSValNoAssignments
, LHSValNoAssignments
);
2083 // Armed with the mappings of LHS/RHS values to ultimate values, walk the
2084 // interval lists to see if these intervals are coalescable.
2085 LiveInterval::const_iterator I
= LHS
.begin();
2086 LiveInterval::const_iterator IE
= LHS
.end();
2087 LiveInterval::const_iterator J
= RHS
.begin();
2088 LiveInterval::const_iterator JE
= RHS
.end();
2090 // Skip ahead until the first place of potential sharing.
2091 if (I
->start
< J
->start
) {
2092 I
= std::upper_bound(I
, IE
, J
->start
);
2093 if (I
!= LHS
.begin()) --I
;
2094 } else if (J
->start
< I
->start
) {
2095 J
= std::upper_bound(J
, JE
, I
->start
);
2096 if (J
!= RHS
.begin()) --J
;
2100 // Determine if these two live ranges overlap.
2102 if (I
->start
< J
->start
) {
2103 Overlaps
= I
->end
> J
->start
;
2105 Overlaps
= J
->end
> I
->start
;
2108 // If so, check value # info to determine if they are really different.
2110 // If the live range overlap will map to the same value number in the
2111 // result liverange, we can still coalesce them. If not, we can't.
2112 if (LHSValNoAssignments
[I
->valno
->id
] !=
2113 RHSValNoAssignments
[J
->valno
->id
])
2117 if (I
->end
< J
->end
) {
2126 // Update kill info. Some live ranges are extended due to copy coalescing.
2127 for (DenseMap
<VNInfo
*, VNInfo
*>::iterator I
= LHSValsDefinedFromRHS
.begin(),
2128 E
= LHSValsDefinedFromRHS
.end(); I
!= E
; ++I
) {
2129 VNInfo
*VNI
= I
->first
;
2130 unsigned LHSValID
= LHSValNoAssignments
[VNI
->id
];
2131 LiveInterval::removeKill(NewVNInfo
[LHSValID
], VNI
->def
);
2132 NewVNInfo
[LHSValID
]->hasPHIKill
|= VNI
->hasPHIKill
;
2133 RHS
.addKills(NewVNInfo
[LHSValID
], VNI
->kills
);
2136 // Update kill info. Some live ranges are extended due to copy coalescing.
2137 for (DenseMap
<VNInfo
*, VNInfo
*>::iterator I
= RHSValsDefinedFromLHS
.begin(),
2138 E
= RHSValsDefinedFromLHS
.end(); I
!= E
; ++I
) {
2139 VNInfo
*VNI
= I
->first
;
2140 unsigned RHSValID
= RHSValNoAssignments
[VNI
->id
];
2141 LiveInterval::removeKill(NewVNInfo
[RHSValID
], VNI
->def
);
2142 NewVNInfo
[RHSValID
]->hasPHIKill
|= VNI
->hasPHIKill
;
2143 LHS
.addKills(NewVNInfo
[RHSValID
], VNI
->kills
);
2146 // If we get here, we know that we can coalesce the live ranges. Ask the
2147 // intervals to coalesce themselves now.
2148 if ((RHS
.ranges
.size() > LHS
.ranges
.size() &&
2149 TargetRegisterInfo::isVirtualRegister(LHS
.reg
)) ||
2150 TargetRegisterInfo::isPhysicalRegister(RHS
.reg
)) {
2151 RHS
.join(LHS
, &RHSValNoAssignments
[0], &LHSValNoAssignments
[0], NewVNInfo
);
2154 LHS
.join(RHS
, &LHSValNoAssignments
[0], &RHSValNoAssignments
[0], NewVNInfo
);
2161 // DepthMBBCompare - Comparison predicate that sort first based on the loop
2162 // depth of the basic block (the unsigned), and then on the MBB number.
2163 struct DepthMBBCompare
{
2164 typedef std::pair
<unsigned, MachineBasicBlock
*> DepthMBBPair
;
2165 bool operator()(const DepthMBBPair
&LHS
, const DepthMBBPair
&RHS
) const {
2166 if (LHS
.first
> RHS
.first
) return true; // Deeper loops first
2167 return LHS
.first
== RHS
.first
&&
2168 LHS
.second
->getNumber() < RHS
.second
->getNumber();
2173 /// getRepIntervalSize - Returns the size of the interval that represents the
2174 /// specified register.
2176 unsigned JoinPriorityQueue
<SF
>::getRepIntervalSize(unsigned Reg
) {
2177 return Rc
->getRepIntervalSize(Reg
);
2180 /// CopyRecSort::operator - Join priority queue sorting function.
2182 bool CopyRecSort::operator()(CopyRec left
, CopyRec right
) const {
2183 // Inner loops first.
2184 if (left
.LoopDepth
> right
.LoopDepth
)
2186 else if (left
.LoopDepth
== right
.LoopDepth
)
2187 if (left
.isBackEdge
&& !right
.isBackEdge
)
2192 void SimpleRegisterCoalescing::CopyCoalesceInMBB(MachineBasicBlock
*MBB
,
2193 std::vector
<CopyRec
> &TryAgain
) {
2194 DOUT
<< ((Value
*)MBB
->getBasicBlock())->getName() << ":\n";
2196 std::vector
<CopyRec
> VirtCopies
;
2197 std::vector
<CopyRec
> PhysCopies
;
2198 std::vector
<CopyRec
> ImpDefCopies
;
2199 unsigned LoopDepth
= loopInfo
->getLoopDepth(MBB
);
2200 for (MachineBasicBlock::iterator MII
= MBB
->begin(), E
= MBB
->end();
2202 MachineInstr
*Inst
= MII
++;
2204 // If this isn't a copy nor a extract_subreg, we can't join intervals.
2205 unsigned SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
;
2206 if (Inst
->getOpcode() == TargetInstrInfo::EXTRACT_SUBREG
) {
2207 DstReg
= Inst
->getOperand(0).getReg();
2208 SrcReg
= Inst
->getOperand(1).getReg();
2209 } else if (Inst
->getOpcode() == TargetInstrInfo::INSERT_SUBREG
||
2210 Inst
->getOpcode() == TargetInstrInfo::SUBREG_TO_REG
) {
2211 DstReg
= Inst
->getOperand(0).getReg();
2212 SrcReg
= Inst
->getOperand(2).getReg();
2213 } else if (!tii_
->isMoveInstr(*Inst
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
))
2216 bool SrcIsPhys
= TargetRegisterInfo::isPhysicalRegister(SrcReg
);
2217 bool DstIsPhys
= TargetRegisterInfo::isPhysicalRegister(DstReg
);
2219 JoinQueue
->push(CopyRec(Inst
, LoopDepth
, isBackEdgeCopy(Inst
, DstReg
)));
2221 if (li_
->hasInterval(SrcReg
) && li_
->getInterval(SrcReg
).empty())
2222 ImpDefCopies
.push_back(CopyRec(Inst
, 0, false));
2223 else if (SrcIsPhys
|| DstIsPhys
)
2224 PhysCopies
.push_back(CopyRec(Inst
, 0, false));
2226 VirtCopies
.push_back(CopyRec(Inst
, 0, false));
2233 // Try coalescing implicit copies first, followed by copies to / from
2234 // physical registers, then finally copies from virtual registers to
2235 // virtual registers.
2236 for (unsigned i
= 0, e
= ImpDefCopies
.size(); i
!= e
; ++i
) {
2237 CopyRec
&TheCopy
= ImpDefCopies
[i
];
2239 if (!JoinCopy(TheCopy
, Again
))
2241 TryAgain
.push_back(TheCopy
);
2243 for (unsigned i
= 0, e
= PhysCopies
.size(); i
!= e
; ++i
) {
2244 CopyRec
&TheCopy
= PhysCopies
[i
];
2246 if (!JoinCopy(TheCopy
, Again
))
2248 TryAgain
.push_back(TheCopy
);
2250 for (unsigned i
= 0, e
= VirtCopies
.size(); i
!= e
; ++i
) {
2251 CopyRec
&TheCopy
= VirtCopies
[i
];
2253 if (!JoinCopy(TheCopy
, Again
))
2255 TryAgain
.push_back(TheCopy
);
2259 void SimpleRegisterCoalescing::joinIntervals() {
2260 DOUT
<< "********** JOINING INTERVALS ***********\n";
2263 JoinQueue
= new JoinPriorityQueue
<CopyRecSort
>(this);
2265 std::vector
<CopyRec
> TryAgainList
;
2266 if (loopInfo
->empty()) {
2267 // If there are no loops in the function, join intervals in function order.
2268 for (MachineFunction::iterator I
= mf_
->begin(), E
= mf_
->end();
2270 CopyCoalesceInMBB(I
, TryAgainList
);
2272 // Otherwise, join intervals in inner loops before other intervals.
2273 // Unfortunately we can't just iterate over loop hierarchy here because
2274 // there may be more MBB's than BB's. Collect MBB's for sorting.
2276 // Join intervals in the function prolog first. We want to join physical
2277 // registers with virtual registers before the intervals got too long.
2278 std::vector
<std::pair
<unsigned, MachineBasicBlock
*> > MBBs
;
2279 for (MachineFunction::iterator I
= mf_
->begin(), E
= mf_
->end();I
!= E
;++I
){
2280 MachineBasicBlock
*MBB
= I
;
2281 MBBs
.push_back(std::make_pair(loopInfo
->getLoopDepth(MBB
), I
));
2284 // Sort by loop depth.
2285 std::sort(MBBs
.begin(), MBBs
.end(), DepthMBBCompare());
2287 // Finally, join intervals in loop nest order.
2288 for (unsigned i
= 0, e
= MBBs
.size(); i
!= e
; ++i
)
2289 CopyCoalesceInMBB(MBBs
[i
].second
, TryAgainList
);
2292 // Joining intervals can allow other intervals to be joined. Iteratively join
2293 // until we make no progress.
2295 SmallVector
<CopyRec
, 16> TryAgain
;
2296 bool ProgressMade
= true;
2297 while (ProgressMade
) {
2298 ProgressMade
= false;
2299 while (!JoinQueue
->empty()) {
2300 CopyRec R
= JoinQueue
->pop();
2302 bool Success
= JoinCopy(R
, Again
);
2304 ProgressMade
= true;
2306 TryAgain
.push_back(R
);
2310 while (!TryAgain
.empty()) {
2311 JoinQueue
->push(TryAgain
.back());
2312 TryAgain
.pop_back();
2317 bool ProgressMade
= true;
2318 while (ProgressMade
) {
2319 ProgressMade
= false;
2321 for (unsigned i
= 0, e
= TryAgainList
.size(); i
!= e
; ++i
) {
2322 CopyRec
&TheCopy
= TryAgainList
[i
];
2325 bool Success
= JoinCopy(TheCopy
, Again
);
2326 if (Success
|| !Again
) {
2327 TheCopy
.MI
= 0; // Mark this one as done.
2328 ProgressMade
= true;
2339 /// Return true if the two specified registers belong to different register
2340 /// classes. The registers may be either phys or virt regs.
2342 SimpleRegisterCoalescing::differingRegisterClasses(unsigned RegA
,
2343 unsigned RegB
) const {
2344 // Get the register classes for the first reg.
2345 if (TargetRegisterInfo::isPhysicalRegister(RegA
)) {
2346 assert(TargetRegisterInfo::isVirtualRegister(RegB
) &&
2347 "Shouldn't consider two physregs!");
2348 return !mri_
->getRegClass(RegB
)->contains(RegA
);
2351 // Compare against the regclass for the second reg.
2352 const TargetRegisterClass
*RegClassA
= mri_
->getRegClass(RegA
);
2353 if (TargetRegisterInfo::isVirtualRegister(RegB
)) {
2354 const TargetRegisterClass
*RegClassB
= mri_
->getRegClass(RegB
);
2355 return RegClassA
!= RegClassB
;
2357 return !RegClassA
->contains(RegB
);
2360 /// lastRegisterUse - Returns the last use of the specific register between
2361 /// cycles Start and End or NULL if there are no uses.
2363 SimpleRegisterCoalescing::lastRegisterUse(unsigned Start
, unsigned End
,
2364 unsigned Reg
, unsigned &UseIdx
) const{
2366 if (TargetRegisterInfo::isVirtualRegister(Reg
)) {
2367 MachineOperand
*LastUse
= NULL
;
2368 for (MachineRegisterInfo::use_iterator I
= mri_
->use_begin(Reg
),
2369 E
= mri_
->use_end(); I
!= E
; ++I
) {
2370 MachineOperand
&Use
= I
.getOperand();
2371 MachineInstr
*UseMI
= Use
.getParent();
2372 unsigned SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
;
2373 if (tii_
->isMoveInstr(*UseMI
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
) &&
2375 // Ignore identity copies.
2377 unsigned Idx
= li_
->getInstructionIndex(UseMI
);
2378 if (Idx
>= Start
&& Idx
< End
&& Idx
>= UseIdx
) {
2380 UseIdx
= li_
->getUseIndex(Idx
);
2386 int e
= (End
-1) / InstrSlots::NUM
* InstrSlots::NUM
;
2389 // Skip deleted instructions
2390 MachineInstr
*MI
= li_
->getInstructionFromIndex(e
);
2391 while ((e
- InstrSlots::NUM
) >= s
&& !MI
) {
2392 e
-= InstrSlots::NUM
;
2393 MI
= li_
->getInstructionFromIndex(e
);
2395 if (e
< s
|| MI
== NULL
)
2398 // Ignore identity copies.
2399 unsigned SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
;
2400 if (!(tii_
->isMoveInstr(*MI
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
) &&
2402 for (unsigned i
= 0, NumOps
= MI
->getNumOperands(); i
!= NumOps
; ++i
) {
2403 MachineOperand
&Use
= MI
->getOperand(i
);
2404 if (Use
.isReg() && Use
.isUse() && Use
.getReg() &&
2405 tri_
->regsOverlap(Use
.getReg(), Reg
)) {
2406 UseIdx
= li_
->getUseIndex(e
);
2411 e
-= InstrSlots::NUM
;
2418 void SimpleRegisterCoalescing::printRegName(unsigned reg
) const {
2419 if (TargetRegisterInfo::isPhysicalRegister(reg
))
2420 cerr
<< tri_
->getName(reg
);
2422 cerr
<< "%reg" << reg
;
2425 void SimpleRegisterCoalescing::releaseMemory() {
2426 JoinedCopies
.clear();
2427 ReMatCopies
.clear();
2431 static bool isZeroLengthInterval(LiveInterval
*li
) {
2432 for (LiveInterval::Ranges::const_iterator
2433 i
= li
->ranges
.begin(), e
= li
->ranges
.end(); i
!= e
; ++i
)
2434 if (i
->end
- i
->start
> LiveIntervals::InstrSlots::NUM
)
2439 /// TurnCopyIntoImpDef - If source of the specified copy is an implicit def,
2440 /// turn the copy into an implicit def.
2442 SimpleRegisterCoalescing::TurnCopyIntoImpDef(MachineBasicBlock::iterator
&I
,
2443 MachineBasicBlock
*MBB
,
2444 unsigned DstReg
, unsigned SrcReg
) {
2445 MachineInstr
*CopyMI
= &*I
;
2446 unsigned CopyIdx
= li_
->getDefIndex(li_
->getInstructionIndex(CopyMI
));
2447 if (!li_
->hasInterval(SrcReg
))
2449 LiveInterval
&SrcInt
= li_
->getInterval(SrcReg
);
2450 if (!SrcInt
.empty())
2452 if (!li_
->hasInterval(DstReg
))
2454 LiveInterval
&DstInt
= li_
->getInterval(DstReg
);
2455 const LiveRange
*DstLR
= DstInt
.getLiveRangeContaining(CopyIdx
);
2456 DstInt
.removeValNo(DstLR
->valno
);
2457 CopyMI
->setDesc(tii_
->get(TargetInstrInfo::IMPLICIT_DEF
));
2458 for (int i
= CopyMI
->getNumOperands() - 1, e
= 0; i
> e
; --i
)
2459 CopyMI
->RemoveOperand(i
);
2460 bool NoUse
= mri_
->use_empty(SrcReg
);
2462 for (MachineRegisterInfo::reg_iterator I
= mri_
->reg_begin(SrcReg
),
2463 E
= mri_
->reg_end(); I
!= E
; ) {
2464 assert(I
.getOperand().isDef());
2465 MachineInstr
*DefMI
= &*I
;
2467 // The implicit_def source has no other uses, delete it.
2468 assert(DefMI
->getOpcode() == TargetInstrInfo::IMPLICIT_DEF
);
2469 li_
->RemoveMachineInstrFromMaps(DefMI
);
2470 DefMI
->eraseFromParent();
2478 bool SimpleRegisterCoalescing::runOnMachineFunction(MachineFunction
&fn
) {
2480 mri_
= &fn
.getRegInfo();
2481 tm_
= &fn
.getTarget();
2482 tri_
= tm_
->getRegisterInfo();
2483 tii_
= tm_
->getInstrInfo();
2484 li_
= &getAnalysis
<LiveIntervals
>();
2485 loopInfo
= &getAnalysis
<MachineLoopInfo
>();
2487 DOUT
<< "********** SIMPLE REGISTER COALESCING **********\n"
2488 << "********** Function: "
2489 << ((Value
*)mf_
->getFunction())->getName() << '\n';
2491 allocatableRegs_
= tri_
->getAllocatableSet(fn
);
2492 for (TargetRegisterInfo::regclass_iterator I
= tri_
->regclass_begin(),
2493 E
= tri_
->regclass_end(); I
!= E
; ++I
)
2494 allocatableRCRegs_
.insert(std::make_pair(*I
,
2495 tri_
->getAllocatableSet(fn
, *I
)));
2497 // Join (coalesce) intervals if requested.
2498 if (EnableJoining
) {
2501 DOUT
<< "********** INTERVALS POST JOINING **********\n";
2502 for (LiveIntervals::iterator I
= li_
->begin(), E
= li_
->end(); I
!= E
; ++I
){
2503 I
->second
->print(DOUT
, tri_
);
2509 // Perform a final pass over the instructions and compute spill weights
2510 // and remove identity moves.
2511 SmallVector
<unsigned, 4> DeadDefs
;
2512 for (MachineFunction::iterator mbbi
= mf_
->begin(), mbbe
= mf_
->end();
2513 mbbi
!= mbbe
; ++mbbi
) {
2514 MachineBasicBlock
* mbb
= mbbi
;
2515 unsigned loopDepth
= loopInfo
->getLoopDepth(mbb
);
2517 for (MachineBasicBlock::iterator mii
= mbb
->begin(), mie
= mbb
->end();
2519 MachineInstr
*MI
= mii
;
2520 unsigned SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
;
2521 if (JoinedCopies
.count(MI
)) {
2522 // Delete all coalesced copies.
2523 if (!tii_
->isMoveInstr(*MI
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
)) {
2524 assert((MI
->getOpcode() == TargetInstrInfo::EXTRACT_SUBREG
||
2525 MI
->getOpcode() == TargetInstrInfo::INSERT_SUBREG
||
2526 MI
->getOpcode() == TargetInstrInfo::SUBREG_TO_REG
) &&
2527 "Unrecognized copy instruction");
2528 DstReg
= MI
->getOperand(0).getReg();
2530 if (MI
->registerDefIsDead(DstReg
)) {
2531 LiveInterval
&li
= li_
->getInterval(DstReg
);
2532 if (!ShortenDeadCopySrcLiveRange(li
, MI
))
2533 ShortenDeadCopyLiveRange(li
, MI
);
2535 li_
->RemoveMachineInstrFromMaps(MI
);
2536 mii
= mbbi
->erase(mii
);
2541 // Now check if this is a remat'ed def instruction which is now dead.
2542 if (ReMatDefs
.count(MI
)) {
2544 for (unsigned i
= 0, e
= MI
->getNumOperands(); i
!= e
; ++i
) {
2545 const MachineOperand
&MO
= MI
->getOperand(i
);
2548 unsigned Reg
= MO
.getReg();
2551 if (TargetRegisterInfo::isVirtualRegister(Reg
))
2552 DeadDefs
.push_back(Reg
);
2555 if (TargetRegisterInfo::isPhysicalRegister(Reg
) ||
2556 !mri_
->use_empty(Reg
)) {
2562 while (!DeadDefs
.empty()) {
2563 unsigned DeadDef
= DeadDefs
.back();
2564 DeadDefs
.pop_back();
2565 RemoveDeadDef(li_
->getInterval(DeadDef
), MI
);
2567 li_
->RemoveMachineInstrFromMaps(mii
);
2568 mii
= mbbi
->erase(mii
);
2574 // If the move will be an identity move delete it
2575 bool isMove
= tii_
->isMoveInstr(*MI
, SrcReg
, DstReg
, SrcSubIdx
, DstSubIdx
);
2576 if (isMove
&& SrcReg
== DstReg
) {
2577 if (li_
->hasInterval(SrcReg
)) {
2578 LiveInterval
&RegInt
= li_
->getInterval(SrcReg
);
2579 // If def of this move instruction is dead, remove its live range
2580 // from the dstination register's live interval.
2581 if (MI
->registerDefIsDead(DstReg
)) {
2582 if (!ShortenDeadCopySrcLiveRange(RegInt
, MI
))
2583 ShortenDeadCopyLiveRange(RegInt
, MI
);
2586 li_
->RemoveMachineInstrFromMaps(MI
);
2587 mii
= mbbi
->erase(mii
);
2589 } else if (!isMove
|| !TurnCopyIntoImpDef(mii
, mbb
, DstReg
, SrcReg
)) {
2590 SmallSet
<unsigned, 4> UniqueUses
;
2591 for (unsigned i
= 0, e
= MI
->getNumOperands(); i
!= e
; ++i
) {
2592 const MachineOperand
&mop
= MI
->getOperand(i
);
2593 if (mop
.isReg() && mop
.getReg() &&
2594 TargetRegisterInfo::isVirtualRegister(mop
.getReg())) {
2595 unsigned reg
= mop
.getReg();
2596 // Multiple uses of reg by the same instruction. It should not
2597 // contribute to spill weight again.
2598 if (UniqueUses
.count(reg
) != 0)
2600 LiveInterval
&RegInt
= li_
->getInterval(reg
);
2602 li_
->getSpillWeight(mop
.isDef(), mop
.isUse(), loopDepth
);
2603 UniqueUses
.insert(reg
);
2611 for (LiveIntervals::iterator I
= li_
->begin(), E
= li_
->end(); I
!= E
; ++I
) {
2612 LiveInterval
&LI
= *I
->second
;
2613 if (TargetRegisterInfo::isVirtualRegister(LI
.reg
)) {
2614 // If the live interval length is essentially zero, i.e. in every live
2615 // range the use follows def immediately, it doesn't make sense to spill
2616 // it and hope it will be easier to allocate for this li.
2617 if (isZeroLengthInterval(&LI
))
2618 LI
.weight
= HUGE_VALF
;
2620 bool isLoad
= false;
2621 SmallVector
<LiveInterval
*, 4> SpillIs
;
2622 if (li_
->isReMaterializable(LI
, SpillIs
, isLoad
)) {
2623 // If all of the definitions of the interval are re-materializable,
2624 // it is a preferred candidate for spilling. If non of the defs are
2625 // loads, then it's potentially very cheap to re-materialize.
2626 // FIXME: this gets much more complicated once we support non-trivial
2627 // re-materialization.
2635 // Slightly prefer live interval that has been assigned a preferred reg.
2639 // Divide the weight of the interval by its size. This encourages
2640 // spilling of intervals that are large and have few uses, and
2641 // discourages spilling of small intervals with many uses.
2642 LI
.weight
/= li_
->getApproximateInstructionCount(LI
) * InstrSlots::NUM
;
2650 /// print - Implement the dump method.
2651 void SimpleRegisterCoalescing::print(std::ostream
&O
, const Module
* m
) const {
2655 RegisterCoalescer
* llvm::createSimpleRegisterCoalescer() {
2656 return new SimpleRegisterCoalescing();
2659 // Make sure that anything that uses RegisterCoalescer pulls in this file...
2660 DEFINING_FILE_FOR(SimpleRegisterCoalescing
)