1 //===- SplitKit.h - Toolkit for splitting live ranges -----------*- C++ -*-===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // This file contains the SplitAnalysis class as well as mutator functions for
10 // live range splitting.
12 //===----------------------------------------------------------------------===//
14 #ifndef LLVM_LIB_CODEGEN_SPLITKIT_H
15 #define LLVM_LIB_CODEGEN_SPLITKIT_H
17 #include "llvm/ADT/ArrayRef.h"
18 #include "llvm/ADT/BitVector.h"
19 #include "llvm/ADT/DenseMap.h"
20 #include "llvm/ADT/DenseSet.h"
21 #include "llvm/ADT/IntervalMap.h"
22 #include "llvm/ADT/PointerIntPair.h"
23 #include "llvm/ADT/SmallPtrSet.h"
24 #include "llvm/ADT/SmallVector.h"
25 #include "llvm/CodeGen/LiveIntervalCalc.h"
26 #include "llvm/CodeGen/LiveIntervals.h"
27 #include "llvm/CodeGen/MachineBasicBlock.h"
28 #include "llvm/CodeGen/MachineFunction.h"
29 #include "llvm/CodeGen/SlotIndexes.h"
30 #include "llvm/Support/Compiler.h"
// Forward declarations. Within this header these types are only named as
// reference members or reference parameters, so no definition is required.
39 class MachineBlockFrequencyInfo
;
40 class MachineDominatorTree
;
41 class MachineLoopInfo
;
42 class MachineRegisterInfo
;
43 class TargetInstrInfo
;
44 class TargetRegisterInfo
;
48 /// Determines the latest safe point in a block in which we can insert a split,
49 /// spill or other instruction related to CurLI.
50 class LLVM_LIBRARY_VISIBILITY InsertPointAnalysis
{
/// Live interval analysis; queried here for block-start and instruction slot
/// indexes (see getFirstInsertPoint()).
52 const LiveIntervals
&LIS
;
54 /// Last legal insert point in each basic block in the current function.
/// Indexed by basic block number (see getLastInsertPoint()).
55 /// The first entry is the first terminator, the second entry is the
56 /// last valid point to insert a split or spill for a variable that is
57 /// live into a landing pad or inlineasm_br successor.
/// An entry whose first index is valid and whose second index is invalid is
/// served directly by getLastInsertPoint() without further computation.
58 SmallVector
<std::pair
<SlotIndex
, SlotIndex
>, 8> LastInsertPoint
;
/// Slow path of getLastInsertPoint(): called for \p CurLI in \p MBB whenever
/// the cached LastInsertPoint entry cannot be returned as-is.
/// NOTE(review): defined out of line; whether it also populates
/// LastInsertPoint is not visible from this header -- confirm.
60 SlotIndex
computeLastInsertPoint(const LiveInterval
&CurLI
,
61 const MachineBasicBlock
&MBB
);
/// Create an analysis that queries \p lis.
/// NOTE(review): \p BBNum is presumably the number of basic blocks, used to
/// size LastInsertPoint -- confirm against the out-of-line definition.
64 InsertPointAnalysis(const LiveIntervals
&lis
, unsigned BBNum
);
66 /// Return the base index of the last valid insert point for \p CurLI in \p MBB.
/// The cached first-terminator index is returned directly when it is valid and
/// no second index is recorded for the block; every other case is forwarded
/// to computeLastInsertPoint().
67 SlotIndex
getLastInsertPoint(const LiveInterval
&CurLI
,
68 const MachineBasicBlock
&MBB
) {
69 unsigned Num
= MBB
.getNumber();
70 // Inline the common simple case: only the first entry of the cached pair
// is valid, so the answer does not depend on CurLI.
71 if (LastInsertPoint
[Num
].first
.isValid() &&
72 !LastInsertPoint
[Num
].second
.isValid())
73 return LastInsertPoint
[Num
].first
;
74 return computeLastInsertPoint(CurLI
, MBB
);
77 /// Returns the last insert point as an iterator for \p CurLI in \p MBB.
/// Unlike getLastInsertPoint(), \p MBB is taken by non-const reference.
78 MachineBasicBlock::iterator
getLastInsertPointIter(const LiveInterval
&CurLI
,
79 MachineBasicBlock
&MBB
);
81 /// Return the base index of the first insert point in \p MBB.
82 SlotIndex
getFirstInsertPoint(MachineBasicBlock
&MBB
) {
// Begin with the slot index at which the block starts.
83 SlotIndex Res
= LIS
.getMBBStartIdx(&MBB
);
// Skip the leading PHIs, labels and debug instructions of the block.
85 MachineBasicBlock::iterator MII
= MBB
.SkipPHIsLabelsAndDebug(MBB
.begin());
// Use the index of the instruction found after the skipped prefix.
87 Res
= LIS
.getInstructionIndex(*MII
);
94 /// SplitAnalysis - Analyze a LiveInterval, looking for live range splitting
/// opportunities.
96 class LLVM_LIBRARY_VISIBILITY SplitAnalysis
{
/// Function, analyses and target hooks consulted by the analysis.
/// NOTE(review): the constructor only takes vrm, lis and mli, so MF and TII
/// are presumably derived from those -- confirm in the out-of-line definition.
98 const MachineFunction
&MF
;
99 const VirtRegMap
&VRM
;
100 const LiveIntervals
&LIS
;
101 const MachineLoopInfo
&Loops
;
102 const TargetInstrInfo
&TII
;
104 /// Additional information about basic blocks where the current variable is
105 /// live. Such a block will look like one of these templates:
107 /// 1. | o---x | Internal to block. Variable is only live in this block.
108 /// 2. |---x | Live-in, kill.
109 /// 3. | o---| Def, live-out.
110 /// 4. |---x o---| Live-in, kill, def, live-out. Counted by NumGapBlocks.
111 /// 5. |---o---o---| Live-through with uses or defs.
112 /// 6. |-----------| Live-through without uses. Counted by NumThroughBlocks.
114 /// Two BlockInfo entries are created for template 4. One for the live-in
115 /// segment, and one for the live-out segment. These entries look as if the
116 /// block were split in the middle where the live range isn't live.
118 /// Live-through blocks without any uses don't get BlockInfo entries. They
119 /// are simply listed in ThroughBlocks instead.
/// Basic block this entry describes.
122 MachineBasicBlock
*MBB
;
123 SlotIndex FirstInstr
; ///< First instruction accessing the current register.
124 SlotIndex LastInstr
; ///< Last instruction accessing the current register.
125 SlotIndex FirstDef
; ///< First non-phi valno->def, or SlotIndex() if there is none.
126 bool LiveIn
; ///< Current register is live into the block.
127 bool LiveOut
; ///< Current register is live out of the block.
129 /// isOneInstr - Returns true when this BlockInfo describes a single
/// instruction, i.e. FirstInstr and LastInstr belong to the same instruction.
131 bool isOneInstr() const {
132 return SlotIndex::isSameInstr(FirstInstr
, LastInstr
);
/// Write a textual description of this entry to \p OS.
135 void print(raw_ostream
&OS
) const;
140 /// Current live interval. Null until analyze() sets it.
141 const LiveInterval
*CurLI
= nullptr;
143 /// Insert Point Analysis, backing the get*SplitPoint() helpers.
144 InsertPointAnalysis IPA
;
146 /// Sorted slot indexes of using instructions (exposed via getUseSlots()).
147 SmallVector
<SlotIndex
, 8> UseSlots
;
149 /// UseBlocks - Blocks where CurLI has uses.
150 SmallVector
<BlockInfo
, 8> UseBlocks
;
152 /// NumGapBlocks - Number of duplicate entries in UseBlocks for blocks where
153 /// the live range has a gap.
/// getNumLiveBlocks() subtracts this so such blocks are counted once.
154 unsigned NumGapBlocks
= 0u;
156 /// ThroughBlocks - Block numbers where CurLI is live through without uses.
157 BitVector ThroughBlocks
;
159 /// NumThroughBlocks - Number of live-through blocks.
160 unsigned NumThroughBlocks
= 0u;
162 // Summarize statistics by counting instructions using CurLI.
165 /// calcLiveBlockInfo - Compute per-block information about CurLI.
/// NOTE(review): presumably fills UseBlocks, NumGapBlocks, ThroughBlocks and
/// NumThroughBlocks -- confirm against the out-of-line definition.
166 void calcLiveBlockInfo();
/// Construct an analysis over the given virtual register map, live
/// intervals and loop info. No interval is selected until analyze() is called
/// (CurLI defaults to null).
169 SplitAnalysis(const VirtRegMap
&vrm
, const LiveIntervals
&lis
,
170 const MachineLoopInfo
&mli
);
172 /// analyze - set CurLI to the specified interval, and analyze how it may be
/// split.
174 void analyze(const LiveInterval
*li
);
176 /// clear - clear all data structures so SplitAnalysis is ready to analyze a
/// new interval.
180 /// getParent - Return the last analyzed interval.
/// Dereferences CurLI unconditionally, so analyze() must have been called
/// with a non-null interval first.
181 const LiveInterval
&getParent() const { return *CurLI
; }
183 /// isOriginalEndpoint - Return true if the original live range was killed or
184 /// (re-)defined at Idx. Idx should be the 'def' slot for a normal kill/def,
185 /// and 'use' for an early-clobber def.
186 /// This can be used to recognize code inserted by earlier live range
/// splitting.
188 bool isOriginalEndpoint(SlotIndex Idx
) const;
190 /// getUseSlots - Return an array of SlotIndexes of instructions using CurLI.
191 /// This includes both use and def operands, at most one entry per instruction.
/// The returned ArrayRef views the UseSlots member rather than copying it.
192 ArrayRef
<SlotIndex
> getUseSlots() const { return UseSlots
; }
194 /// getUseBlocks - Return an array of BlockInfo objects for the basic blocks
195 /// where CurLI has uses.
/// A block where the live range has a gap contributes two entries (counted
/// by NumGapBlocks).
196 ArrayRef
<BlockInfo
> getUseBlocks() const { return UseBlocks
; }
198 /// getNumThroughBlocks - Return the number of through blocks.
199 unsigned getNumThroughBlocks() const { return NumThroughBlocks
; }
201 /// isThroughBlock - Return true if CurLI is live through MBB without uses.
/// \p MBB is a basic block number (an index into ThroughBlocks), not a pointer.
202 bool isThroughBlock(unsigned MBB
) const { return ThroughBlocks
.test(MBB
); }
204 /// getThroughBlocks - Return the set of through blocks.
205 const BitVector
&getThroughBlocks() const { return ThroughBlocks
; }
207 /// getNumLiveBlocks - Return the number of blocks where CurLI is live.
208 unsigned getNumLiveBlocks() const {
// Gap blocks have two UseBlocks entries, so NumGapBlocks is subtracted to
// count each of them once; through blocks are tracked separately.
209 return getUseBlocks().size() - NumGapBlocks
+ getNumThroughBlocks();
212 /// countLiveBlocks - Return the number of blocks where li is live. This is
213 /// guaranteed to return the same number as getNumLiveBlocks() after calling
/// analyze(li).
215 unsigned countLiveBlocks(const LiveInterval
*li
) const;
217 using BlockPtrSet
= SmallPtrSet
<const MachineBasicBlock
*, 16>;
219 /// shouldSplitSingleBlock - Returns true if it would help to create a local
220 /// live range for the instructions in BI. There is normally no benefit to
221 /// creating a live range for a single instruction, but it does enable
222 /// register class inflation if the instruction has a restricted register
/// class.
///
225 /// @param BI The block to be isolated.
226 /// @param SingleInstrs True when single instructions should be isolated.
227 bool shouldSplitSingleBlock(const BlockInfo
&BI
, bool SingleInstrs
) const;
/// Return the last insert point for CurLI in the basic block numbered
/// \p Num (forwards to InsertPointAnalysis::getLastInsertPoint()).
/// CurLI is dereferenced, so analyze() must have set it.
229 SlotIndex
getLastSplitPoint(unsigned Num
) {
230 return IPA
.getLastInsertPoint(*CurLI
, *MF
.getBlockNumbered(Num
));
/// Return the last insert point for CurLI in \p BB (forwards to
/// InsertPointAnalysis::getLastInsertPoint()). Both \p BB and CurLI are
/// dereferenced and therefore must be non-null.
233 SlotIndex
getLastSplitPoint(MachineBasicBlock
*BB
) {
234 return IPA
.getLastInsertPoint(*CurLI
, *BB
);
/// Iterator form of getLastSplitPoint(): forwards to
/// InsertPointAnalysis::getLastInsertPointIter() for CurLI in \p BB.
/// Both \p BB and CurLI are dereferenced and therefore must be non-null.
237 MachineBasicBlock::iterator
getLastSplitPointIter(MachineBasicBlock
*BB
) {
238 return IPA
.getLastInsertPointIter(*CurLI
, *BB
);
/// Return the first insert point in the basic block numbered \p Num
/// (forwards to InsertPointAnalysis::getFirstInsertPoint()). Unlike the
/// last-split-point helpers this does not depend on CurLI.
241 SlotIndex
getFirstSplitPoint(unsigned Num
) {
242 return IPA
.getFirstInsertPoint(*MF
.getBlockNumbered(Num
));
246 /// SplitEditor - Edit machine code and LiveIntervals for live range
/// splitting.
249 /// - Create a SplitEditor from a SplitAnalysis.
250 /// - Start a new live interval with openIntv.
251 /// - Mark the places where the new interval is entered using enterIntv*
252 /// - Mark the ranges where the new interval is used with useIntv*
253 /// - Mark the places where the interval is exited with exitIntv*.
254 /// - Finish the current interval with closeIntv and repeat from 2.
255 /// - Rewrite instructions with finish().
257 class LLVM_LIBRARY_VISIBILITY SplitEditor
{
/// Function-level state and analyses used while editing.
/// NOTE(review): MDT, MBFI and VRAI match constructor parameters; MRI, TII
/// and TRI have no matching parameter and are presumably derived from the
/// other arguments -- confirm in the out-of-line constructor.
261 MachineRegisterInfo
&MRI
;
262 MachineDominatorTree
&MDT
;
263 const TargetInstrInfo
&TII
;
264 const TargetRegisterInfo
&TRI
;
265 const MachineBlockFrequencyInfo
&MBFI
;
266 VirtRegAuxInfo
&VRAI
;
269 /// ComplementSpillMode - Select how the complement live range should be
270 /// created. SplitEditor automatically creates interval 0 to contain
271 /// anything that isn't added to another interval. This complement interval
272 /// can get quite complicated, and it can sometimes be an advantage to allow
273 /// it to overlap the other intervals. If it is going to spill anyway, no
274 /// registers are wasted by keeping a value in two places at the same time.
275 enum ComplementSpillMode
{
276 /// SM_Partition (default) - Try to create the complement interval so it
277 /// doesn't overlap any other intervals, and the original interval is
278 /// partitioned. This may require a large number of back copies and extra
279 /// PHI-defs. Only segments marked with overlapIntv will be overlapping.
282 /// SM_Size - Overlap intervals to minimize the number of inserted COPY
283 /// instructions. Copies to the complement interval are hoisted to their
284 /// common dominator, so only one COPY is required per value in the
285 /// complement interval. This also means that no extra PHI-defs need to be
286 /// inserted in the complement interval.
289 /// SM_Speed - Overlap intervals to minimize the expected execution
290 /// frequency of the inserted copies. This is very similar to SM_Size, but
291 /// the complement interval may get some extra PHI-defs.
296 /// Edit - The current parent register and new intervals created.
/// Null by default. NOTE(review): presumably installed by reset(), which
/// takes a LiveRangeEdit reference -- confirm.
297 LiveRangeEdit
*Edit
= nullptr;
299 /// Index into Edit of the currently open interval.
300 /// The index 0 is used for the complement, so the first interval started by
301 /// openIntv will be 1.
302 unsigned OpenIdx
= 0;
304 /// The current spill mode, selected by reset(). Defaults to SM_Partition.
305 ComplementSpillMode SpillMode
= SM_Partition
;
/// Interval map from SlotIndex ranges to an unsigned register index.
307 using RegAssignMap
= IntervalMap
<SlotIndex
, unsigned>;
309 /// Allocator for the interval map. This will eventually be shared with
310 /// SlotIndexes and LiveIntervals.
311 RegAssignMap::Allocator Allocator
;
313 /// RegAssign - Map of the assigned register indexes.
314 /// Edit.get(RegAssign.lookup(Idx)) is the register that should be live at
/// Idx.
316 RegAssignMap RegAssign
;
/// A VNInfo pointer packed together with one extra bit.
/// NOTE(review): going by the alias name and the (Null, true) case in the
/// Values description, the bit presumably means "force recompute" -- confirm.
318 using ValueForcePair
= PointerIntPair
<VNInfo
*, 1>;
/// Map keyed by a pair of unsigned values; the Values description gives the
/// key as (RegIdx, ParentVNI->id).
319 using ValueMap
= DenseMap
<std::pair
<unsigned, unsigned>, ValueForcePair
>;
321 /// Values - keep track of the mapping from parent values to values in the new
322 /// intervals. Given a pair (RegIdx, ParentVNI->id), Values contains:
324 /// 1. No entry - the value is not mapped to Edit.get(RegIdx).
325 /// 2. (Null, false) - the value is mapped to multiple values in
326 /// Edit.get(RegIdx). Each value is represented by a minimal live range at
327 /// its def. The full live range can be inferred exactly from the range
328 /// of RegIdx in RegAssign.
329 /// 3. (Null, true). As above, but the ranges in RegAssign are too large, and
330 /// the live range must be recomputed using ::extend().
331 /// 4. (VNI, false) The value is mapped to a single new value.
332 /// The new value has no live ranges anywhere.
335 /// LICalc - Cache for computing live ranges and SSA update. Each instance
336 /// can only handle non-overlapping live ranges, so use a separate
337 /// LiveIntervalCalc instance for the complement interval when in spill mode.
338 LiveIntervalCalc LICalc
[2];
340 /// getLICalc - Return the LICalc to use for RegIdx. In spill mode, the
341 /// complement interval can overlap the other intervals, so it gets its own
342 /// LICalc instance. When not in spill mode, all intervals can share one.
343 LiveIntervalCalc
&getLICalc(unsigned RegIdx
) {
// The boolean converts to index 0 or 1: LICalc[1] is used only for
// non-complement intervals (RegIdx != 0) outside SM_Partition mode;
// LICalc[0] serves every other case, including the complement.
344 return LICalc
[SpillMode
!= SM_Partition
&& RegIdx
!= 0];
347 /// Add a segment to the interval LI for the value number VNI. If LI has
348 /// subranges, corresponding segments will be added to them as well, but
349 /// with newly created value numbers. If Original is true, a dead def will
350 /// only be added to a subrange of LI if the corresponding subrange of the
351 /// original interval has a def at this index. Otherwise, all subranges
352 /// of LI will be updated.
353 void addDeadDef(LiveInterval
&LI
, VNInfo
*VNI
, bool Original
);
355 /// defValue - define a value in RegIdx from ParentVNI at Idx.
356 /// Idx does not have to be ParentVNI->def, but it must be contained within
357 /// ParentVNI's live range in ParentLI. The new value is added to the value
358 /// map. The value being defined may either come from rematerialization
359 /// (or an inserted copy), or it may be coming from the original interval.
360 /// The parameter Original should be true in the latter case, otherwise
361 /// it should be false.
362 /// Return the new LI value.
363 VNInfo
*defValue(unsigned RegIdx
, const VNInfo
*ParentVNI
, SlotIndex Idx
,
366 /// forceRecompute - Force the live range of ParentVNI in RegIdx to be
367 /// recomputed by LiveRangeCalc::extend regardless of the number of defs.
368 /// This is used for values whose live range doesn't match RegAssign exactly.
369 /// They could have been rematerialized, or back-copies may have been moved.
370 void forceRecompute(unsigned RegIdx
, const VNInfo
&ParentVNI
);
372 /// Calls forceRecompute() on any affected regidx and on ParentVNI
373 /// predecessors in case of a phi definition.
374 void forceRecomputeVNI(const VNInfo
&ParentVNI
);
376 /// defFromParent - Define Edit.get(RegIdx) from ParentVNI at UseIdx using
377 /// either rematerialization or a COPY from parent. Return the new value.
/// NOTE(review): \p MBB and \p I presumably give the position at which the
/// defining instruction is inserted -- confirm against the definition.
378 VNInfo
*defFromParent(unsigned RegIdx
, const VNInfo
*ParentVNI
,
379 SlotIndex UseIdx
, MachineBasicBlock
&MBB
,
380 MachineBasicBlock::iterator I
);
382 /// removeBackCopies - Remove the copy instructions that define the values
383 /// in the vector in the complement interval.
384 void removeBackCopies(SmallVectorImpl
<VNInfo
*> &Copies
);
386 /// findShallowDominator - Returns the least busy dominator of MBB that is
387 /// also dominated by DefMBB. Busy is measured by loop depth.
388 MachineBasicBlock
*findShallowDominator(MachineBasicBlock
*MBB
,
389 MachineBasicBlock
*DefMBB
);
391 /// Find out all the back-copies dominated by others.
/// NOTE(review): \p NotToHoistSet is presumably an output set of value ids
/// that must not be hoisted, and \p BackCopies the candidate back-copy
/// values -- confirm against the definition.
392 void computeRedundantBackCopies(DenseSet
<unsigned> &NotToHoistSet
,
393 SmallVectorImpl
<VNInfo
*> &BackCopies
);
395 /// Hoist back-copies to the complement interval. It tries to hoist all
396 /// the back-copies to one BB if it is beneficial, or else simply remove
397 /// redundant backcopies dominated by others.
400 /// transferValues - Transfer values to the new ranges.
401 /// Return true if any ranges were skipped.
402 bool transferValues();
404 /// Live range @p LR corresponding to the lane Mask @p LM has a live
405 /// PHI def at the beginning of block @p B. Extend the range @p LR of
406 /// all predecessor values that reach this def. If @p LR is a subrange,
407 /// the array @p Undefs is the set of all locations where it is undefined
408 /// via <def,read-undef> in other subranges for the same register.
409 void extendPHIRange(MachineBasicBlock
&B
, LiveIntervalCalc
&LIC
,
410 LiveRange
&LR
, LaneBitmask LM
,
411 ArrayRef
<SlotIndex
> Undefs
);
413 /// extendPHIKillRanges - Extend the ranges of all values killed by original
/// parent PHIDefs.
415 void extendPHIKillRanges();
417 /// rewriteAssigned - Rewrite all uses of Edit.getReg() to assigned registers.
418 void rewriteAssigned(bool ExtendRanges
);
420 /// deleteRematVictims - Delete defs that are dead after rematerializing.
421 void deleteRematVictims();
423 /// Add a copy instruction copying \p FromReg to \p ToReg before
424 /// \p InsertBefore. This can be invoked with a \p LaneMask which may make it
425 /// necessary to construct a sequence of copies to cover it exactly.
/// NOTE(review): \p Late and \p RegIdx are not described here; \p RegIdx is
/// presumably the interval index that \p ToReg belongs to, and the returned
/// SlotIndex presumably identifies the inserted copy -- confirm against the
/// definition.
426 SlotIndex
buildCopy(Register FromReg
, Register ToReg
, LaneBitmask LaneMask
,
427 MachineBasicBlock
&MBB
, MachineBasicBlock::iterator InsertBefore
,
428 bool Late
, unsigned RegIdx
);
/// NOTE(review): undocumented in this header. Judging by the name and
/// signature this presumably emits one copy of sub-register index \p SubIdx
/// from \p FromReg to \p ToReg before \p InsertBefore in \p MB, as a building
/// block for buildCopy() -- confirm against the definition, including the
/// meaning of \p Late, \p Def and \p Desc.
430 SlotIndex
buildSingleSubRegCopy(Register FromReg
, Register ToReg
,
431 MachineBasicBlock
&MB
,
432 MachineBasicBlock::iterator InsertBefore
,
433 unsigned SubIdx
, LiveInterval
&DestLI
,
434 bool Late
, SlotIndex Def
,
435 const MCInstrDesc
&Desc
);
438 /// Create a new SplitEditor for editing the LiveInterval analyzed by SA.
/// NOTE(review): an earlier version of this comment said new intervals are
/// appended to "newIntervals", but no such parameter exists in this
/// signature; new intervals are tracked through the Edit member (a
/// LiveRangeEdit).
440 SplitEditor(SplitAnalysis
&SA
, LiveIntervals
&LIS
, VirtRegMap
&VRM
,
441 MachineDominatorTree
&MDT
, MachineBlockFrequencyInfo
&MBFI
,
442 VirtRegAuxInfo
&VRAI
);
444 /// reset - Prepare for a new split.
/// Takes the LiveRangeEdit to work on and the complement spill mode to use;
/// the mode defaults to SM_Partition when omitted.
445 void reset(LiveRangeEdit
&, ComplementSpillMode
= SM_Partition
);
447 /// Create a new virtual register and live interval.
448 /// Return the interval index, starting from 1. Interval index 0 is the
449 /// implicit complement interval.
452 /// currentIntv - Return the current interval index.
453 unsigned currentIntv() const { return OpenIdx
; }
455 /// selectIntv - Select a previously opened interval index.
456 void selectIntv(unsigned Idx
);
458 /// enterIntvBefore - Enter the open interval before the instruction at Idx.
459 /// If the parent interval is not live before Idx, a COPY is not inserted.
460 /// Return the beginning of the new live range.
461 SlotIndex
enterIntvBefore(SlotIndex Idx
);
463 /// enterIntvAfter - Enter the open interval after the instruction at Idx.
464 /// Return the beginning of the new live range.
465 SlotIndex
enterIntvAfter(SlotIndex Idx
);
467 /// enterIntvAtEnd - Enter the open interval at the end of MBB.
468 /// Use the open interval from the inserted copy to the MBB end.
469 /// Return the beginning of the new live range.
470 SlotIndex
enterIntvAtEnd(MachineBasicBlock
&MBB
);
472 /// useIntv - indicate that all instructions in MBB should use the open
/// interval (the one selected by OpenIdx).
473 void useIntv(const MachineBasicBlock
&MBB
);
475 /// useIntv - indicate that all instructions in the range from Start to End
/// should use the open interval (the one selected by OpenIdx).
476 void useIntv(SlotIndex Start
, SlotIndex End
);
478 /// leaveIntvAfter - Leave the open interval after the instruction at Idx.
479 /// Return the end of the live range.
480 SlotIndex
leaveIntvAfter(SlotIndex Idx
);
482 /// leaveIntvBefore - Leave the open interval before the instruction at Idx.
483 /// Return the end of the live range.
484 SlotIndex
leaveIntvBefore(SlotIndex Idx
);
486 /// leaveIntvAtTop - Leave the interval at the top of MBB.
487 /// Add liveness from the MBB top to the copy.
488 /// Return the end of the live range.
489 SlotIndex
leaveIntvAtTop(MachineBasicBlock
&MBB
);
491 /// overlapIntv - Indicate that all instructions in range should use the open
492 /// interval if End does not have tied-def usage of the register and in this
493 /// case complement interval is used. Let the complement interval be live.
495 /// This doubles the register pressure, but is sometimes required to deal with
496 /// register uses after the last valid split point.
498 /// The Start index should be a return value from a leaveIntv* call, and End
499 /// should be in the same basic block. The parent interval must have the same
500 /// value across the range.
502 void overlapIntv(SlotIndex Start
, SlotIndex End
);
504 /// finish - after all the new live ranges have been created, compute the
505 /// remaining live range, and rewrite instructions to use the new registers.
506 /// @param LRMap When not null, this vector will map each live range in Edit
507 /// back to the indices returned by openIntv.
508 /// There may be extra indices created by dead code elimination.
509 void finish(SmallVectorImpl
<unsigned> *LRMap
= nullptr);
511 /// dump - print the current interval mapping to dbgs().
514 // ===--- High level methods ---===
516 /// splitSingleBlock - Split CurLI into a separate live interval around the
517 /// uses in a single block. This is intended to be used as part of a larger
518 /// split, and doesn't call finish().
519 void splitSingleBlock(const SplitAnalysis::BlockInfo
&BI
);
521 /// splitLiveThroughBlock - Split CurLI in the given block such that it
522 /// enters the block in IntvIn and leaves it in IntvOut. There may be uses in
523 /// the block, but they will be ignored when placing split points.
525 /// @param MBBNum Block number.
526 /// @param IntvIn Interval index entering the block.
527 /// @param LeaveBefore When set, leave IntvIn before this point.
528 /// @param IntvOut Interval index leaving the block.
529 /// @param EnterAfter When set, enter IntvOut after this point.
530 void splitLiveThroughBlock(unsigned MBBNum
,
531 unsigned IntvIn
, SlotIndex LeaveBefore
,
532 unsigned IntvOut
, SlotIndex EnterAfter
);
534 /// splitRegInBlock - Split CurLI in the given block such that it enters the
535 /// block in IntvIn and leaves it on the stack (or not at all). Split points
536 /// are placed in a way that avoids putting uses in the stack interval. This
537 /// may require creating a local interval when there is interference.
539 /// @param BI Block descriptor.
540 /// @param IntvIn Interval index entering the block. Not 0.
541 /// @param LeaveBefore When set, leave IntvIn before this point.
542 void splitRegInBlock(const SplitAnalysis::BlockInfo
&BI
,
543 unsigned IntvIn
, SlotIndex LeaveBefore
);
545 /// splitRegOutBlock - Split CurLI in the given block such that it enters the
546 /// block on the stack (or isn't live-in at all) and leaves it in IntvOut.
547 /// Split points are placed to avoid interference and such that the uses are
548 /// not in the stack interval. This may require creating a local interval
549 /// when there is interference.
551 /// @param BI Block descriptor.
552 /// @param IntvOut Interval index leaving the block.
553 /// @param EnterAfter When set, enter IntvOut after this point.
554 void splitRegOutBlock(const SplitAnalysis::BlockInfo
&BI
,
555 unsigned IntvOut
, SlotIndex EnterAfter
);
558 } // end namespace llvm
560 #endif // LLVM_LIB_CODEGEN_SPLITKIT_H