1 //===- BranchRelaxation.cpp -----------------------------------------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include "llvm/ADT/SmallVector.h"
10 #include "llvm/ADT/Statistic.h"
11 #include "llvm/CodeGen/LivePhysRegs.h"
12 #include "llvm/CodeGen/MachineBasicBlock.h"
13 #include "llvm/CodeGen/MachineFunction.h"
14 #include "llvm/CodeGen/MachineFunctionPass.h"
15 #include "llvm/CodeGen/MachineInstr.h"
16 #include "llvm/CodeGen/RegisterScavenging.h"
17 #include "llvm/CodeGen/TargetInstrInfo.h"
18 #include "llvm/CodeGen/TargetRegisterInfo.h"
19 #include "llvm/CodeGen/TargetSubtargetInfo.h"
20 #include "llvm/Config/llvm-config.h"
21 #include "llvm/IR/DebugLoc.h"
22 #include "llvm/InitializePasses.h"
23 #include "llvm/Pass.h"
24 #include "llvm/Support/Compiler.h"
25 #include "llvm/Support/Debug.h"
26 #include "llvm/Support/ErrorHandling.h"
27 #include "llvm/Support/Format.h"
28 #include "llvm/Support/raw_ostream.h"
29 #include "llvm/Target/TargetMachine.h"
37 #define DEBUG_TYPE "branch-relaxation"
39 STATISTIC(NumSplit
, "Number of basic blocks split");
40 STATISTIC(NumConditionalRelaxed
, "Number of conditional branches relaxed");
41 STATISTIC(NumUnconditionalRelaxed
, "Number of unconditional branches relaxed");
43 #define BRANCH_RELAX_NAME "Branch relaxation pass"
47 class BranchRelaxation
: public MachineFunctionPass
{
48 /// BasicBlockInfo - Information about the offset and size of a single
50 struct BasicBlockInfo
{
51 /// Offset - Distance from the beginning of the function to the beginning
52 /// of this basic block.
54 /// The offset is always aligned as required by the basic block.
57 /// Size - Size of the basic block in bytes. If the block contains
58 /// inline assembly, this is a worst case estimate.
60 /// The size does not include any alignment padding whether from the
61 /// beginning of the block, or from an aligned jump table at the end.
64 BasicBlockInfo() = default;
66 /// Compute the offset immediately following this block. \p MBB is the next
68 unsigned postOffset(const MachineBasicBlock
&MBB
) const {
69 const unsigned PO
= Offset
+ Size
;
70 const Align Alignment
= MBB
.getAlignment();
71 const Align ParentAlign
= MBB
.getParent()->getAlignment();
72 if (Alignment
<= ParentAlign
)
73 return alignTo(PO
, Alignment
);
75 // The alignment of this MBB is larger than the function's alignment, so
76 // we can't tell whether or not it will insert nops. Assume that it will.
77 return alignTo(PO
, Alignment
) + Alignment
.value() - ParentAlign
.value();
81 SmallVector
<BasicBlockInfo
, 16> BlockInfo
;
83 // The basic block after which trampolines are inserted. This is the last
84 // basic block that isn't in the cold section.
85 MachineBasicBlock
*TrampolineInsertionPoint
= nullptr;
86 SmallDenseSet
<std::pair
<MachineBasicBlock
*, MachineBasicBlock
*>>
87 RelaxedUnconditionals
;
88 std::unique_ptr
<RegScavenger
> RS
;
89 LivePhysRegs LiveRegs
;
91 MachineFunction
*MF
= nullptr;
92 const TargetRegisterInfo
*TRI
= nullptr;
93 const TargetInstrInfo
*TII
= nullptr;
94 const TargetMachine
*TM
= nullptr;
96 bool relaxBranchInstructions();
99 MachineBasicBlock
*createNewBlockAfter(MachineBasicBlock
&OrigMBB
);
100 MachineBasicBlock
*createNewBlockAfter(MachineBasicBlock
&OrigMBB
,
101 const BasicBlock
*BB
);
103 MachineBasicBlock
*splitBlockBeforeInstr(MachineInstr
&MI
,
104 MachineBasicBlock
*DestBB
);
105 void adjustBlockOffsets(MachineBasicBlock
&Start
);
106 void adjustBlockOffsets(MachineBasicBlock
&Start
,
107 MachineFunction::iterator End
);
108 bool isBlockInRange(const MachineInstr
&MI
,
109 const MachineBasicBlock
&BB
) const;
111 bool fixupConditionalBranch(MachineInstr
&MI
);
112 bool fixupUnconditionalBranch(MachineInstr
&MI
);
113 uint64_t computeBlockSize(const MachineBasicBlock
&MBB
) const;
114 unsigned getInstrOffset(const MachineInstr
&MI
) const;
121 BranchRelaxation() : MachineFunctionPass(ID
) {}
123 bool runOnMachineFunction(MachineFunction
&MF
) override
;
125 StringRef
getPassName() const override
{ return BRANCH_RELAX_NAME
; }
128 } // end anonymous namespace
130 char BranchRelaxation::ID
= 0;
132 char &llvm::BranchRelaxationPassID
= BranchRelaxation::ID
;
134 INITIALIZE_PASS(BranchRelaxation
, DEBUG_TYPE
, BRANCH_RELAX_NAME
, false, false)
136 /// verify - check BBOffsets, BBSizes, alignment of islands
137 void BranchRelaxation::verify() {
139 unsigned PrevNum
= MF
->begin()->getNumber();
140 for (MachineBasicBlock
&MBB
: *MF
) {
141 const unsigned Num
= MBB
.getNumber();
142 assert(!Num
|| BlockInfo
[PrevNum
].postOffset(MBB
) <= BlockInfo
[Num
].Offset
);
143 assert(BlockInfo
[Num
].Size
== computeBlockSize(MBB
));
147 for (MachineBasicBlock
&MBB
: *MF
) {
148 for (MachineBasicBlock::iterator J
= MBB
.getFirstTerminator();
149 J
!= MBB
.end(); J
= std::next(J
)) {
150 MachineInstr
&MI
= *J
;
151 if (!MI
.isConditionalBranch() && !MI
.isUnconditionalBranch())
153 if (MI
.getOpcode() == TargetOpcode::FAULTING_OP
)
155 MachineBasicBlock
*DestBB
= TII
->getBranchDestBlock(MI
);
156 assert(isBlockInRange(MI
, *DestBB
) ||
157 RelaxedUnconditionals
.contains({&MBB
, DestBB
}));
163 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
164 /// print block size and offset information - debugging
165 LLVM_DUMP_METHOD
void BranchRelaxation::dumpBBs() {
166 for (auto &MBB
: *MF
) {
167 const BasicBlockInfo
&BBI
= BlockInfo
[MBB
.getNumber()];
168 dbgs() << format("%%bb.%u\toffset=%08x\t", MBB
.getNumber(), BBI
.Offset
)
169 << format("size=%#x\n", BBI
.Size
);
174 /// scanFunction - Do the initial scan of the function, building up
175 /// information about each block.
176 void BranchRelaxation::scanFunction() {
178 BlockInfo
.resize(MF
->getNumBlockIDs());
180 TrampolineInsertionPoint
= nullptr;
181 RelaxedUnconditionals
.clear();
183 // First thing, compute the size of all basic blocks, and see if the function
184 // has any inline assembly in it. If so, we have to be conservative about
185 // alignment assumptions, as we don't know for sure the size of any
186 // instructions in the inline assembly. At the same time, place the
187 // trampoline insertion point at the end of the hot portion of the function.
188 for (MachineBasicBlock
&MBB
: *MF
) {
189 BlockInfo
[MBB
.getNumber()].Size
= computeBlockSize(MBB
);
191 if (MBB
.getSectionID() != MBBSectionID::ColdSectionID
)
192 TrampolineInsertionPoint
= &MBB
;
195 // Compute block offsets and known bits.
196 adjustBlockOffsets(*MF
->begin());
198 if (TrampolineInsertionPoint
== nullptr) {
199 LLVM_DEBUG(dbgs() << " No suitable trampoline insertion point found in "
200 << MF
->getName() << ".\n");
204 /// computeBlockSize - Compute the size for MBB.
206 BranchRelaxation::computeBlockSize(const MachineBasicBlock
&MBB
) const {
208 for (const MachineInstr
&MI
: MBB
)
209 Size
+= TII
->getInstSizeInBytes(MI
);
213 /// getInstrOffset - Return the current offset of the specified machine
214 /// instruction from the start of the function. This offset changes as stuff is
215 /// moved around inside the function.
216 unsigned BranchRelaxation::getInstrOffset(const MachineInstr
&MI
) const {
217 const MachineBasicBlock
*MBB
= MI
.getParent();
219 // The offset is composed of two things: the sum of the sizes of all MBB's
220 // before this instruction's block, and the offset from the start of the block
222 unsigned Offset
= BlockInfo
[MBB
->getNumber()].Offset
;
224 // Sum instructions before MI in MBB.
225 for (MachineBasicBlock::const_iterator I
= MBB
->begin(); &*I
!= &MI
; ++I
) {
226 assert(I
!= MBB
->end() && "Didn't find MI in its own basic block?");
227 Offset
+= TII
->getInstSizeInBytes(*I
);
233 void BranchRelaxation::adjustBlockOffsets(MachineBasicBlock
&Start
) {
234 adjustBlockOffsets(Start
, MF
->end());
237 void BranchRelaxation::adjustBlockOffsets(MachineBasicBlock
&Start
,
238 MachineFunction::iterator End
) {
239 unsigned PrevNum
= Start
.getNumber();
241 make_range(std::next(MachineFunction::iterator(Start
)), End
)) {
242 unsigned Num
= MBB
.getNumber();
243 // Get the offset and known bits at the end of the layout predecessor.
244 // Include the alignment of the current block.
245 BlockInfo
[Num
].Offset
= BlockInfo
[PrevNum
].postOffset(MBB
);
251 /// Insert a new empty MachineBasicBlock and insert it after \p OrigMBB
253 BranchRelaxation::createNewBlockAfter(MachineBasicBlock
&OrigBB
) {
254 return createNewBlockAfter(OrigBB
, OrigBB
.getBasicBlock());
257 /// Insert a new empty MachineBasicBlock with \p BB as its BasicBlock
258 /// and insert it after \p OrigMBB
260 BranchRelaxation::createNewBlockAfter(MachineBasicBlock
&OrigMBB
,
261 const BasicBlock
*BB
) {
262 // Create a new MBB for the code after the OrigBB.
263 MachineBasicBlock
*NewBB
= MF
->CreateMachineBasicBlock(BB
);
264 MF
->insert(++OrigMBB
.getIterator(), NewBB
);
266 // Place the new block in the same section as OrigBB
267 NewBB
->setSectionID(OrigMBB
.getSectionID());
268 NewBB
->setIsEndSection(OrigMBB
.isEndSection());
269 OrigMBB
.setIsEndSection(false);
271 // Insert an entry into BlockInfo to align it properly with the block numbers.
272 BlockInfo
.insert(BlockInfo
.begin() + NewBB
->getNumber(), BasicBlockInfo());
277 /// Split the basic block containing MI into two blocks, which are joined by
278 /// an unconditional branch. Update data structures and renumber blocks to
279 /// account for this change and returns the newly created block.
281 BranchRelaxation::splitBlockBeforeInstr(MachineInstr
&MI
,
282 MachineBasicBlock
*DestBB
) {
283 MachineBasicBlock
*OrigBB
= MI
.getParent();
285 // Create a new MBB for the code after the OrigBB.
286 MachineBasicBlock
*NewBB
=
287 MF
->CreateMachineBasicBlock(OrigBB
->getBasicBlock());
288 MF
->insert(++OrigBB
->getIterator(), NewBB
);
290 // Place the new block in the same section as OrigBB.
291 NewBB
->setSectionID(OrigBB
->getSectionID());
292 NewBB
->setIsEndSection(OrigBB
->isEndSection());
293 OrigBB
->setIsEndSection(false);
295 // Splice the instructions starting with MI over to NewBB.
296 NewBB
->splice(NewBB
->end(), OrigBB
, MI
.getIterator(), OrigBB
->end());
298 // Add an unconditional branch from OrigBB to NewBB.
299 // Note the new unconditional branch is not being recorded.
300 // There doesn't seem to be meaningful DebugInfo available; this doesn't
301 // correspond to anything in the source.
302 TII
->insertUnconditionalBranch(*OrigBB
, NewBB
, DebugLoc());
304 // Insert an entry into BlockInfo to align it properly with the block numbers.
305 BlockInfo
.insert(BlockInfo
.begin() + NewBB
->getNumber(), BasicBlockInfo());
307 NewBB
->transferSuccessors(OrigBB
);
308 OrigBB
->addSuccessor(NewBB
);
309 OrigBB
->addSuccessor(DestBB
);
311 // Cleanup potential unconditional branch to successor block.
312 // Note that updateTerminator may change the size of the blocks.
313 OrigBB
->updateTerminator(NewBB
);
315 // Figure out how large the OrigBB is. As the first half of the original
316 // block, it cannot contain a tablejump. The size includes
317 // the new jump we added. (It should be possible to do this without
318 // recounting everything, but it's very confusing, and this is rarely
320 BlockInfo
[OrigBB
->getNumber()].Size
= computeBlockSize(*OrigBB
);
322 // Figure out how large the NewMBB is. As the second half of the original
323 // block, it may contain a tablejump.
324 BlockInfo
[NewBB
->getNumber()].Size
= computeBlockSize(*NewBB
);
326 // Update the offset of the new block.
327 adjustBlockOffsets(*OrigBB
, std::next(NewBB
->getIterator()));
329 // Need to fix live-in lists if we track liveness.
330 if (TRI
->trackLivenessAfterRegAlloc(*MF
))
331 computeAndAddLiveIns(LiveRegs
, *NewBB
);
338 /// isBlockInRange - Returns true if the distance between specific MI and
339 /// specific BB can fit in MI's displacement field.
340 bool BranchRelaxation::isBlockInRange(const MachineInstr
&MI
,
341 const MachineBasicBlock
&DestBB
) const {
342 int64_t BrOffset
= getInstrOffset(MI
);
343 int64_t DestOffset
= BlockInfo
[DestBB
.getNumber()].Offset
;
345 const MachineBasicBlock
*SrcBB
= MI
.getParent();
347 if (TII
->isBranchOffsetInRange(MI
.getOpcode(),
348 SrcBB
->getSectionID() != DestBB
.getSectionID()
349 ? TM
->getMaxCodeSize()
350 : DestOffset
- BrOffset
))
353 LLVM_DEBUG(dbgs() << "Out of range branch to destination "
354 << printMBBReference(DestBB
) << " from "
355 << printMBBReference(*MI
.getParent()) << " to "
356 << DestOffset
<< " offset " << DestOffset
- BrOffset
<< '\t'
362 /// fixupConditionalBranch - Fix up a conditional branch whose destination is
363 /// too far away to fit in its displacement field. It is converted to an inverse
364 /// conditional branch + an unconditional branch to the destination.
365 bool BranchRelaxation::fixupConditionalBranch(MachineInstr
&MI
) {
366 DebugLoc DL
= MI
.getDebugLoc();
367 MachineBasicBlock
*MBB
= MI
.getParent();
368 MachineBasicBlock
*TBB
= nullptr, *FBB
= nullptr;
369 MachineBasicBlock
*NewBB
= nullptr;
370 SmallVector
<MachineOperand
, 4> Cond
;
372 auto insertUncondBranch
= [&](MachineBasicBlock
*MBB
,
373 MachineBasicBlock
*DestBB
) {
374 unsigned &BBSize
= BlockInfo
[MBB
->getNumber()].Size
;
376 TII
->insertUnconditionalBranch(*MBB
, DestBB
, DL
, &NewBrSize
);
379 auto insertBranch
= [&](MachineBasicBlock
*MBB
, MachineBasicBlock
*TBB
,
380 MachineBasicBlock
*FBB
,
381 SmallVectorImpl
<MachineOperand
> &Cond
) {
382 unsigned &BBSize
= BlockInfo
[MBB
->getNumber()].Size
;
384 TII
->insertBranch(*MBB
, TBB
, FBB
, Cond
, DL
, &NewBrSize
);
387 auto removeBranch
= [&](MachineBasicBlock
*MBB
) {
388 unsigned &BBSize
= BlockInfo
[MBB
->getNumber()].Size
;
390 TII
->removeBranch(*MBB
, &RemovedSize
);
391 BBSize
-= RemovedSize
;
394 // Populate the block offset and live-ins for a new basic block.
395 auto updateOffsetAndLiveness
= [&](MachineBasicBlock
*NewBB
) {
396 assert(NewBB
!= nullptr && "can't populate offset for nullptr");
398 // Keep the block offsets approximately up to date. While they will be
399 // slight underestimates, we will update them appropriately in the next
400 // scan through the function.
401 adjustBlockOffsets(*std::prev(NewBB
->getIterator()),
402 std::next(NewBB
->getIterator()));
404 // Need to fix live-in lists if we track liveness.
405 if (TRI
->trackLivenessAfterRegAlloc(*MF
))
406 computeAndAddLiveIns(LiveRegs
, *NewBB
);
409 bool Fail
= TII
->analyzeBranch(*MBB
, TBB
, FBB
, Cond
);
410 assert(!Fail
&& "branches to be relaxed must be analyzable");
413 // Since cross-section conditional branches to the cold section are rarely
414 // taken, try to avoid inverting the condition. Instead, add a "trampoline
415 // branch", which unconditionally branches to the branch destination. Place
416 // the trampoline branch at the end of the function and retarget the
417 // conditional branch to the trampoline.
422 // L1Trampoline: b L1
423 if (MBB
->getSectionID() != TBB
->getSectionID() &&
424 TBB
->getSectionID() == MBBSectionID::ColdSectionID
&&
425 TrampolineInsertionPoint
!= nullptr) {
426 // If the insertion point is out of range, we can't put a trampoline there.
428 createNewBlockAfter(*TrampolineInsertionPoint
, MBB
->getBasicBlock());
430 if (isBlockInRange(MI
, *NewBB
)) {
431 LLVM_DEBUG(dbgs() << " Retarget destination to trampoline at "
434 insertUncondBranch(NewBB
, TBB
);
436 // Update the successor lists to include the trampoline.
437 MBB
->replaceSuccessor(TBB
, NewBB
);
438 NewBB
->addSuccessor(TBB
);
440 // Replace branch in the current (MBB) block.
442 insertBranch(MBB
, NewBB
, FBB
, Cond
);
444 TrampolineInsertionPoint
= NewBB
;
445 updateOffsetAndLiveness(NewBB
);
450 dbgs() << " Trampoline insertion point out of range for Bcc from "
451 << printMBBReference(*MBB
) << " to " << printMBBReference(*TBB
)
453 TrampolineInsertionPoint
->setIsEndSection(NewBB
->isEndSection());
458 // Add an unconditional branch to the destination and invert the branch
459 // condition to jump over it:
466 bool ReversedCond
= !TII
->reverseBranchCondition(Cond
);
468 if (FBB
&& isBlockInRange(MI
, *FBB
)) {
469 // Last MI in the BB is an unconditional branch. We can simply invert the
470 // condition and swap destinations:
476 LLVM_DEBUG(dbgs() << " Invert condition and swap "
477 "its destination with "
481 insertBranch(MBB
, FBB
, TBB
, Cond
);
485 // We need to split the basic block here to obtain two long-range
486 // unconditional branches.
487 NewBB
= createNewBlockAfter(*MBB
);
489 insertUncondBranch(NewBB
, FBB
);
490 // Update the succesor lists according to the transformation to follow.
491 // Do it here since if there's no split, no update is needed.
492 MBB
->replaceSuccessor(FBB
, NewBB
);
493 NewBB
->addSuccessor(FBB
);
494 updateOffsetAndLiveness(NewBB
);
497 // We now have an appropriate fall-through block in place (either naturally
498 // or just created), so we can use the inverted the condition.
499 MachineBasicBlock
&NextBB
= *std::next(MachineFunction::iterator(MBB
));
501 LLVM_DEBUG(dbgs() << " Insert B to " << printMBBReference(*TBB
)
502 << ", invert condition and change dest. to "
503 << printMBBReference(NextBB
) << '\n');
506 // Insert a new conditional branch and a new unconditional branch.
507 insertBranch(MBB
, &NextBB
, TBB
, Cond
);
510 // Branch cond can't be inverted.
511 // In this case we always add a block after the MBB.
512 LLVM_DEBUG(dbgs() << " The branch condition can't be inverted. "
513 << " Insert a new BB after " << MBB
->back());
516 FBB
= &(*std::next(MachineFunction::iterator(MBB
)));
518 // This is the block with cond. branch and the distance to TBB is too long.
522 // We do the following transformation:
529 NewBB
= createNewBlockAfter(*MBB
);
530 insertUncondBranch(NewBB
, TBB
);
532 LLVM_DEBUG(dbgs() << " Insert cond B to the new BB "
533 << printMBBReference(*NewBB
)
534 << " Keep the exiting condition.\n"
535 << " Insert B to " << printMBBReference(*FBB
) << ".\n"
536 << " In the new BB: Insert B to "
537 << printMBBReference(*TBB
) << ".\n");
539 // Update the successor lists according to the transformation to follow.
540 MBB
->replaceSuccessor(TBB
, NewBB
);
541 NewBB
->addSuccessor(TBB
);
543 // Replace branch in the current (MBB) block.
545 insertBranch(MBB
, NewBB
, FBB
, Cond
);
547 updateOffsetAndLiveness(NewBB
);
551 bool BranchRelaxation::fixupUnconditionalBranch(MachineInstr
&MI
) {
552 MachineBasicBlock
*MBB
= MI
.getParent();
553 SmallVector
<MachineOperand
, 4> Cond
;
554 unsigned OldBrSize
= TII
->getInstSizeInBytes(MI
);
555 MachineBasicBlock
*DestBB
= TII
->getBranchDestBlock(MI
);
557 int64_t DestOffset
= BlockInfo
[DestBB
->getNumber()].Offset
;
558 int64_t SrcOffset
= getInstrOffset(MI
);
560 assert(!TII
->isBranchOffsetInRange(
561 MI
.getOpcode(), MBB
->getSectionID() != DestBB
->getSectionID()
562 ? TM
->getMaxCodeSize()
563 : DestOffset
- SrcOffset
));
565 BlockInfo
[MBB
->getNumber()].Size
-= OldBrSize
;
567 MachineBasicBlock
*BranchBB
= MBB
;
569 // If this was an expanded conditional branch, there is already a single
570 // unconditional branch in a block.
572 BranchBB
= createNewBlockAfter(*MBB
);
575 for (const MachineBasicBlock
*Succ
: MBB
->successors()) {
576 for (const MachineBasicBlock::RegisterMaskPair
&LiveIn
: Succ
->liveins())
577 BranchBB
->addLiveIn(LiveIn
);
580 BranchBB
->sortUniqueLiveIns();
581 BranchBB
->addSuccessor(DestBB
);
582 MBB
->replaceSuccessor(DestBB
, BranchBB
);
583 if (TrampolineInsertionPoint
== MBB
)
584 TrampolineInsertionPoint
= BranchBB
;
587 DebugLoc DL
= MI
.getDebugLoc();
588 MI
.eraseFromParent();
590 // Create the optional restore block and, initially, place it at the end of
591 // function. That block will be placed later if it's used; otherwise, it will
593 MachineBasicBlock
*RestoreBB
=
594 createNewBlockAfter(MF
->back(), DestBB
->getBasicBlock());
595 std::prev(RestoreBB
->getIterator())
596 ->setIsEndSection(RestoreBB
->isEndSection());
597 RestoreBB
->setIsEndSection(false);
599 TII
->insertIndirectBranch(*BranchBB
, *DestBB
, *RestoreBB
, DL
,
600 BranchBB
->getSectionID() != DestBB
->getSectionID()
601 ? TM
->getMaxCodeSize()
602 : DestOffset
- SrcOffset
,
605 // Update the block size and offset for the BranchBB (which may be newly
607 BlockInfo
[BranchBB
->getNumber()].Size
= computeBlockSize(*BranchBB
);
608 adjustBlockOffsets(*MBB
, std::next(BranchBB
->getIterator()));
610 // If RestoreBB is required, place it appropriately.
611 if (!RestoreBB
->empty()) {
612 // If the jump is Cold -> Hot, don't place the restore block (which is
613 // cold) in the middle of the function. Place it at the end.
614 if (MBB
->getSectionID() == MBBSectionID::ColdSectionID
&&
615 DestBB
->getSectionID() != MBBSectionID::ColdSectionID
) {
616 MachineBasicBlock
*NewBB
= createNewBlockAfter(*TrampolineInsertionPoint
);
617 TII
->insertUnconditionalBranch(*NewBB
, DestBB
, DebugLoc());
618 BlockInfo
[NewBB
->getNumber()].Size
= computeBlockSize(*NewBB
);
619 adjustBlockOffsets(*TrampolineInsertionPoint
,
620 std::next(NewBB
->getIterator()));
622 // New trampolines should be inserted after NewBB.
623 TrampolineInsertionPoint
= NewBB
;
625 // Retarget the unconditional branch to the trampoline block.
626 BranchBB
->replaceSuccessor(DestBB
, NewBB
);
627 NewBB
->addSuccessor(DestBB
);
632 // In all other cases, try to place just before DestBB.
634 // TODO: For multiple far branches to the same destination, there are
635 // chances that some restore blocks could be shared if they clobber the
636 // same registers and share the same restore sequence. So far, those
637 // restore blocks are just duplicated for each far branch.
638 assert(!DestBB
->isEntryBlock());
639 MachineBasicBlock
*PrevBB
= &*std::prev(DestBB
->getIterator());
640 // Fall through only if PrevBB has no unconditional branch as one of its
642 if (auto *FT
= PrevBB
->getLogicalFallThrough()) {
643 assert(FT
== DestBB
);
644 TII
->insertUnconditionalBranch(*PrevBB
, FT
, DebugLoc());
645 BlockInfo
[PrevBB
->getNumber()].Size
= computeBlockSize(*PrevBB
);
647 // Now, RestoreBB could be placed directly before DestBB.
648 MF
->splice(DestBB
->getIterator(), RestoreBB
->getIterator());
649 // Update successors and predecessors.
650 RestoreBB
->addSuccessor(DestBB
);
651 BranchBB
->replaceSuccessor(DestBB
, RestoreBB
);
652 if (TRI
->trackLivenessAfterRegAlloc(*MF
))
653 computeAndAddLiveIns(LiveRegs
, *RestoreBB
);
654 // Compute the restore block size.
655 BlockInfo
[RestoreBB
->getNumber()].Size
= computeBlockSize(*RestoreBB
);
656 // Update the estimated offset for the restore block.
657 adjustBlockOffsets(*PrevBB
, DestBB
->getIterator());
659 // Fix up section information for RestoreBB and DestBB
660 RestoreBB
->setSectionID(DestBB
->getSectionID());
661 RestoreBB
->setIsBeginSection(DestBB
->isBeginSection());
662 DestBB
->setIsBeginSection(false);
663 RelaxedUnconditionals
.insert({BranchBB
, RestoreBB
});
665 // Remove restore block if it's not required.
666 MF
->erase(RestoreBB
);
667 RelaxedUnconditionals
.insert({BranchBB
, DestBB
});
673 bool BranchRelaxation::relaxBranchInstructions() {
674 bool Changed
= false;
676 // Relaxing branches involves creating new basic blocks, so re-eval
677 // end() for termination.
678 for (MachineBasicBlock
&MBB
: *MF
) {
680 MachineBasicBlock::iterator Last
= MBB
.getLastNonDebugInstr();
681 if (Last
== MBB
.end())
684 // Expand the unconditional branch first if necessary. If there is a
685 // conditional branch, this will end up changing the branch destination of
686 // it to be over the newly inserted indirect branch block, which may avoid
687 // the need to try expanding the conditional branch first, saving an extra
689 if (Last
->isUnconditionalBranch()) {
690 // Unconditional branch destination might be unanalyzable, assume these
692 if (MachineBasicBlock
*DestBB
= TII
->getBranchDestBlock(*Last
)) {
693 if (!isBlockInRange(*Last
, *DestBB
) && !TII
->isTailCall(*Last
) &&
694 !RelaxedUnconditionals
.contains({&MBB
, DestBB
})) {
695 fixupUnconditionalBranch(*Last
);
696 ++NumUnconditionalRelaxed
;
702 // Loop over the conditional branches.
703 MachineBasicBlock::iterator Next
;
704 for (MachineBasicBlock::iterator J
= MBB
.getFirstTerminator();
705 J
!= MBB
.end(); J
= Next
) {
707 MachineInstr
&MI
= *J
;
709 if (!MI
.isConditionalBranch())
712 if (MI
.getOpcode() == TargetOpcode::FAULTING_OP
)
713 // FAULTING_OP's destination is not encoded in the instruction stream
714 // and thus never needs relaxed.
717 MachineBasicBlock
*DestBB
= TII
->getBranchDestBlock(MI
);
718 if (!isBlockInRange(MI
, *DestBB
)) {
719 if (Next
!= MBB
.end() && Next
->isConditionalBranch()) {
720 // If there are multiple conditional branches, this isn't an
721 // analyzable block. Split later terminators into a new block so
722 // each one will be analyzable.
724 splitBlockBeforeInstr(*Next
, DestBB
);
726 fixupConditionalBranch(MI
);
727 ++NumConditionalRelaxed
;
732 // This may have modified all of the terminators, so start over.
733 Next
= MBB
.getFirstTerminator();
738 // If we relaxed a branch, we must recompute offsets for *all* basic blocks.
739 // Otherwise, we may underestimate branch distances and fail to relax a branch
740 // that has been pushed out of range.
742 adjustBlockOffsets(MF
->front());
747 bool BranchRelaxation::runOnMachineFunction(MachineFunction
&mf
) {
750 LLVM_DEBUG(dbgs() << "***** BranchRelaxation *****\n");
752 const TargetSubtargetInfo
&ST
= MF
->getSubtarget();
753 TII
= ST
.getInstrInfo();
754 TM
= &MF
->getTarget();
756 TRI
= ST
.getRegisterInfo();
757 if (TRI
->trackLivenessAfterRegAlloc(*MF
))
758 RS
.reset(new RegScavenger());
760 // Renumber all of the machine basic blocks in the function, guaranteeing that
761 // the numbers agree with the position of the block in the function.
762 MF
->RenumberBlocks();
764 // Do the initial scan of the function, building up information about the
765 // sizes of each block.
768 LLVM_DEBUG(dbgs() << " Basic blocks before relaxation\n"; dumpBBs(););
770 bool MadeChange
= false;
771 while (relaxBranchInstructions())
774 // After a while, this might be made debug-only, but it is not expensive.
777 LLVM_DEBUG(dbgs() << " Basic blocks after relaxation\n\n"; dumpBBs());
780 RelaxedUnconditionals
.clear();