1 //===------- LoopBoundSplit.cpp - Split Loop Bound --------------*- C++ -*-===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include "llvm/Transforms/Scalar/LoopBoundSplit.h"
10 #include "llvm/ADT/Sequence.h"
11 #include "llvm/Analysis/LoopAnalysisManager.h"
12 #include "llvm/Analysis/LoopInfo.h"
13 #include "llvm/Analysis/ScalarEvolution.h"
14 #include "llvm/Analysis/ScalarEvolutionExpressions.h"
15 #include "llvm/IR/PatternMatch.h"
16 #include "llvm/Transforms/Scalar/LoopPassManager.h"
17 #include "llvm/Transforms/Utils/BasicBlockUtils.h"
18 #include "llvm/Transforms/Utils/Cloning.h"
19 #include "llvm/Transforms/Utils/LoopSimplify.h"
20 #include "llvm/Transforms/Utils/ScalarEvolutionExpander.h"
22 #define DEBUG_TYPE "loop-bound-split"
26 using namespace PatternMatch
;
29 struct ConditionInfo
{
30 /// Branch instruction with this condition
31 BranchInst
*BI
= nullptr;
32 /// ICmp instruction with this condition
33 ICmpInst
*ICmp
= nullptr;
35 CmpPredicate Pred
= ICmpInst::BAD_ICMP_PREDICATE
;
37 Value
*AddRecValue
= nullptr;
38 /// Non PHI AddRec llvm value
39 Value
*NonPHIAddRecValue
;
41 Value
*BoundValue
= nullptr;
43 const SCEVAddRecExpr
*AddRecSCEV
= nullptr;
45 const SCEV
*BoundSCEV
= nullptr;
47 ConditionInfo() = default;
51 static void analyzeICmp(ScalarEvolution
&SE
, ICmpInst
*ICmp
,
52 ConditionInfo
&Cond
, const Loop
&L
) {
54 if (match(ICmp
, m_ICmp(Cond
.Pred
, m_Value(Cond
.AddRecValue
),
55 m_Value(Cond
.BoundValue
)))) {
56 const SCEV
*AddRecSCEV
= SE
.getSCEV(Cond
.AddRecValue
);
57 const SCEV
*BoundSCEV
= SE
.getSCEV(Cond
.BoundValue
);
58 const SCEVAddRecExpr
*LHSAddRecSCEV
= dyn_cast
<SCEVAddRecExpr
>(AddRecSCEV
);
59 const SCEVAddRecExpr
*RHSAddRecSCEV
= dyn_cast
<SCEVAddRecExpr
>(BoundSCEV
);
60 // Locate AddRec in LHSSCEV and Bound in RHSSCEV.
61 if (!LHSAddRecSCEV
&& RHSAddRecSCEV
) {
62 std::swap(Cond
.AddRecValue
, Cond
.BoundValue
);
63 std::swap(AddRecSCEV
, BoundSCEV
);
64 Cond
.Pred
= ICmpInst::getSwappedPredicate(Cond
.Pred
);
67 Cond
.AddRecSCEV
= dyn_cast
<SCEVAddRecExpr
>(AddRecSCEV
);
68 Cond
.BoundSCEV
= BoundSCEV
;
69 Cond
.NonPHIAddRecValue
= Cond
.AddRecValue
;
71 // If the Cond.AddRecValue is PHI node, update Cond.NonPHIAddRecValue with
72 // value from backedge.
73 if (Cond
.AddRecSCEV
&& isa
<PHINode
>(Cond
.AddRecValue
)) {
74 PHINode
*PN
= cast
<PHINode
>(Cond
.AddRecValue
);
75 Cond
.NonPHIAddRecValue
= PN
->getIncomingValueForBlock(L
.getLoopLatch());
80 static bool calculateUpperBound(const Loop
&L
, ScalarEvolution
&SE
,
81 ConditionInfo
&Cond
, bool IsExitCond
) {
83 const SCEV
*ExitCount
= SE
.getExitCount(&L
, Cond
.ICmp
->getParent());
84 if (isa
<SCEVCouldNotCompute
>(ExitCount
))
87 Cond
.BoundSCEV
= ExitCount
;
91 // For non-exit condtion, if pred is LT, keep existing bound.
92 if (Cond
.Pred
== ICmpInst::ICMP_SLT
|| Cond
.Pred
== ICmpInst::ICMP_ULT
)
95 // For non-exit condition, if pre is LE, try to convert it to LT.
97 // AddRec <= Bound --> AddRec < Bound + 1
98 if (Cond
.Pred
!= ICmpInst::ICMP_ULE
&& Cond
.Pred
!= ICmpInst::ICMP_SLE
)
101 if (IntegerType
*BoundSCEVIntType
=
102 dyn_cast
<IntegerType
>(Cond
.BoundSCEV
->getType())) {
103 unsigned BitWidth
= BoundSCEVIntType
->getBitWidth();
104 APInt Max
= ICmpInst::isSigned(Cond
.Pred
)
105 ? APInt::getSignedMaxValue(BitWidth
)
106 : APInt::getMaxValue(BitWidth
);
107 const SCEV
*MaxSCEV
= SE
.getConstant(Max
);
108 // Check Bound < INT_MAX
109 ICmpInst::Predicate Pred
=
110 ICmpInst::isSigned(Cond
.Pred
) ? ICmpInst::ICMP_SLT
: ICmpInst::ICMP_ULT
;
111 if (SE
.isKnownPredicate(Pred
, Cond
.BoundSCEV
, MaxSCEV
)) {
112 const SCEV
*BoundPlusOneSCEV
=
113 SE
.getAddExpr(Cond
.BoundSCEV
, SE
.getOne(BoundSCEVIntType
));
114 Cond
.BoundSCEV
= BoundPlusOneSCEV
;
120 // ToDo: Support ICMP_NE/EQ.
125 static bool hasProcessableCondition(const Loop
&L
, ScalarEvolution
&SE
,
126 ICmpInst
*ICmp
, ConditionInfo
&Cond
,
128 analyzeICmp(SE
, ICmp
, Cond
, L
);
130 // The BoundSCEV should be evaluated at loop entry.
131 if (!SE
.isAvailableAtLoopEntry(Cond
.BoundSCEV
, &L
))
134 // Allowed AddRec as induction variable.
135 if (!Cond
.AddRecSCEV
)
138 if (!Cond
.AddRecSCEV
->isAffine())
141 const SCEV
*StepRecSCEV
= Cond
.AddRecSCEV
->getStepRecurrence(SE
);
142 // Allowed constant step.
143 if (!isa
<SCEVConstant
>(StepRecSCEV
))
146 ConstantInt
*StepCI
= cast
<SCEVConstant
>(StepRecSCEV
)->getValue();
147 // Allowed positive step for now.
148 // TODO: Support negative step.
149 if (StepCI
->isNegative() || StepCI
->isZero())
152 // Calculate upper bound.
153 if (!calculateUpperBound(L
, SE
, Cond
, IsExitCond
))
159 static bool isProcessableCondBI(const ScalarEvolution
&SE
,
160 const BranchInst
*BI
) {
161 BasicBlock
*TrueSucc
= nullptr;
162 BasicBlock
*FalseSucc
= nullptr;
164 if (!match(BI
, m_Br(m_ICmp(m_Value(LHS
), m_Value(RHS
)),
165 m_BasicBlock(TrueSucc
), m_BasicBlock(FalseSucc
))))
168 if (!SE
.isSCEVable(LHS
->getType()))
170 assert(SE
.isSCEVable(RHS
->getType()) && "Expected RHS's type is SCEVable");
172 if (TrueSucc
== FalseSucc
)
178 static bool canSplitLoopBound(const Loop
&L
, const DominatorTree
&DT
,
179 ScalarEvolution
&SE
, ConditionInfo
&Cond
) {
180 // Skip function with optsize.
181 if (L
.getHeader()->getParent()->hasOptSize())
184 // Split only innermost loop.
185 if (!L
.isInnermost())
188 // Check loop is in simplified form.
189 if (!L
.isLoopSimplifyForm())
192 // Check loop is in LCSSA form.
193 if (!L
.isLCSSAForm(DT
))
196 // Skip loop that cannot be cloned.
197 if (!L
.isSafeToClone())
200 BasicBlock
*ExitingBB
= L
.getExitingBlock();
201 // Assumed only one exiting block.
205 BranchInst
*ExitingBI
= dyn_cast
<BranchInst
>(ExitingBB
->getTerminator());
209 // Allowed only conditional branch with ICmp.
210 if (!isProcessableCondBI(SE
, ExitingBI
))
213 // Check the condition is processable.
214 ICmpInst
*ICmp
= cast
<ICmpInst
>(ExitingBI
->getCondition());
215 if (!hasProcessableCondition(L
, SE
, ICmp
, Cond
, /*IsExitCond*/ true))
222 static bool isProfitableToTransform(const Loop
&L
, const BranchInst
*BI
) {
223 // If the conditional branch splits a loop into two halves, we could
224 // generally say it is profitable.
226 // ToDo: Add more profitable cases here.
228 // Check this branch causes diamond CFG.
229 BasicBlock
*Succ0
= BI
->getSuccessor(0);
230 BasicBlock
*Succ1
= BI
->getSuccessor(1);
232 BasicBlock
*Succ0Succ
= Succ0
->getSingleSuccessor();
233 BasicBlock
*Succ1Succ
= Succ1
->getSingleSuccessor();
234 if (!Succ0Succ
|| !Succ1Succ
|| Succ0Succ
!= Succ1Succ
)
237 // ToDo: Calculate each successor's instruction cost.
242 static BranchInst
*findSplitCandidate(const Loop
&L
, ScalarEvolution
&SE
,
243 ConditionInfo
&ExitingCond
,
244 ConditionInfo
&SplitCandidateCond
) {
245 for (auto *BB
: L
.blocks()) {
246 // Skip condition of backedge.
247 if (L
.getLoopLatch() == BB
)
250 auto *BI
= dyn_cast
<BranchInst
>(BB
->getTerminator());
254 // Check conditional branch with ICmp.
255 if (!isProcessableCondBI(SE
, BI
))
258 // Skip loop invariant condition.
259 if (L
.isLoopInvariant(BI
->getCondition()))
262 // Check the condition is processable.
263 ICmpInst
*ICmp
= cast
<ICmpInst
>(BI
->getCondition());
264 if (!hasProcessableCondition(L
, SE
, ICmp
, SplitCandidateCond
,
265 /*IsExitCond*/ false))
268 if (ExitingCond
.BoundSCEV
->getType() !=
269 SplitCandidateCond
.BoundSCEV
->getType())
272 // After transformation, we assume the split condition of the pre-loop is
273 // always true. In order to guarantee it, we need to check the start value
274 // of the split cond AddRec satisfies the split condition.
275 if (!SE
.isLoopEntryGuardedByCond(&L
, SplitCandidateCond
.Pred
,
276 SplitCandidateCond
.AddRecSCEV
->getStart(),
277 SplitCandidateCond
.BoundSCEV
))
280 SplitCandidateCond
.BI
= BI
;
287 static bool splitLoopBound(Loop
&L
, DominatorTree
&DT
, LoopInfo
&LI
,
288 ScalarEvolution
&SE
, LPMUpdater
&U
) {
289 ConditionInfo SplitCandidateCond
;
290 ConditionInfo ExitingCond
;
292 // Check we can split this loop's bound.
293 if (!canSplitLoopBound(L
, DT
, SE
, ExitingCond
))
296 if (!findSplitCandidate(L
, SE
, ExitingCond
, SplitCandidateCond
))
299 if (!isProfitableToTransform(L
, SplitCandidateCond
.BI
))
302 // Now, we have a split candidate. Let's build a form as below.
303 // +--------------------+
305 // | set up newbound |
306 // +--------------------+
307 // | /----------------\
308 // +--------v----v------+ |
310 // | with true condition| | |
311 // +--------------------+ | |
313 // +--------v-----------+ | |
314 // | if.then.BB | | |
315 // +--------------------+ | |
317 // +--------v-----------<---/ |
318 // | latch >----------/
320 // +--------------------+
322 // +--------v-----------+
323 // | preheader2 |--------------\
324 // | if (AddRec i != | |
326 // +--------------------+ |
327 // | /----------------\ |
328 // +--------v----v------+ | |
329 // | header2 |---\ | |
330 // | conditional branch | | | |
331 // |with false condition| | | |
332 // +--------------------+ | | |
334 // +--------v-----------+ | | |
335 // | if.then.BB2 | | | |
336 // +--------------------+ | | |
338 // +--------v-----------<---/ | |
339 // | latch2 >----------/ |
340 // | with org bound | |
341 // +--------v-----------+ |
343 // | +---------------+ |
344 // +--> exit <-------/
347 // Let's create post loop.
348 SmallVector
<BasicBlock
*, 8> PostLoopBlocks
;
350 ValueToValueMapTy VMap
;
351 BasicBlock
*PreHeader
= L
.getLoopPreheader();
352 BasicBlock
*SplitLoopPH
= SplitEdge(PreHeader
, L
.getHeader(), &DT
, &LI
);
353 PostLoop
= cloneLoopWithPreheader(L
.getExitBlock(), SplitLoopPH
, &L
, VMap
,
354 ".split", &LI
, &DT
, PostLoopBlocks
);
355 remapInstructionsInBlocks(PostLoopBlocks
, VMap
);
357 BasicBlock
*PostLoopPreHeader
= PostLoop
->getLoopPreheader();
358 IRBuilder
<> Builder(&PostLoopPreHeader
->front());
360 // Update phi nodes in header of post-loop.
361 bool isExitingLatch
=
362 (L
.getExitingBlock() == L
.getLoopLatch()) ? true : false;
363 Value
*ExitingCondLCSSAPhi
= nullptr;
364 for (PHINode
&PN
: L
.getHeader()->phis()) {
365 // Create LCSSA phi node in preheader of post-loop.
367 Builder
.CreatePHI(PN
.getType(), 1, PN
.getName() + ".lcssa");
368 LCSSAPhi
->setDebugLoc(PN
.getDebugLoc());
369 // If the exiting block is loop latch, the phi does not have the update at
370 // last iteration. In this case, update lcssa phi with value from backedge.
371 LCSSAPhi
->addIncoming(
372 isExitingLatch
? PN
.getIncomingValueForBlock(L
.getLoopLatch()) : &PN
,
373 L
.getExitingBlock());
375 // Update the start value of phi node in post-loop with the LCSSA phi node.
376 PHINode
*PostLoopPN
= cast
<PHINode
>(VMap
[&PN
]);
377 PostLoopPN
->setIncomingValueForBlock(PostLoopPreHeader
, LCSSAPhi
);
379 // Find PHI with exiting condition from pre-loop. The PHI should be
380 // SCEVAddRecExpr and have same incoming value from backedge with
382 if (!SE
.isSCEVable(PN
.getType()))
385 const SCEVAddRecExpr
*PhiSCEV
= dyn_cast
<SCEVAddRecExpr
>(SE
.getSCEV(&PN
));
386 if (PhiSCEV
&& ExitingCond
.NonPHIAddRecValue
==
387 PN
.getIncomingValueForBlock(L
.getLoopLatch()))
388 ExitingCondLCSSAPhi
= LCSSAPhi
;
391 // Add conditional branch to check we can skip post-loop in its preheader.
392 Instruction
*OrigBI
= PostLoopPreHeader
->getTerminator();
393 ICmpInst::Predicate Pred
= ICmpInst::ICMP_NE
;
395 Builder
.CreateICmp(Pred
, ExitingCondLCSSAPhi
, ExitingCond
.BoundValue
);
396 Builder
.CreateCondBr(Cond
, PostLoop
->getHeader(), PostLoop
->getExitBlock());
397 OrigBI
->eraseFromParent();
399 // Create new loop bound and add it into preheader of pre-loop.
400 const SCEV
*NewBoundSCEV
= ExitingCond
.BoundSCEV
;
401 const SCEV
*SplitBoundSCEV
= SplitCandidateCond
.BoundSCEV
;
402 NewBoundSCEV
= ICmpInst::isSigned(ExitingCond
.Pred
)
403 ? SE
.getSMinExpr(NewBoundSCEV
, SplitBoundSCEV
)
404 : SE
.getUMinExpr(NewBoundSCEV
, SplitBoundSCEV
);
406 SCEVExpander
Expander(
407 SE
, L
.getHeader()->getDataLayout(), "split");
408 Instruction
*InsertPt
= SplitLoopPH
->getTerminator();
409 Value
*NewBoundValue
=
410 Expander
.expandCodeFor(NewBoundSCEV
, NewBoundSCEV
->getType(), InsertPt
);
411 NewBoundValue
->setName("new.bound");
413 // Replace exiting bound value of pre-loop NewBound.
414 ExitingCond
.ICmp
->setOperand(1, NewBoundValue
);
416 // Replace SplitCandidateCond.BI's condition of pre-loop by True.
417 LLVMContext
&Context
= PreHeader
->getContext();
418 SplitCandidateCond
.BI
->setCondition(ConstantInt::getTrue(Context
));
420 // Replace cloned SplitCandidateCond.BI's condition in post-loop by False.
421 BranchInst
*ClonedSplitCandidateBI
=
422 cast
<BranchInst
>(VMap
[SplitCandidateCond
.BI
]);
423 ClonedSplitCandidateBI
->setCondition(ConstantInt::getFalse(Context
));
425 // Replace exit branch target of pre-loop by post-loop's preheader.
426 if (L
.getExitBlock() == ExitingCond
.BI
->getSuccessor(0))
427 ExitingCond
.BI
->setSuccessor(0, PostLoopPreHeader
);
429 ExitingCond
.BI
->setSuccessor(1, PostLoopPreHeader
);
431 // Update phi node in exit block of post-loop.
432 Builder
.SetInsertPoint(PostLoopPreHeader
, PostLoopPreHeader
->begin());
433 for (PHINode
&PN
: PostLoop
->getExitBlock()->phis()) {
434 for (auto i
: seq
<int>(0, PN
.getNumOperands())) {
435 // Check incoming block is pre-loop's exiting block.
436 if (PN
.getIncomingBlock(i
) == L
.getExitingBlock()) {
437 Value
*IncomingValue
= PN
.getIncomingValue(i
);
439 // Create LCSSA phi node for incoming value.
441 Builder
.CreatePHI(PN
.getType(), 1, PN
.getName() + ".lcssa");
442 LCSSAPhi
->setDebugLoc(PN
.getDebugLoc());
443 LCSSAPhi
->addIncoming(IncomingValue
, PN
.getIncomingBlock(i
));
445 // Replace pre-loop's exiting block by post-loop's preheader.
446 PN
.setIncomingBlock(i
, PostLoopPreHeader
);
447 // Replace incoming value by LCSSAPhi.
448 PN
.setIncomingValue(i
, LCSSAPhi
);
449 // Add a new incoming value with post-loop's exiting block.
450 PN
.addIncoming(VMap
[IncomingValue
], PostLoop
->getExitingBlock());
455 // Update dominator tree.
456 DT
.changeImmediateDominator(PostLoopPreHeader
, L
.getExitingBlock());
457 DT
.changeImmediateDominator(PostLoop
->getExitBlock(), PostLoopPreHeader
);
459 // Invalidate cached SE information.
462 // Canonicalize loops.
463 simplifyLoop(&L
, &DT
, &LI
, &SE
, nullptr, nullptr, true);
464 simplifyLoop(PostLoop
, &DT
, &LI
, &SE
, nullptr, nullptr, true);
466 // Add new post-loop to loop pass manager.
467 U
.addSiblingLoops(PostLoop
);
472 PreservedAnalyses
LoopBoundSplitPass::run(Loop
&L
, LoopAnalysisManager
&AM
,
473 LoopStandardAnalysisResults
&AR
,
475 Function
&F
= *L
.getHeader()->getParent();
478 LLVM_DEBUG(dbgs() << "Spliting bound of loop in " << F
.getName() << ": " << L
481 if (!splitLoopBound(L
, AR
.DT
, AR
.LI
, AR
.SE
, U
))
482 return PreservedAnalyses::all();
484 assert(AR
.DT
.verify(DominatorTree::VerificationLevel::Fast
));
487 return getLoopPassPreservedAnalyses();
490 } // end namespace llvm