llvm/lib/Transforms/Utils/SimplifyIndVar.cpp

   1 //===-- SimplifyIndVar.cpp - Induction variable simplification ------------===//
   2 //
   3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
   4 // See https://llvm.org/LICENSE.txt for license information.
   5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
   6 //
   7 //===----------------------------------------------------------------------===//
   8 //
   9 // This file implements induction variable simplification. It does
  10 // not define any actual pass or policy, but provides a single function to
  11 // simplify a loop's induction variables based on ScalarEvolution.
  12 //
  13 //===----------------------------------------------------------------------===//
  14
  15 #include "llvm/Transforms/Utils/SimplifyIndVar.h"
  16 #include "llvm/ADT/SmallVector.h"
  17 #include "llvm/ADT/Statistic.h"
  18 #include "llvm/Analysis/LoopInfo.h"
  19 #include "llvm/IR/Dominators.h"
  20 #include "llvm/IR/IRBuilder.h"
  21 #include "llvm/IR/Instructions.h"
  22 #include "llvm/IR/IntrinsicInst.h"
  23 #include "llvm/IR/PatternMatch.h"
  24 #include "llvm/Support/Debug.h"
  25 #include "llvm/Support/raw_ostream.h"
  26 #include "llvm/Transforms/Utils/Local.h"
  27 #include "llvm/Transforms/Utils/ScalarEvolutionExpander.h"
  28
  29 using namespace llvm;
  30
  31 #define DEBUG_TYPE "indvars"
  32
  33 STATISTIC(NumElimIdentity, "Number of IV identities eliminated");
  34 STATISTIC(NumElimOperand,  "Number of IV operands folded into a use");
  35 STATISTIC(NumFoldedUser, "Number of IV users folded into a constant");
  36 STATISTIC(NumElimRem     , "Number of IV remainder operations eliminated");
  37 STATISTIC(
  38     NumSimplifiedSDiv,
  39     "Number of IV signed division operations converted to unsigned division");
  40 STATISTIC(
  41     NumSimplifiedSRem,
  42     "Number of IV signed remainder operations converted to unsigned remainder");
  43 STATISTIC(NumElimCmp     , "Number of IV comparisons eliminated");
  44
  45 namespace {
  46   /// This is a utility for simplifying induction variables
  47   /// based on ScalarEvolution. It is the primary instrument of the
  48   /// IndvarSimplify pass, but it may also be directly invoked to cleanup after
  49   /// other loop passes that preserve SCEV.
  50   class SimplifyIndvar {
  51     Loop             *L;
  52     LoopInfo         *LI;
  53     ScalarEvolution  *SE;
  54     DominatorTree    *DT;
  55     const TargetTransformInfo *TTI;
  56     SCEVExpander     &Rewriter;
  57     SmallVectorImpl<WeakTrackingVH> &DeadInsts;
  58
  59     bool Changed = false;
  60
  61   public:
  62     SimplifyIndvar(Loop *Loop, ScalarEvolution *SE, DominatorTree *DT,
  63                    LoopInfo *LI, const TargetTransformInfo *TTI,
  64                    SCEVExpander &Rewriter,
  65                    SmallVectorImpl<WeakTrackingVH> &Dead)
  66         : L(Loop), LI(LI), SE(SE), DT(DT), TTI(TTI), Rewriter(Rewriter),
  67           DeadInsts(Dead) {
  68       assert(LI && "IV simplification requires LoopInfo");
  69     }
  70
  71     bool hasChanged() const { return Changed; }
  72
  73     /// Iteratively perform simplification on a worklist of users of the
  74     /// specified induction variable. This is the top-level driver that applies
  75     /// all simplifications to users of an IV.
  76     void simplifyUsers(PHINode *CurrIV, IVVisitor *V = nullptr);
  77
  78     Value *foldIVUser(Instruction *UseInst, Instruction *IVOperand);
  79
  80     bool eliminateIdentitySCEV(Instruction *UseInst, Instruction *IVOperand);
  81     bool replaceIVUserWithLoopInvariant(Instruction *UseInst);
  82     bool replaceFloatIVWithIntegerIV(Instruction *UseInst);
  83
  84     bool eliminateOverflowIntrinsic(WithOverflowInst *WO);
  85     bool eliminateSaturatingIntrinsic(SaturatingInst *SI);
  86     bool eliminateTrunc(TruncInst *TI);
  87     bool eliminateIVUser(Instruction *UseInst, Instruction *IVOperand);
  88     bool makeIVComparisonInvariant(ICmpInst *ICmp, Instruction *IVOperand);
  89     void eliminateIVComparison(ICmpInst *ICmp, Instruction *IVOperand);
  90     void simplifyIVRemainder(BinaryOperator *Rem, Instruction *IVOperand,
  91                              bool IsSigned);
  92     void replaceRemWithNumerator(BinaryOperator *Rem);
  93     void replaceRemWithNumeratorOrZero(BinaryOperator *Rem);
  94     void replaceSRemWithURem(BinaryOperator *Rem);
  95     bool eliminateSDiv(BinaryOperator *SDiv);
  96     bool strengthenBinaryOp(BinaryOperator *BO, Instruction *IVOperand);
  97     bool strengthenOverflowingOperation(BinaryOperator *OBO,
  98                                         Instruction *IVOperand);
  99     bool strengthenRightShift(BinaryOperator *BO, Instruction *IVOperand);
 100   };
 101 }
 102
 103 /// Find a point in code which dominates all given instructions. We can safely
 104 /// assume that, whatever fact we can prove at the found point, this fact is
 105 /// also true for each of the given instructions.
 106 static Instruction *findCommonDominator(ArrayRef<Instruction *> Instructions,
 107                                         DominatorTree &DT) {
 108   Instruction *CommonDom = nullptr;
 109   for (auto *Insn : Instructions)
 110     CommonDom =
 111         CommonDom ? DT.findNearestCommonDominator(CommonDom, Insn) : Insn;
 112   assert(CommonDom && "Common dominator not found?");
 113   return CommonDom;
 114 }
 115
 116 /// Fold an IV operand into its use.  This removes increments of an
 117 /// aligned IV when used by a instruction that ignores the low bits.
 118 ///
 119 /// IVOperand is guaranteed SCEVable, but UseInst may not be.
 120 ///
 121 /// Return the operand of IVOperand for this induction variable if IVOperand can
 122 /// be folded (in case more folding opportunities have been exposed).
 123 /// Otherwise return null.
 124 Value *SimplifyIndvar::foldIVUser(Instruction *UseInst, Instruction *IVOperand) {
 125   Value *IVSrc = nullptr;
 126   const unsigned OperIdx = 0;
 127   const SCEV *FoldedExpr = nullptr;
 128   bool MustDropExactFlag = false;
 129   switch (UseInst->getOpcode()) {
 130   default:
 131     return nullptr;
 132   case Instruction::UDiv:
 133   case Instruction::LShr:
 134     // We're only interested in the case where we know something about
 135     // the numerator and have a constant denominator.
 136     if (IVOperand != UseInst->getOperand(OperIdx) ||
 137         !isa<ConstantInt>(UseInst->getOperand(1)))
 138       return nullptr;
 139
 140     // Attempt to fold a binary operator with constant operand.
 141     // e.g. ((I + 1) >> 2) => I >> 2
 142     if (!isa<BinaryOperator>(IVOperand)
 143         || !isa<ConstantInt>(IVOperand->getOperand(1)))
 144       return nullptr;
 145
 146     IVSrc = IVOperand->getOperand(0);
 147     // IVSrc must be the (SCEVable) IV, since the other operand is const.
 148     assert(SE->isSCEVable(IVSrc->getType()) && "Expect SCEVable IV operand");
 149
 150     ConstantInt *D = cast<ConstantInt>(UseInst->getOperand(1));
 151     if (UseInst->getOpcode() == Instruction::LShr) {
 152       // Get a constant for the divisor. See createSCEV.
 153       uint32_t BitWidth = cast<IntegerType>(UseInst->getType())->getBitWidth();
 154       if (D->getValue().uge(BitWidth))
 155         return nullptr;
 156
 157       D = ConstantInt::get(UseInst->getContext(),
 158                            APInt::getOneBitSet(BitWidth, D->getZExtValue()));
 159     }
 160     const auto *LHS = SE->getSCEV(IVSrc);
 161     const auto *RHS = SE->getSCEV(D);
 162     FoldedExpr = SE->getUDivExpr(LHS, RHS);
 163     // We might have 'exact' flag set at this point which will no longer be
 164     // correct after we make the replacement.
 165     if (UseInst->isExact() && LHS != SE->getMulExpr(FoldedExpr, RHS))
 166       MustDropExactFlag = true;
 167   }
 168   // We have something that might fold it's operand. Compare SCEVs.
 169   if (!SE->isSCEVable(UseInst->getType()))
 170     return nullptr;
 171
 172   // Bypass the operand if SCEV can prove it has no effect.
 173   if (SE->getSCEV(UseInst) != FoldedExpr)
 174     return nullptr;
 175
 176   LLVM_DEBUG(dbgs() << "INDVARS: Eliminated IV operand: " << *IVOperand
 177                     << " -> " << *UseInst << '\n');
 178
 179   UseInst->setOperand(OperIdx, IVSrc);
 180   assert(SE->getSCEV(UseInst) == FoldedExpr && "bad SCEV with folded oper");
 181
 182   if (MustDropExactFlag)
 183     UseInst->dropPoisonGeneratingFlags();
 184
 185   ++NumElimOperand;
 186   Changed = true;
 187   if (IVOperand->use_empty())
 188     DeadInsts.emplace_back(IVOperand);
 189   return IVSrc;
 190 }
 191
 192 bool SimplifyIndvar::makeIVComparisonInvariant(ICmpInst *ICmp,
 193                                                Instruction *IVOperand) {
 194   auto *Preheader = L->getLoopPreheader();
 195   if (!Preheader)
 196     return false;
 197   unsigned IVOperIdx = 0;
 198   ICmpInst::Predicate Pred = ICmp->getPredicate();
 199   if (IVOperand != ICmp->getOperand(0)) {
 200     // Swapped
 201     assert(IVOperand == ICmp->getOperand(1) && "Can't find IVOperand");
 202     IVOperIdx = 1;
 203     Pred = ICmpInst::getSwappedPredicate(Pred);
 204   }
 205
 206   // Get the SCEVs for the ICmp operands (in the specific context of the
 207   // current loop)
 208   const Loop *ICmpLoop = LI->getLoopFor(ICmp->getParent());
 209   const SCEV *S = SE->getSCEVAtScope(ICmp->getOperand(IVOperIdx), ICmpLoop);
 210   const SCEV *X = SE->getSCEVAtScope(ICmp->getOperand(1 - IVOperIdx), ICmpLoop);
 211   auto LIP = SE->getLoopInvariantPredicate(Pred, S, X, L, ICmp);
 212   if (!LIP)
 213     return false;
 214   ICmpInst::Predicate InvariantPredicate = LIP->Pred;
 215   const SCEV *InvariantLHS = LIP->LHS;
 216   const SCEV *InvariantRHS = LIP->RHS;
 217
 218   // Do not generate something ridiculous.
 219   auto *PHTerm = Preheader->getTerminator();
 220   if (Rewriter.isHighCostExpansion({InvariantLHS, InvariantRHS}, L,
 221                                    2 * SCEVCheapExpansionBudget, TTI, PHTerm) ||
 222       !Rewriter.isSafeToExpandAt(InvariantLHS, PHTerm) ||
 223       !Rewriter.isSafeToExpandAt(InvariantRHS, PHTerm))
 224     return false;
 225   auto *NewLHS =
 226       Rewriter.expandCodeFor(InvariantLHS, IVOperand->getType(), PHTerm);
 227   auto *NewRHS =
 228       Rewriter.expandCodeFor(InvariantRHS, IVOperand->getType(), PHTerm);
 229   LLVM_DEBUG(dbgs() << "INDVARS: Simplified comparison: " << *ICmp << '\n');
 230   ICmp->setPredicate(InvariantPredicate);
 231   ICmp->setOperand(0, NewLHS);
 232   ICmp->setOperand(1, NewRHS);
 233   return true;
 234 }
 235
 236 /// SimplifyIVUsers helper for eliminating useless
 237 /// comparisons against an induction variable.
 238 void SimplifyIndvar::eliminateIVComparison(ICmpInst *ICmp,
 239                                            Instruction *IVOperand) {
 240   unsigned IVOperIdx = 0;
 241   ICmpInst::Predicate Pred = ICmp->getPredicate();
 242   ICmpInst::Predicate OriginalPred = Pred;
 243   if (IVOperand != ICmp->getOperand(0)) {
 244     // Swapped
 245     assert(IVOperand == ICmp->getOperand(1) && "Can't find IVOperand");
 246     IVOperIdx = 1;
 247     Pred = ICmpInst::getSwappedPredicate(Pred);
 248   }
 249
 250   // Get the SCEVs for the ICmp operands (in the specific context of the
 251   // current loop)
 252   const Loop *ICmpLoop = LI->getLoopFor(ICmp->getParent());
 253   const SCEV *S = SE->getSCEVAtScope(ICmp->getOperand(IVOperIdx), ICmpLoop);
 254   const SCEV *X = SE->getSCEVAtScope(ICmp->getOperand(1 - IVOperIdx), ICmpLoop);
 255
 256   // If the condition is always true or always false in the given context,
 257   // replace it with a constant value.
 258   SmallVector<Instruction *, 4> Users;
 259   for (auto *U : ICmp->users())
 260     Users.push_back(cast<Instruction>(U));
 261   const Instruction *CtxI = findCommonDominator(Users, *DT);
 262   if (auto Ev = SE->evaluatePredicateAt(Pred, S, X, CtxI)) {
 263     SE->forgetValue(ICmp);
 264     ICmp->replaceAllUsesWith(ConstantInt::getBool(ICmp->getContext(), *Ev));
 265     DeadInsts.emplace_back(ICmp);
 266     LLVM_DEBUG(dbgs() << "INDVARS: Eliminated comparison: " << *ICmp << '\n');
 267   } else if (makeIVComparisonInvariant(ICmp, IVOperand)) {
 268     // fallthrough to end of function
 269   } else if (ICmpInst::isSigned(OriginalPred) &&
 270              SE->isKnownNonNegative(S) && SE->isKnownNonNegative(X)) {
 271     // If we were unable to make anything above, all we can is to canonicalize
 272     // the comparison hoping that it will open the doors for other
 273     // optimizations. If we find out that we compare two non-negative values,
 274     // we turn the instruction's predicate to its unsigned version. Note that
 275     // we cannot rely on Pred here unless we check if we have swapped it.
 276     assert(ICmp->getPredicate() == OriginalPred && "Predicate changed?");
 277     LLVM_DEBUG(dbgs() << "INDVARS: Turn to unsigned comparison: " << *ICmp
 278                       << '\n');
 279     ICmp->setPredicate(ICmpInst::getUnsignedPredicate(OriginalPred));
 280   } else
 281     return;
 282
 283   ++NumElimCmp;
 284   Changed = true;
 285 }
 286
 287 bool SimplifyIndvar::eliminateSDiv(BinaryOperator *SDiv) {
 288   // Get the SCEVs for the ICmp operands.
 289   auto *N = SE->getSCEV(SDiv->getOperand(0));
 290   auto *D = SE->getSCEV(SDiv->getOperand(1));
 291
 292   // Simplify unnecessary loops away.
 293   const Loop *L = LI->getLoopFor(SDiv->getParent());
 294   N = SE->getSCEVAtScope(N, L);
 295   D = SE->getSCEVAtScope(D, L);
 296
 297   // Replace sdiv by udiv if both of the operands are non-negative
 298   if (SE->isKnownNonNegative(N) && SE->isKnownNonNegative(D)) {
 299     auto *UDiv = BinaryOperator::Create(
 300         BinaryOperator::UDiv, SDiv->getOperand(0), SDiv->getOperand(1),
 301         SDiv->getName() + ".udiv", SDiv);
 302     UDiv->setIsExact(SDiv->isExact());
 303     SDiv->replaceAllUsesWith(UDiv);
 304     LLVM_DEBUG(dbgs() << "INDVARS: Simplified sdiv: " << *SDiv << '\n');
 305     ++NumSimplifiedSDiv;
 306     Changed = true;
 307     DeadInsts.push_back(SDiv);
 308     return true;
 309   }
 310
 311   return false;
 312 }
 313
 314 // i %s n -> i %u n if i >= 0 and n >= 0
 315 void SimplifyIndvar::replaceSRemWithURem(BinaryOperator *Rem) {
 316   auto *N = Rem->getOperand(0), *D = Rem->getOperand(1);
 317   auto *URem = BinaryOperator::Create(BinaryOperator::URem, N, D,
 318                                       Rem->getName() + ".urem", Rem);
 319   Rem->replaceAllUsesWith(URem);
 320   LLVM_DEBUG(dbgs() << "INDVARS: Simplified srem: " << *Rem << '\n');
 321   ++NumSimplifiedSRem;
 322   Changed = true;
 323   DeadInsts.emplace_back(Rem);
 324 }
 325
 326 // i % n  -->  i  if i is in [0,n).
 327 void SimplifyIndvar::replaceRemWithNumerator(BinaryOperator *Rem) {
 328   Rem->replaceAllUsesWith(Rem->getOperand(0));
 329   LLVM_DEBUG(dbgs() << "INDVARS: Simplified rem: " << *Rem << '\n');
 330   ++NumElimRem;
 331   Changed = true;
 332   DeadInsts.emplace_back(Rem);
 333 }
 334
 335 // (i+1) % n  -->  (i+1)==n?0:(i+1)  if i is in [0,n).
 336 void SimplifyIndvar::replaceRemWithNumeratorOrZero(BinaryOperator *Rem) {
 337   auto *T = Rem->getType();
 338   auto *N = Rem->getOperand(0), *D = Rem->getOperand(1);
 339   ICmpInst *ICmp = new ICmpInst(Rem, ICmpInst::ICMP_EQ, N, D);
 340   SelectInst *Sel =
 341       SelectInst::Create(ICmp, ConstantInt::get(T, 0), N, "iv.rem", Rem);
 342   Rem->replaceAllUsesWith(Sel);
 343   LLVM_DEBUG(dbgs() << "INDVARS: Simplified rem: " << *Rem << '\n');
 344   ++NumElimRem;
 345   Changed = true;
 346   DeadInsts.emplace_back(Rem);
 347 }
 348
 349 /// SimplifyIVUsers helper for eliminating useless remainder operations
 350 /// operating on an induction variable or replacing srem by urem.
 351 void SimplifyIndvar::simplifyIVRemainder(BinaryOperator *Rem,
 352                                          Instruction *IVOperand,
 353                                          bool IsSigned) {
 354   auto *NValue = Rem->getOperand(0);
 355   auto *DValue = Rem->getOperand(1);
 356   // We're only interested in the case where we know something about
 357   // the numerator, unless it is a srem, because we want to replace srem by urem
 358   // in general.
 359   bool UsedAsNumerator = IVOperand == NValue;
 360   if (!UsedAsNumerator && !IsSigned)
 361     return;
 362
 363   const SCEV *N = SE->getSCEV(NValue);
 364
 365   // Simplify unnecessary loops away.
 366   const Loop *ICmpLoop = LI->getLoopFor(Rem->getParent());
 367   N = SE->getSCEVAtScope(N, ICmpLoop);
 368
 369   bool IsNumeratorNonNegative = !IsSigned || SE->isKnownNonNegative(N);
 370
 371   // Do not proceed if the Numerator may be negative
 372   if (!IsNumeratorNonNegative)
 373     return;
 374
 375   const SCEV *D = SE->getSCEV(DValue);
 376   D = SE->getSCEVAtScope(D, ICmpLoop);
 377
 378   if (UsedAsNumerator) {
 379     auto LT = IsSigned ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_ULT;
 380     if (SE->isKnownPredicate(LT, N, D)) {
 381       replaceRemWithNumerator(Rem);
 382       return;
 383     }
 384
 385     auto *T = Rem->getType();
 386     const auto *NLessOne = SE->getMinusSCEV(N, SE->getOne(T));
 387     if (SE->isKnownPredicate(LT, NLessOne, D)) {
 388       replaceRemWithNumeratorOrZero(Rem);
 389       return;
 390     }
 391   }
 392
 393   // Try to replace SRem with URem, if both N and D are known non-negative.
 394   // Since we had already check N, we only need to check D now
 395   if (!IsSigned || !SE->isKnownNonNegative(D))
 396     return;
 397
 398   replaceSRemWithURem(Rem);
 399 }
 400
 401 bool SimplifyIndvar::eliminateOverflowIntrinsic(WithOverflowInst *WO) {
 402   const SCEV *LHS = SE->getSCEV(WO->getLHS());
 403   const SCEV *RHS = SE->getSCEV(WO->getRHS());
 404   if (!SE->willNotOverflow(WO->getBinaryOp(), WO->isSigned(), LHS, RHS))
 405     return false;
 406
 407   // Proved no overflow, nuke the overflow check and, if possible, the overflow
 408   // intrinsic as well.
 409
 410   BinaryOperator *NewResult = BinaryOperator::Create(
 411       WO->getBinaryOp(), WO->getLHS(), WO->getRHS(), "", WO);
 412
 413   if (WO->isSigned())
 414     NewResult->setHasNoSignedWrap(true);
 415   else
 416     NewResult->setHasNoUnsignedWrap(true);
 417
 418   SmallVector<ExtractValueInst *, 4> ToDelete;
 419
 420   for (auto *U : WO->users()) {
 421     if (auto *EVI = dyn_cast<ExtractValueInst>(U)) {
 422       if (EVI->getIndices()[0] == 1)
 423         EVI->replaceAllUsesWith(ConstantInt::getFalse(WO->getContext()));
 424       else {
 425         assert(EVI->getIndices()[0] == 0 && "Only two possibilities!");
 426         EVI->replaceAllUsesWith(NewResult);
 427       }
 428       ToDelete.push_back(EVI);
 429     }
 430   }
 431
 432   for (auto *EVI : ToDelete)
 433     EVI->eraseFromParent();
 434
 435   if (WO->use_empty())
 436     WO->eraseFromParent();
 437
 438   Changed = true;
 439   return true;
 440 }
 441
 442 bool SimplifyIndvar::eliminateSaturatingIntrinsic(SaturatingInst *SI) {
 443   const SCEV *LHS = SE->getSCEV(SI->getLHS());
 444   const SCEV *RHS = SE->getSCEV(SI->getRHS());
 445   if (!SE->willNotOverflow(SI->getBinaryOp(), SI->isSigned(), LHS, RHS))
 446     return false;
 447
 448   BinaryOperator *BO = BinaryOperator::Create(
 449       SI->getBinaryOp(), SI->getLHS(), SI->getRHS(), SI->getName(), SI);
 450   if (SI->isSigned())
 451     BO->setHasNoSignedWrap();
 452   else
 453     BO->setHasNoUnsignedWrap();
 454
 455   SI->replaceAllUsesWith(BO);
 456   DeadInsts.emplace_back(SI);
 457   Changed = true;
 458   return true;
 459 }
 460
 461 bool SimplifyIndvar::eliminateTrunc(TruncInst *TI) {
 462   // It is always legal to replace
 463   //   icmp <pred> i32 trunc(iv), n
 464   // with
 465   //   icmp <pred> i64 sext(trunc(iv)), sext(n), if pred is signed predicate.
 466   // Or with
 467   //   icmp <pred> i64 zext(trunc(iv)), zext(n), if pred is unsigned predicate.
 468   // Or with either of these if pred is an equality predicate.
 469   //
 470   // If we can prove that iv == sext(trunc(iv)) or iv == zext(trunc(iv)) for
 471   // every comparison which uses trunc, it means that we can replace each of
 472   // them with comparison of iv against sext/zext(n). We no longer need trunc
 473   // after that.
 474   //
 475   // TODO: Should we do this if we can widen *some* comparisons, but not all
 476   // of them? Sometimes it is enough to enable other optimizations, but the
 477   // trunc instruction will stay in the loop.
 478   Value *IV = TI->getOperand(0);
 479   Type *IVTy = IV->getType();
 480   const SCEV *IVSCEV = SE->getSCEV(IV);
 481   const SCEV *TISCEV = SE->getSCEV(TI);
 482
 483   // Check if iv == zext(trunc(iv)) and if iv == sext(trunc(iv)). If so, we can
 484   // get rid of trunc
 485   bool DoesSExtCollapse = false;
 486   bool DoesZExtCollapse = false;
 487   if (IVSCEV == SE->getSignExtendExpr(TISCEV, IVTy))
 488     DoesSExtCollapse = true;
 489   if (IVSCEV == SE->getZeroExtendExpr(TISCEV, IVTy))
 490     DoesZExtCollapse = true;
 491
 492   // If neither sext nor zext does collapse, it is not profitable to do any
 493   // transform. Bail.
 494   if (!DoesSExtCollapse && !DoesZExtCollapse)
 495     return false;
 496
 497   // Collect users of the trunc that look like comparisons against invariants.
 498   // Bail if we find something different.
 499   SmallVector<ICmpInst *, 4> ICmpUsers;
 500   for (auto *U : TI->users()) {
 501     // We don't care about users in unreachable blocks.
 502     if (isa<Instruction>(U) &&
 503         !DT->isReachableFromEntry(cast<Instruction>(U)->getParent()))
 504       continue;
 505     ICmpInst *ICI = dyn_cast<ICmpInst>(U);
 506     if (!ICI) return false;
 507     assert(L->contains(ICI->getParent()) && "LCSSA form broken?");
 508     if (!(ICI->getOperand(0) == TI && L->isLoopInvariant(ICI->getOperand(1))) &&
 509         !(ICI->getOperand(1) == TI && L->isLoopInvariant(ICI->getOperand(0))))
 510       return false;
 511     // If we cannot get rid of trunc, bail.
 512     if (ICI->isSigned() && !DoesSExtCollapse)
 513       return false;
 514     if (ICI->isUnsigned() && !DoesZExtCollapse)
 515       return false;
 516     // For equality, either signed or unsigned works.
 517     ICmpUsers.push_back(ICI);
 518   }
 519
 520   auto CanUseZExt = [&](ICmpInst *ICI) {
 521     // Unsigned comparison can be widened as unsigned.
 522     if (ICI->isUnsigned())
 523       return true;
 524     // Is it profitable to do zext?
 525     if (!DoesZExtCollapse)
 526       return false;
 527     // For equality, we can safely zext both parts.
 528     if (ICI->isEquality())
 529       return true;
 530     // Otherwise we can only use zext when comparing two non-negative or two
 531     // negative values. But in practice, we will never pass DoesZExtCollapse
 532     // check for a negative value, because zext(trunc(x)) is non-negative. So
 533     // it only make sense to check for non-negativity here.
 534     const SCEV *SCEVOP1 = SE->getSCEV(ICI->getOperand(0));
 535     const SCEV *SCEVOP2 = SE->getSCEV(ICI->getOperand(1));
 536     return SE->isKnownNonNegative(SCEVOP1) && SE->isKnownNonNegative(SCEVOP2);
 537   };
 538   // Replace all comparisons against trunc with comparisons against IV.
 539   for (auto *ICI : ICmpUsers) {
 540     bool IsSwapped = L->isLoopInvariant(ICI->getOperand(0));
 541     auto *Op1 = IsSwapped ? ICI->getOperand(0) : ICI->getOperand(1);
 542     Instruction *Ext = nullptr;
 543     // For signed/unsigned predicate, replace the old comparison with comparison
 544     // of immediate IV against sext/zext of the invariant argument. If we can
 545     // use either sext or zext (i.e. we are dealing with equality predicate),
 546     // then prefer zext as a more canonical form.
 547     // TODO: If we see a signed comparison which can be turned into unsigned,
 548     // we can do it here for canonicalization purposes.
 549     ICmpInst::Predicate Pred = ICI->getPredicate();
 550     if (IsSwapped) Pred = ICmpInst::getSwappedPredicate(Pred);
 551     if (CanUseZExt(ICI)) {
 552       assert(DoesZExtCollapse && "Unprofitable zext?");
 553       Ext = new ZExtInst(Op1, IVTy, "zext", ICI);
 554       Pred = ICmpInst::getUnsignedPredicate(Pred);
 555     } else {
 556       assert(DoesSExtCollapse && "Unprofitable sext?");
 557       Ext = new SExtInst(Op1, IVTy, "sext", ICI);
 558       assert(Pred == ICmpInst::getSignedPredicate(Pred) && "Must be signed!");
 559     }
 560     bool Changed;
 561     L->makeLoopInvariant(Ext, Changed);
 562     (void)Changed;
 563     ICmpInst *NewICI = new ICmpInst(ICI, Pred, IV, Ext);
 564     ICI->replaceAllUsesWith(NewICI);
 565     DeadInsts.emplace_back(ICI);
 566   }
 567
 568   // Trunc no longer needed.
 569   TI->replaceAllUsesWith(PoisonValue::get(TI->getType()));
 570   DeadInsts.emplace_back(TI);
 571   return true;
 572 }
 573
 574 /// Eliminate an operation that consumes a simple IV and has no observable
 575 /// side-effect given the range of IV values.  IVOperand is guaranteed SCEVable,
 576 /// but UseInst may not be.
 577 bool SimplifyIndvar::eliminateIVUser(Instruction *UseInst,
 578                                      Instruction *IVOperand) {
 579   if (ICmpInst *ICmp = dyn_cast<ICmpInst>(UseInst)) {
 580     eliminateIVComparison(ICmp, IVOperand);
 581     return true;
 582   }
 583   if (BinaryOperator *Bin = dyn_cast<BinaryOperator>(UseInst)) {
 584     bool IsSRem = Bin->getOpcode() == Instruction::SRem;
 585     if (IsSRem || Bin->getOpcode() == Instruction::URem) {
 586       simplifyIVRemainder(Bin, IVOperand, IsSRem);
 587       return true;
 588     }
 589
 590     if (Bin->getOpcode() == Instruction::SDiv)
 591       return eliminateSDiv(Bin);
 592   }
 593
 594   if (auto *WO = dyn_cast<WithOverflowInst>(UseInst))
 595     if (eliminateOverflowIntrinsic(WO))
 596       return true;
 597
 598   if (auto *SI = dyn_cast<SaturatingInst>(UseInst))
 599     if (eliminateSaturatingIntrinsic(SI))
 600       return true;
 601
 602   if (auto *TI = dyn_cast<TruncInst>(UseInst))
 603     if (eliminateTrunc(TI))
 604       return true;
 605
 606   if (eliminateIdentitySCEV(UseInst, IVOperand))
 607     return true;
 608
 609   return false;
 610 }
 611
 612 static Instruction *GetLoopInvariantInsertPosition(Loop *L, Instruction *Hint) {
 613   if (auto *BB = L->getLoopPreheader())
 614     return BB->getTerminator();
 615
 616   return Hint;
 617 }
 618
 619 /// Replace the UseInst with a loop invariant expression if it is safe.
 620 bool SimplifyIndvar::replaceIVUserWithLoopInvariant(Instruction *I) {
 621   if (!SE->isSCEVable(I->getType()))
 622     return false;
 623
 624   // Get the symbolic expression for this instruction.
 625   const SCEV *S = SE->getSCEV(I);
 626
 627   if (!SE->isLoopInvariant(S, L))
 628     return false;
 629
 630   // Do not generate something ridiculous even if S is loop invariant.
 631   if (Rewriter.isHighCostExpansion(S, L, SCEVCheapExpansionBudget, TTI, I))
 632     return false;
 633
 634   auto *IP = GetLoopInvariantInsertPosition(L, I);
 635
 636   if (!Rewriter.isSafeToExpandAt(S, IP)) {
 637     LLVM_DEBUG(dbgs() << "INDVARS: Can not replace IV user: " << *I
 638                       << " with non-speculable loop invariant: " << *S << '\n');
 639     return false;
 640   }
 641
 642   auto *Invariant = Rewriter.expandCodeFor(S, I->getType(), IP);
 643
 644   I->replaceAllUsesWith(Invariant);
 645   LLVM_DEBUG(dbgs() << "INDVARS: Replace IV user: " << *I
 646                     << " with loop invariant: " << *S << '\n');
 647   ++NumFoldedUser;
 648   Changed = true;
 649   DeadInsts.emplace_back(I);
 650   return true;
 651 }
 652
 653 /// Eliminate redundant type cast between integer and float.
 654 bool SimplifyIndvar::replaceFloatIVWithIntegerIV(Instruction *UseInst) {
 655   if (UseInst->getOpcode() != CastInst::SIToFP &&
 656       UseInst->getOpcode() != CastInst::UIToFP)
 657     return false;
 658
 659   Instruction *IVOperand = cast<Instruction>(UseInst->getOperand(0));
 660   // Get the symbolic expression for this instruction.
 661   const SCEV *IV = SE->getSCEV(IVOperand);
 662   unsigned MaskBits;
 663   if (UseInst->getOpcode() == CastInst::SIToFP)
 664     MaskBits = SE->getSignedRange(IV).getMinSignedBits();
 665   else
 666     MaskBits = SE->getUnsignedRange(IV).getActiveBits();
 667   unsigned DestNumSigBits = UseInst->getType()->getFPMantissaWidth();
 668   if (MaskBits <= DestNumSigBits) {
 669     for (User *U : UseInst->users()) {
 670       // Match for fptosi/fptoui of sitofp and with same type.
 671       auto *CI = dyn_cast<CastInst>(U);
 672       if (!CI)
 673         continue;
 674
 675       CastInst::CastOps Opcode = CI->getOpcode();
 676       if (Opcode != CastInst::FPToSI && Opcode != CastInst::FPToUI)
 677         continue;
 678
 679       Value *Conv = nullptr;
 680       if (IVOperand->getType() != CI->getType()) {
 681         IRBuilder<> Builder(CI);
 682         StringRef Name = IVOperand->getName();
 683         // To match InstCombine logic, we only need sext if both fptosi and
 684         // sitofp are used. If one of them is unsigned, then we can use zext.
 685         if (SE->getTypeSizeInBits(IVOperand->getType()) >
 686             SE->getTypeSizeInBits(CI->getType())) {
 687           Conv = Builder.CreateTrunc(IVOperand, CI->getType(), Name + ".trunc");
 688         } else if (Opcode == CastInst::FPToUI ||
 689                    UseInst->getOpcode() == CastInst::UIToFP) {
 690           Conv = Builder.CreateZExt(IVOperand, CI->getType(), Name + ".zext");
 691         } else {
 692           Conv = Builder.CreateSExt(IVOperand, CI->getType(), Name + ".sext");
 693         }
 694       } else
 695         Conv = IVOperand;
 696
 697       CI->replaceAllUsesWith(Conv);
 698       DeadInsts.push_back(CI);
 699       LLVM_DEBUG(dbgs() << "INDVARS: Replace IV user: " << *CI
 700                         << " with: " << *Conv << '\n');
 701
 702       ++NumFoldedUser;
 703       Changed = true;
 704     }
 705   }
 706
 707   return Changed;
 708 }
 709
 710 /// Eliminate any operation that SCEV can prove is an identity function.
 711 bool SimplifyIndvar::eliminateIdentitySCEV(Instruction *UseInst,
 712                                            Instruction *IVOperand) {
 713   if (!SE->isSCEVable(UseInst->getType()) ||
 714       (UseInst->getType() != IVOperand->getType()) ||
 715       (SE->getSCEV(UseInst) != SE->getSCEV(IVOperand)))
 716     return false;
 717
 718   // getSCEV(X) == getSCEV(Y) does not guarantee that X and Y are related in the
 719   // dominator tree, even if X is an operand to Y.  For instance, in
 720   //
 721   //     %iv = phi i32 {0,+,1}
 722   //     br %cond, label %left, label %merge
 723   //
 724   //   left:
 725   //     %X = add i32 %iv, 0
 726   //     br label %merge
 727   //
 728   //   merge:
 729   //     %M = phi (%X, %iv)
 730   //
 731   // getSCEV(%M) == getSCEV(%X) == {0,+,1}, but %X does not dominate %M, and
 732   // %M.replaceAllUsesWith(%X) would be incorrect.
 733
 734   if (isa<PHINode>(UseInst))
 735     // If UseInst is not a PHI node then we know that IVOperand dominates
 736     // UseInst directly from the legality of SSA.
 737     if (!DT || !DT->dominates(IVOperand, UseInst))
 738       return false;
 739
 740   if (!LI->replacementPreservesLCSSAForm(UseInst, IVOperand))
 741     return false;
 742
 743   LLVM_DEBUG(dbgs() << "INDVARS: Eliminated identity: " << *UseInst << '\n');
 744
 745   SE->forgetValue(UseInst);
 746   UseInst->replaceAllUsesWith(IVOperand);
 747   ++NumElimIdentity;
 748   Changed = true;
 749   DeadInsts.emplace_back(UseInst);
 750   return true;
 751 }
 752
 753 bool SimplifyIndvar::strengthenBinaryOp(BinaryOperator *BO,
 754                                         Instruction *IVOperand) {
 755   return (isa<OverflowingBinaryOperator>(BO) &&
 756           strengthenOverflowingOperation(BO, IVOperand)) ||
 757          (isa<ShlOperator>(BO) && strengthenRightShift(BO, IVOperand));
 758 }
 759
 760 /// Annotate BO with nsw / nuw if it provably does not signed-overflow /
 761 /// unsigned-overflow.  Returns true if anything changed, false otherwise.
 762 bool SimplifyIndvar::strengthenOverflowingOperation(BinaryOperator *BO,
 763                                                     Instruction *IVOperand) {
 764   auto Flags = SE->getStrengthenedNoWrapFlagsFromBinOp(
 765       cast<OverflowingBinaryOperator>(BO));
 766
 767   if (!Flags)
 768     return false;
 769
 770   BO->setHasNoUnsignedWrap(ScalarEvolution::maskFlags(*Flags, SCEV::FlagNUW) ==
 771                            SCEV::FlagNUW);
 772   BO->setHasNoSignedWrap(ScalarEvolution::maskFlags(*Flags, SCEV::FlagNSW) ==
 773                          SCEV::FlagNSW);
 774
 775   // The getStrengthenedNoWrapFlagsFromBinOp() check inferred additional nowrap
 776   // flags on addrecs while performing zero/sign extensions. We could call
 777   // forgetValue() here to make sure those flags also propagate to any other
 778   // SCEV expressions based on the addrec. However, this can have pathological
 779   // compile-time impact, see https://bugs.llvm.org/show_bug.cgi?id=50384.
 780   return true;
 781 }
 782
 783 /// Annotate the Shr in (X << IVOperand) >> C as exact using the
 784 /// information from the IV's range. Returns true if anything changed, false
 785 /// otherwise.
 786 bool SimplifyIndvar::strengthenRightShift(BinaryOperator *BO,
 787                                           Instruction *IVOperand) {
 788   using namespace llvm::PatternMatch;
 789
 790   if (BO->getOpcode() == Instruction::Shl) {
 791     bool Changed = false;
 792     ConstantRange IVRange = SE->getUnsignedRange(SE->getSCEV(IVOperand));
 793     for (auto *U : BO->users()) {
 794       const APInt *C;
 795       if (match(U,
 796                 m_AShr(m_Shl(m_Value(), m_Specific(IVOperand)), m_APInt(C))) ||
 797           match(U,
 798                 m_LShr(m_Shl(m_Value(), m_Specific(IVOperand)), m_APInt(C)))) {
 799         BinaryOperator *Shr = cast<BinaryOperator>(U);
 800         if (!Shr->isExact() && IVRange.getUnsignedMin().uge(*C)) {
 801           Shr->setIsExact(true);
 802           Changed = true;
 803         }
 804       }
 805     }
 806     return Changed;
 807   }
 808
 809   return false;
 810 }
 811
 812 /// Add all uses of Def to the current IV's worklist.
 813 static void pushIVUsers(
 814   Instruction *Def, Loop *L,
 815   SmallPtrSet<Instruction*,16> &Simplified,
 816   SmallVectorImpl< std::pair<Instruction*,Instruction*> > &SimpleIVUsers) {
 817
 818   for (User *U : Def->users()) {
 819     Instruction *UI = cast<Instruction>(U);
 820
 821     // Avoid infinite or exponential worklist processing.
 822     // Also ensure unique worklist users.
 823     // If Def is a LoopPhi, it may not be in the Simplified set, so check for
 824     // self edges first.
 825     if (UI == Def)
 826       continue;
 827
 828     // Only change the current Loop, do not change the other parts (e.g. other
 829     // Loops).
 830     if (!L->contains(UI))
 831       continue;
 832
 833     // Do not push the same instruction more than once.
 834     if (!Simplified.insert(UI).second)
 835       continue;
 836
 837     SimpleIVUsers.push_back(std::make_pair(UI, Def));
 838   }
 839 }
 840
 841 /// Return true if this instruction generates a simple SCEV
 842 /// expression in terms of that IV.
 843 ///
 844 /// This is similar to IVUsers' isInteresting() but processes each instruction
 845 /// non-recursively when the operand is already known to be a simpleIVUser.
 846 ///
 847 static bool isSimpleIVUser(Instruction *I, const Loop *L, ScalarEvolution *SE) {
 848   if (!SE->isSCEVable(I->getType()))
 849     return false;
 850
 851   // Get the symbolic expression for this instruction.
 852   const SCEV *S = SE->getSCEV(I);
 853
 854   // Only consider affine recurrences.
 855   const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(S);
 856   if (AR && AR->getLoop() == L)
 857     return true;
 858
 859   return false;
 860 }
 861
 862 /// Iteratively perform simplification on a worklist of users
 863 /// of the specified induction variable. Each successive simplification may push
 864 /// more users which may themselves be candidates for simplification.
 865 ///
 866 /// This algorithm does not require IVUsers analysis. Instead, it simplifies
 867 /// instructions in-place during analysis. Rather than rewriting induction
 868 /// variables bottom-up from their users, it transforms a chain of IVUsers
 869 /// top-down, updating the IR only when it encounters a clear optimization
 870 /// opportunity.
 871 ///
 872 /// Once DisableIVRewrite is default, LSR will be the only client of IVUsers.
 873 ///
 874 void SimplifyIndvar::simplifyUsers(PHINode *CurrIV, IVVisitor *V) {
 875   if (!SE->isSCEVable(CurrIV->getType()))
 876     return;
 877
 878   // Instructions processed by SimplifyIndvar for CurrIV.
 879   SmallPtrSet<Instruction*,16> Simplified;
 880
 881   // Use-def pairs if IV users waiting to be processed for CurrIV.
 882   SmallVector<std::pair<Instruction*, Instruction*>, 8> SimpleIVUsers;
 883
 884   // Push users of the current LoopPhi. In rare cases, pushIVUsers may be
 885   // called multiple times for the same LoopPhi. This is the proper thing to
 886   // do for loop header phis that use each other.
 887   pushIVUsers(CurrIV, L, Simplified, SimpleIVUsers);
 888
 889   while (!SimpleIVUsers.empty()) {
 890     std::pair<Instruction*, Instruction*> UseOper =
 891       SimpleIVUsers.pop_back_val();
 892     Instruction *UseInst = UseOper.first;
 893
 894     // If a user of the IndVar is trivially dead, we prefer just to mark it dead
 895     // rather than try to do some complex analysis or transformation (such as
 896     // widening) basing on it.
 897     // TODO: Propagate TLI and pass it here to handle more cases.
 898     if (isInstructionTriviallyDead(UseInst, /* TLI */ nullptr)) {
 899       DeadInsts.emplace_back(UseInst);
 900       continue;
 901     }
 902
 903     // Bypass back edges to avoid extra work.
 904     if (UseInst == CurrIV) continue;
 905
 906     // Try to replace UseInst with a loop invariant before any other
 907     // simplifications.
 908     if (replaceIVUserWithLoopInvariant(UseInst))
 909       continue;
 910
 911     // Go further for the bitcast ''prtoint ptr to i64'
 912     if (isa<PtrToIntInst>(UseInst))
 913       for (Use &U : UseInst->uses()) {
 914         Instruction *User = cast<Instruction>(U.getUser());
 915         if (replaceIVUserWithLoopInvariant(User))
 916           break; // done replacing
 917       }
 918
 919     Instruction *IVOperand = UseOper.second;
 920     for (unsigned N = 0; IVOperand; ++N) {
 921       assert(N <= Simplified.size() && "runaway iteration");
 922       (void) N;
 923
 924       Value *NewOper = foldIVUser(UseInst, IVOperand);
 925       if (!NewOper)
 926         break; // done folding
 927       IVOperand = dyn_cast<Instruction>(NewOper);
 928     }
 929     if (!IVOperand)
 930       continue;
 931
 932     if (eliminateIVUser(UseInst, IVOperand)) {
 933       pushIVUsers(IVOperand, L, Simplified, SimpleIVUsers);
 934       continue;
 935     }
 936
 937     if (BinaryOperator *BO = dyn_cast<BinaryOperator>(UseInst)) {
 938       if (strengthenBinaryOp(BO, IVOperand)) {
 939         // re-queue uses of the now modified binary operator and fall
 940         // through to the checks that remain.
 941         pushIVUsers(IVOperand, L, Simplified, SimpleIVUsers);
 942       }
 943     }
 944
 945     // Try to use integer induction for FPToSI of float induction directly.
 946     if (replaceFloatIVWithIntegerIV(UseInst)) {
 947       // Re-queue the potentially new direct uses of IVOperand.
 948       pushIVUsers(IVOperand, L, Simplified, SimpleIVUsers);
 949       continue;
 950     }
 951
 952     CastInst *Cast = dyn_cast<CastInst>(UseInst);
 953     if (V && Cast) {
 954       V->visitCast(Cast);
 955       continue;
 956     }
 957     if (isSimpleIVUser(UseInst, L, SE)) {
 958       pushIVUsers(UseInst, L, Simplified, SimpleIVUsers);
 959     }
 960   }
 961 }
 962
 963 namespace llvm {
 964
 965 void IVVisitor::anchor() { }
 966
 967 /// Simplify instructions that use this induction variable
 968 /// by using ScalarEvolution to analyze the IV's recurrence.
 969 bool simplifyUsersOfIV(PHINode *CurrIV, ScalarEvolution *SE, DominatorTree *DT,
 970                        LoopInfo *LI, const TargetTransformInfo *TTI,
 971                        SmallVectorImpl<WeakTrackingVH> &Dead,
 972                        SCEVExpander &Rewriter, IVVisitor *V) {
 973   SimplifyIndvar SIV(LI->getLoopFor(CurrIV->getParent()), SE, DT, LI, TTI,
 974                      Rewriter, Dead);
 975   SIV.simplifyUsers(CurrIV, V);
 976   return SIV.hasChanged();
 977 }
 978
 979 /// Simplify users of induction variables within this
 980 /// loop. This does not actually change or add IVs.
 981 bool simplifyLoopIVs(Loop *L, ScalarEvolution *SE, DominatorTree *DT,
 982                      LoopInfo *LI, const TargetTransformInfo *TTI,
 983                      SmallVectorImpl<WeakTrackingVH> &Dead) {
 984   SCEVExpander Rewriter(*SE, SE->getDataLayout(), "indvars");
 985 #ifndef NDEBUG
 986   Rewriter.setDebugType(DEBUG_TYPE);
 987 #endif
 988   bool Changed = false;
 989   for (BasicBlock::iterator I = L->getHeader()->begin(); isa<PHINode>(I); ++I) {
 990     Changed |=
 991         simplifyUsersOfIV(cast<PHINode>(I), SE, DT, LI, TTI, Dead, Rewriter);
 992   }
 993   return Changed;
 994 }
 995
 996 } // namespace llvm
 997
 998 namespace {
 999 //===----------------------------------------------------------------------===//
1000 // Widen Induction Variables - Extend the width of an IV to cover its
1001 // widest uses.
1002 //===----------------------------------------------------------------------===//
1003
1004 class WidenIV {
1005   // Parameters
1006   PHINode *OrigPhi;
1007   Type *WideType;
1008
1009   // Context
1010   LoopInfo        *LI;
1011   Loop            *L;
1012   ScalarEvolution *SE;
1013   DominatorTree   *DT;
1014
1015   // Does the module have any calls to the llvm.experimental.guard intrinsic
1016   // at all? If not we can avoid scanning instructions looking for guards.
1017   bool HasGuards;
1018
1019   bool UsePostIncrementRanges;
1020
1021   // Statistics
1022   unsigned NumElimExt = 0;
1023   unsigned NumWidened = 0;
1024
1025   // Result
1026   PHINode *WidePhi = nullptr;
1027   Instruction *WideInc = nullptr;
1028   const SCEV *WideIncExpr = nullptr;
1029   SmallVectorImpl<WeakTrackingVH> &DeadInsts;
1030
1031   SmallPtrSet<Instruction *,16> Widened;
1032
1033   enum class ExtendKind { Zero, Sign, Unknown };
1034
1035   // A map tracking the kind of extension used to widen each narrow IV
1036   // and narrow IV user.
1037   // Key: pointer to a narrow IV or IV user.
1038   // Value: the kind of extension used to widen this Instruction.
1039   DenseMap<AssertingVH<Instruction>, ExtendKind> ExtendKindMap;
1040
1041   using DefUserPair = std::pair<AssertingVH<Value>, AssertingVH<Instruction>>;
1042
1043   // A map with control-dependent ranges for post increment IV uses. The key is
1044   // a pair of IV def and a use of this def denoting the context. The value is
1045   // a ConstantRange representing possible values of the def at the given
1046   // context.
1047   DenseMap<DefUserPair, ConstantRange> PostIncRangeInfos;
1048
1049   std::optional<ConstantRange> getPostIncRangeInfo(Value *Def,
1050                                                    Instruction *UseI) {
1051     DefUserPair Key(Def, UseI);
1052     auto It = PostIncRangeInfos.find(Key);
1053     return It == PostIncRangeInfos.end()
1054                ? std::optional<ConstantRange>(std::nullopt)
1055                : std::optional<ConstantRange>(It->second);
1056   }
1057
1058   void calculatePostIncRanges(PHINode *OrigPhi);
1059   void calculatePostIncRange(Instruction *NarrowDef, Instruction *NarrowUser);
1060
1061   void updatePostIncRangeInfo(Value *Def, Instruction *UseI, ConstantRange R) {
1062     DefUserPair Key(Def, UseI);
1063     auto It = PostIncRangeInfos.find(Key);
1064     if (It == PostIncRangeInfos.end())
1065       PostIncRangeInfos.insert({Key, R});
1066     else
1067       It->second = R.intersectWith(It->second);
1068   }
1069
1070 public:
1071   /// Record a link in the Narrow IV def-use chain along with the WideIV that
1072   /// computes the same value as the Narrow IV def.  This avoids caching Use*
1073   /// pointers.
1074   struct NarrowIVDefUse {
1075     Instruction *NarrowDef = nullptr;
1076     Instruction *NarrowUse = nullptr;
1077     Instruction *WideDef = nullptr;
1078
1079     // True if the narrow def is never negative.  Tracking this information lets
1080     // us use a sign extension instead of a zero extension or vice versa, when
1081     // profitable and legal.
1082     bool NeverNegative = false;
1083
1084     NarrowIVDefUse(Instruction *ND, Instruction *NU, Instruction *WD,
1085                    bool NeverNegative)
1086         : NarrowDef(ND), NarrowUse(NU), WideDef(WD),
1087           NeverNegative(NeverNegative) {}
1088   };
1089
1090   WidenIV(const WideIVInfo &WI, LoopInfo *LInfo, ScalarEvolution *SEv,
1091           DominatorTree *DTree, SmallVectorImpl<WeakTrackingVH> &DI,
1092           bool HasGuards, bool UsePostIncrementRanges = true);
1093
1094   PHINode *createWideIV(SCEVExpander &Rewriter);
1095
1096   unsigned getNumElimExt() { return NumElimExt; };
1097   unsigned getNumWidened() { return NumWidened; };
1098
1099 protected:
1100   Value *createExtendInst(Value *NarrowOper, Type *WideType, bool IsSigned,
1101                           Instruction *Use);
1102
1103   Instruction *cloneIVUser(NarrowIVDefUse DU, const SCEVAddRecExpr *WideAR);
1104   Instruction *cloneArithmeticIVUser(NarrowIVDefUse DU,
1105                                      const SCEVAddRecExpr *WideAR);
1106   Instruction *cloneBitwiseIVUser(NarrowIVDefUse DU);
1107
1108   ExtendKind getExtendKind(Instruction *I);
1109
1110   using WidenedRecTy = std::pair<const SCEVAddRecExpr *, ExtendKind>;
1111
1112   WidenedRecTy getWideRecurrence(NarrowIVDefUse DU);
1113
1114   WidenedRecTy getExtendedOperandRecurrence(NarrowIVDefUse DU);
1115
1116   const SCEV *getSCEVByOpCode(const SCEV *LHS, const SCEV *RHS,
1117                               unsigned OpCode) const;
1118
1119   Instruction *widenIVUse(NarrowIVDefUse DU, SCEVExpander &Rewriter);
1120
1121   bool widenLoopCompare(NarrowIVDefUse DU);
1122   bool widenWithVariantUse(NarrowIVDefUse DU);
1123
1124   void pushNarrowIVUsers(Instruction *NarrowDef, Instruction *WideDef);
1125
1126 private:
1127   SmallVector<NarrowIVDefUse, 8> NarrowIVUsers;
1128 };
1129 } // namespace
1130
1131 /// Determine the insertion point for this user. By default, insert immediately
1132 /// before the user. SCEVExpander or LICM will hoist loop invariants out of the
1133 /// loop. For PHI nodes, there may be multiple uses, so compute the nearest
1134 /// common dominator for the incoming blocks. A nullptr can be returned if no
1135 /// viable location is found: it may happen if User is a PHI and Def only comes
1136 /// to this PHI from unreachable blocks.
1137 static Instruction *getInsertPointForUses(Instruction *User, Value *Def,
1138                                           DominatorTree *DT, LoopInfo *LI) {
1139   PHINode *PHI = dyn_cast<PHINode>(User);
1140   if (!PHI)
1141     return User;
1142
1143   Instruction *InsertPt = nullptr;
1144   for (unsigned i = 0, e = PHI->getNumIncomingValues(); i != e; ++i) {
1145     if (PHI->getIncomingValue(i) != Def)
1146       continue;
1147
1148     BasicBlock *InsertBB = PHI->getIncomingBlock(i);
1149
1150     if (!DT->isReachableFromEntry(InsertBB))
1151       continue;
1152
1153     if (!InsertPt) {
1154       InsertPt = InsertBB->getTerminator();
1155       continue;
1156     }
1157     InsertBB = DT->findNearestCommonDominator(InsertPt->getParent(), InsertBB);
1158     InsertPt = InsertBB->getTerminator();
1159   }
1160
1161   // If we have skipped all inputs, it means that Def only comes to Phi from
1162   // unreachable blocks.
1163   if (!InsertPt)
1164     return nullptr;
1165
1166   auto *DefI = dyn_cast<Instruction>(Def);
1167   if (!DefI)
1168     return InsertPt;
1169
1170   assert(DT->dominates(DefI, InsertPt) && "def does not dominate all uses");
1171
1172   auto *L = LI->getLoopFor(DefI->getParent());
1173   assert(!L || L->contains(LI->getLoopFor(InsertPt->getParent())));
1174
1175   for (auto *DTN = (*DT)[InsertPt->getParent()]; DTN; DTN = DTN->getIDom())
1176     if (LI->getLoopFor(DTN->getBlock()) == L)
1177       return DTN->getBlock()->getTerminator();
1178
1179   llvm_unreachable("DefI dominates InsertPt!");
1180 }
1181
1182 WidenIV::WidenIV(const WideIVInfo &WI, LoopInfo *LInfo, ScalarEvolution *SEv,
1183           DominatorTree *DTree, SmallVectorImpl<WeakTrackingVH> &DI,
1184           bool HasGuards, bool UsePostIncrementRanges)
1185       : OrigPhi(WI.NarrowIV), WideType(WI.WidestNativeType), LI(LInfo),
1186         L(LI->getLoopFor(OrigPhi->getParent())), SE(SEv), DT(DTree),
1187         HasGuards(HasGuards), UsePostIncrementRanges(UsePostIncrementRanges),
1188         DeadInsts(DI) {
1189     assert(L->getHeader() == OrigPhi->getParent() && "Phi must be an IV");
1190     ExtendKindMap[OrigPhi] = WI.IsSigned ? ExtendKind::Sign : ExtendKind::Zero;
1191 }
1192
1193 Value *WidenIV::createExtendInst(Value *NarrowOper, Type *WideType,
1194                                  bool IsSigned, Instruction *Use) {
1195   // Set the debug location and conservative insertion point.
1196   IRBuilder<> Builder(Use);
1197   // Hoist the insertion point into loop preheaders as far as possible.
1198   for (const Loop *L = LI->getLoopFor(Use->getParent());
1199        L && L->getLoopPreheader() && L->isLoopInvariant(NarrowOper);
1200        L = L->getParentLoop())
1201     Builder.SetInsertPoint(L->getLoopPreheader()->getTerminator());
1202
1203   return IsSigned ? Builder.CreateSExt(NarrowOper, WideType) :
1204                     Builder.CreateZExt(NarrowOper, WideType);
1205 }
1206
1207 /// Instantiate a wide operation to replace a narrow operation. This only needs
1208 /// to handle operations that can evaluation to SCEVAddRec. It can safely return
1209 /// 0 for any operation we decide not to clone.
1210 Instruction *WidenIV::cloneIVUser(WidenIV::NarrowIVDefUse DU,
1211                                   const SCEVAddRecExpr *WideAR) {
1212   unsigned Opcode = DU.NarrowUse->getOpcode();
1213   switch (Opcode) {
1214   default:
1215     return nullptr;
1216   case Instruction::Add:
1217   case Instruction::Mul:
1218   case Instruction::UDiv:
1219   case Instruction::Sub:
1220     return cloneArithmeticIVUser(DU, WideAR);
1221
1222   case Instruction::And:
1223   case Instruction::Or:
1224   case Instruction::Xor:
1225   case Instruction::Shl:
1226   case Instruction::LShr:
1227   case Instruction::AShr:
1228     return cloneBitwiseIVUser(DU);
1229   }
1230 }
1231
1232 Instruction *WidenIV::cloneBitwiseIVUser(WidenIV::NarrowIVDefUse DU) {
1233   Instruction *NarrowUse = DU.NarrowUse;
1234   Instruction *NarrowDef = DU.NarrowDef;
1235   Instruction *WideDef = DU.WideDef;
1236
1237   LLVM_DEBUG(dbgs() << "Cloning bitwise IVUser: " << *NarrowUse << "\n");
1238
1239   // Replace NarrowDef operands with WideDef. Otherwise, we don't know anything
1240   // about the narrow operand yet so must insert a [sz]ext. It is probably loop
1241   // invariant and will be folded or hoisted. If it actually comes from a
1242   // widened IV, it should be removed during a future call to widenIVUse.
1243   bool IsSigned = getExtendKind(NarrowDef) == ExtendKind::Sign;
1244   Value *LHS = (NarrowUse->getOperand(0) == NarrowDef)
1245                    ? WideDef
1246                    : createExtendInst(NarrowUse->getOperand(0), WideType,
1247                                       IsSigned, NarrowUse);
1248   Value *RHS = (NarrowUse->getOperand(1) == NarrowDef)
1249                    ? WideDef
1250                    : createExtendInst(NarrowUse->getOperand(1), WideType,
1251                                       IsSigned, NarrowUse);
1252
1253   auto *NarrowBO = cast<BinaryOperator>(NarrowUse);
1254   auto *WideBO = BinaryOperator::Create(NarrowBO->getOpcode(), LHS, RHS,
1255                                         NarrowBO->getName());
1256   IRBuilder<> Builder(NarrowUse);
1257   Builder.Insert(WideBO);
1258   WideBO->copyIRFlags(NarrowBO);
1259   return WideBO;
1260 }
1261
1262 Instruction *WidenIV::cloneArithmeticIVUser(WidenIV::NarrowIVDefUse DU,
1263                                             const SCEVAddRecExpr *WideAR) {
1264   Instruction *NarrowUse = DU.NarrowUse;
1265   Instruction *NarrowDef = DU.NarrowDef;
1266   Instruction *WideDef = DU.WideDef;
1267
1268   LLVM_DEBUG(dbgs() << "Cloning arithmetic IVUser: " << *NarrowUse << "\n");
1269
1270   unsigned IVOpIdx = (NarrowUse->getOperand(0) == NarrowDef) ? 0 : 1;
1271
1272   // We're trying to find X such that
1273   //
1274   //  Widen(NarrowDef `op` NonIVNarrowDef) == WideAR == WideDef `op.wide` X
1275   //
1276   // We guess two solutions to X, sext(NonIVNarrowDef) and zext(NonIVNarrowDef),
1277   // and check using SCEV if any of them are correct.
1278
1279   // Returns true if extending NonIVNarrowDef according to `SignExt` is a
1280   // correct solution to X.
1281   auto GuessNonIVOperand = [&](bool SignExt) {
1282     const SCEV *WideLHS;
1283     const SCEV *WideRHS;
1284
1285     auto GetExtend = [this, SignExt](const SCEV *S, Type *Ty) {
1286       if (SignExt)
1287         return SE->getSignExtendExpr(S, Ty);
1288       return SE->getZeroExtendExpr(S, Ty);
1289     };
1290
1291     if (IVOpIdx == 0) {
1292       WideLHS = SE->getSCEV(WideDef);
1293       const SCEV *NarrowRHS = SE->getSCEV(NarrowUse->getOperand(1));
1294       WideRHS = GetExtend(NarrowRHS, WideType);
1295     } else {
1296       const SCEV *NarrowLHS = SE->getSCEV(NarrowUse->getOperand(0));
1297       WideLHS = GetExtend(NarrowLHS, WideType);
1298       WideRHS = SE->getSCEV(WideDef);
1299     }
1300
1301     // WideUse is "WideDef `op.wide` X" as described in the comment.
1302     const SCEV *WideUse =
1303       getSCEVByOpCode(WideLHS, WideRHS, NarrowUse->getOpcode());
1304
1305     return WideUse == WideAR;
1306   };
1307
1308   bool SignExtend = getExtendKind(NarrowDef) == ExtendKind::Sign;
1309   if (!GuessNonIVOperand(SignExtend)) {
1310     SignExtend = !SignExtend;
1311     if (!GuessNonIVOperand(SignExtend))
1312       return nullptr;
1313   }
1314
1315   Value *LHS = (NarrowUse->getOperand(0) == NarrowDef)
1316                    ? WideDef
1317                    : createExtendInst(NarrowUse->getOperand(0), WideType,
1318                                       SignExtend, NarrowUse);
1319   Value *RHS = (NarrowUse->getOperand(1) == NarrowDef)
1320                    ? WideDef
1321                    : createExtendInst(NarrowUse->getOperand(1), WideType,
1322                                       SignExtend, NarrowUse);
1323
1324   auto *NarrowBO = cast<BinaryOperator>(NarrowUse);
1325   auto *WideBO = BinaryOperator::Create(NarrowBO->getOpcode(), LHS, RHS,
1326                                         NarrowBO->getName());
1327
1328   IRBuilder<> Builder(NarrowUse);
1329   Builder.Insert(WideBO);
1330   WideBO->copyIRFlags(NarrowBO);
1331   return WideBO;
1332 }
1333
1334 WidenIV::ExtendKind WidenIV::getExtendKind(Instruction *I) {
1335   auto It = ExtendKindMap.find(I);
1336   assert(It != ExtendKindMap.end() && "Instruction not yet extended!");
1337   return It->second;
1338 }
1339
1340 const SCEV *WidenIV::getSCEVByOpCode(const SCEV *LHS, const SCEV *RHS,
1341                                      unsigned OpCode) const {
1342   switch (OpCode) {
1343   case Instruction::Add:
1344     return SE->getAddExpr(LHS, RHS);
1345   case Instruction::Sub:
1346     return SE->getMinusSCEV(LHS, RHS);
1347   case Instruction::Mul:
1348     return SE->getMulExpr(LHS, RHS);
1349   case Instruction::UDiv:
1350     return SE->getUDivExpr(LHS, RHS);
1351   default:
1352     llvm_unreachable("Unsupported opcode.");
1353   };
1354 }
1355
1356 /// No-wrap operations can transfer sign extension of their result to their
1357 /// operands. Generate the SCEV value for the widened operation without
1358 /// actually modifying the IR yet. If the expression after extending the
1359 /// operands is an AddRec for this loop, return the AddRec and the kind of
1360 /// extension used.
1361 WidenIV::WidenedRecTy
1362 WidenIV::getExtendedOperandRecurrence(WidenIV::NarrowIVDefUse DU) {
1363   // Handle the common case of add<nsw/nuw>
1364   const unsigned OpCode = DU.NarrowUse->getOpcode();
1365   // Only Add/Sub/Mul instructions supported yet.
1366   if (OpCode != Instruction::Add && OpCode != Instruction::Sub &&
1367       OpCode != Instruction::Mul)
1368     return {nullptr, ExtendKind::Unknown};
1369
1370   // One operand (NarrowDef) has already been extended to WideDef. Now determine
1371   // if extending the other will lead to a recurrence.
1372   const unsigned ExtendOperIdx =
1373       DU.NarrowUse->getOperand(0) == DU.NarrowDef ? 1 : 0;
1374   assert(DU.NarrowUse->getOperand(1-ExtendOperIdx) == DU.NarrowDef && "bad DU");
1375
1376   const SCEV *ExtendOperExpr = nullptr;
1377   const OverflowingBinaryOperator *OBO =
1378     cast<OverflowingBinaryOperator>(DU.NarrowUse);
1379   ExtendKind ExtKind = getExtendKind(DU.NarrowDef);
1380   if (ExtKind == ExtendKind::Sign && OBO->hasNoSignedWrap())
1381     ExtendOperExpr = SE->getSignExtendExpr(
1382       SE->getSCEV(DU.NarrowUse->getOperand(ExtendOperIdx)), WideType);
1383   else if (ExtKind == ExtendKind::Zero && OBO->hasNoUnsignedWrap())
1384     ExtendOperExpr = SE->getZeroExtendExpr(
1385       SE->getSCEV(DU.NarrowUse->getOperand(ExtendOperIdx)), WideType);
1386   else
1387     return {nullptr, ExtendKind::Unknown};
1388
1389   // When creating this SCEV expr, don't apply the current operations NSW or NUW
1390   // flags. This instruction may be guarded by control flow that the no-wrap
1391   // behavior depends on. Non-control-equivalent instructions can be mapped to
1392   // the same SCEV expression, and it would be incorrect to transfer NSW/NUW
1393   // semantics to those operations.
1394   const SCEV *lhs = SE->getSCEV(DU.WideDef);
1395   const SCEV *rhs = ExtendOperExpr;
1396
1397   // Let's swap operands to the initial order for the case of non-commutative
1398   // operations, like SUB. See PR21014.
1399   if (ExtendOperIdx == 0)
1400     std::swap(lhs, rhs);
1401   const SCEVAddRecExpr *AddRec =
1402       dyn_cast<SCEVAddRecExpr>(getSCEVByOpCode(lhs, rhs, OpCode));
1403
1404   if (!AddRec || AddRec->getLoop() != L)
1405     return {nullptr, ExtendKind::Unknown};
1406
1407   return {AddRec, ExtKind};
1408 }
1409
1410 /// Is this instruction potentially interesting for further simplification after
1411 /// widening it's type? In other words, can the extend be safely hoisted out of
1412 /// the loop with SCEV reducing the value to a recurrence on the same loop. If
1413 /// so, return the extended recurrence and the kind of extension used. Otherwise
1414 /// return {nullptr, ExtendKind::Unknown}.
1415 WidenIV::WidenedRecTy WidenIV::getWideRecurrence(WidenIV::NarrowIVDefUse DU) {
1416   if (!DU.NarrowUse->getType()->isIntegerTy())
1417     return {nullptr, ExtendKind::Unknown};
1418
1419   const SCEV *NarrowExpr = SE->getSCEV(DU.NarrowUse);
1420   if (SE->getTypeSizeInBits(NarrowExpr->getType()) >=
1421       SE->getTypeSizeInBits(WideType)) {
1422     // NarrowUse implicitly widens its operand. e.g. a gep with a narrow
1423     // index. So don't follow this use.
1424     return {nullptr, ExtendKind::Unknown};
1425   }
1426
1427   const SCEV *WideExpr;
1428   ExtendKind ExtKind;
1429   if (DU.NeverNegative) {
1430     WideExpr = SE->getSignExtendExpr(NarrowExpr, WideType);
1431     if (isa<SCEVAddRecExpr>(WideExpr))
1432       ExtKind = ExtendKind::Sign;
1433     else {
1434       WideExpr = SE->getZeroExtendExpr(NarrowExpr, WideType);
1435       ExtKind = ExtendKind::Zero;
1436     }
1437   } else if (getExtendKind(DU.NarrowDef) == ExtendKind::Sign) {
1438     WideExpr = SE->getSignExtendExpr(NarrowExpr, WideType);
1439     ExtKind = ExtendKind::Sign;
1440   } else {
1441     WideExpr = SE->getZeroExtendExpr(NarrowExpr, WideType);
1442     ExtKind = ExtendKind::Zero;
1443   }
1444   const SCEVAddRecExpr *AddRec = dyn_cast<SCEVAddRecExpr>(WideExpr);
1445   if (!AddRec || AddRec->getLoop() != L)
1446     return {nullptr, ExtendKind::Unknown};
1447   return {AddRec, ExtKind};
1448 }
1449
1450 /// This IV user cannot be widened. Replace this use of the original narrow IV
1451 /// with a truncation of the new wide IV to isolate and eliminate the narrow IV.
1452 static void truncateIVUse(WidenIV::NarrowIVDefUse DU, DominatorTree *DT,
1453                           LoopInfo *LI) {
1454   auto *InsertPt = getInsertPointForUses(DU.NarrowUse, DU.NarrowDef, DT, LI);
1455   if (!InsertPt)
1456     return;
1457   LLVM_DEBUG(dbgs() << "INDVARS: Truncate IV " << *DU.WideDef << " for user "
1458                     << *DU.NarrowUse << "\n");
1459   IRBuilder<> Builder(InsertPt);
1460   Value *Trunc = Builder.CreateTrunc(DU.WideDef, DU.NarrowDef->getType());
1461   DU.NarrowUse->replaceUsesOfWith(DU.NarrowDef, Trunc);
1462 }
1463
1464 /// If the narrow use is a compare instruction, then widen the compare
1465 //  (and possibly the other operand).  The extend operation is hoisted into the
1466 // loop preheader as far as possible.
1467 bool WidenIV::widenLoopCompare(WidenIV::NarrowIVDefUse DU) {
1468   ICmpInst *Cmp = dyn_cast<ICmpInst>(DU.NarrowUse);
1469   if (!Cmp)
1470     return false;
1471
1472   // We can legally widen the comparison in the following two cases:
1473   //
1474   //  - The signedness of the IV extension and comparison match
1475   //
1476   //  - The narrow IV is always positive (and thus its sign extension is equal
1477   //    to its zero extension).  For instance, let's say we're zero extending
1478   //    %narrow for the following use
1479   //
1480   //      icmp slt i32 %narrow, %val   ... (A)
1481   //
1482   //    and %narrow is always positive.  Then
1483   //
1484   //      (A) == icmp slt i32 sext(%narrow), sext(%val)
1485   //          == icmp slt i32 zext(%narrow), sext(%val)
1486   bool IsSigned = getExtendKind(DU.NarrowDef) == ExtendKind::Sign;
1487   if (!(DU.NeverNegative || IsSigned == Cmp->isSigned()))
1488     return false;
1489
1490   Value *Op = Cmp->getOperand(Cmp->getOperand(0) == DU.NarrowDef ? 1 : 0);
1491   unsigned CastWidth = SE->getTypeSizeInBits(Op->getType());
1492   unsigned IVWidth = SE->getTypeSizeInBits(WideType);
1493   assert(CastWidth <= IVWidth && "Unexpected width while widening compare.");
1494
1495   // Widen the compare instruction.
1496   auto *InsertPt = getInsertPointForUses(DU.NarrowUse, DU.NarrowDef, DT, LI);
1497   if (!InsertPt)
1498     return false;
1499   IRBuilder<> Builder(InsertPt);
1500   DU.NarrowUse->replaceUsesOfWith(DU.NarrowDef, DU.WideDef);
1501
1502   // Widen the other operand of the compare, if necessary.
1503   if (CastWidth < IVWidth) {
1504     Value *ExtOp = createExtendInst(Op, WideType, Cmp->isSigned(), Cmp);
1505     DU.NarrowUse->replaceUsesOfWith(Op, ExtOp);
1506   }
1507   return true;
1508 }
1509
1510 // The widenIVUse avoids generating trunc by evaluating the use as AddRec, this
1511 // will not work when:
1512 //    1) SCEV traces back to an instruction inside the loop that SCEV can not
1513 // expand, eg. add %indvar, (load %addr)
1514 //    2) SCEV finds a loop variant, eg. add %indvar, %loopvariant
1515 // While SCEV fails to avoid trunc, we can still try to use instruction
1516 // combining approach to prove trunc is not required. This can be further
1517 // extended with other instruction combining checks, but for now we handle the
1518 // following case (sub can be "add" and "mul", "nsw + sext" can be "nus + zext")
1519 //
1520 // Src:
1521 //   %c = sub nsw %b, %indvar
1522 //   %d = sext %c to i64
1523 // Dst:
1524 //   %indvar.ext1 = sext %indvar to i64
1525 //   %m = sext %b to i64
1526 //   %d = sub nsw i64 %m, %indvar.ext1
1527 // Therefore, as long as the result of add/sub/mul is extended to wide type, no
1528 // trunc is required regardless of how %b is generated. This pattern is common
1529 // when calculating address in 64 bit architecture
1530 bool WidenIV::widenWithVariantUse(WidenIV::NarrowIVDefUse DU) {
1531   Instruction *NarrowUse = DU.NarrowUse;
1532   Instruction *NarrowDef = DU.NarrowDef;
1533   Instruction *WideDef = DU.WideDef;
1534
1535   // Handle the common case of add<nsw/nuw>
1536   const unsigned OpCode = NarrowUse->getOpcode();
1537   // Only Add/Sub/Mul instructions are supported.
1538   if (OpCode != Instruction::Add && OpCode != Instruction::Sub &&
1539       OpCode != Instruction::Mul)
1540     return false;
1541
1542   // The operand that is not defined by NarrowDef of DU. Let's call it the
1543   // other operand.
1544   assert((NarrowUse->getOperand(0) == NarrowDef ||
1545           NarrowUse->getOperand(1) == NarrowDef) &&
1546          "bad DU");
1547
1548   const OverflowingBinaryOperator *OBO =
1549     cast<OverflowingBinaryOperator>(NarrowUse);
1550   ExtendKind ExtKind = getExtendKind(NarrowDef);
1551   bool CanSignExtend = ExtKind == ExtendKind::Sign && OBO->hasNoSignedWrap();
1552   bool CanZeroExtend = ExtKind == ExtendKind::Zero && OBO->hasNoUnsignedWrap();
1553   auto AnotherOpExtKind = ExtKind;
1554
1555   // Check that all uses are either:
1556   // - narrow def (in case of we are widening the IV increment);
1557   // - single-input LCSSA Phis;
1558   // - comparison of the chosen type;
1559   // - extend of the chosen type (raison d'etre).
1560   SmallVector<Instruction *, 4> ExtUsers;
1561   SmallVector<PHINode *, 4> LCSSAPhiUsers;
1562   SmallVector<ICmpInst *, 4> ICmpUsers;
1563   for (Use &U : NarrowUse->uses()) {
1564     Instruction *User = cast<Instruction>(U.getUser());
1565     if (User == NarrowDef)
1566       continue;
1567     if (!L->contains(User)) {
1568       auto *LCSSAPhi = cast<PHINode>(User);
1569       // Make sure there is only 1 input, so that we don't have to split
1570       // critical edges.
1571       if (LCSSAPhi->getNumOperands() != 1)
1572         return false;
1573       LCSSAPhiUsers.push_back(LCSSAPhi);
1574       continue;
1575     }
1576     if (auto *ICmp = dyn_cast<ICmpInst>(User)) {
1577       auto Pred = ICmp->getPredicate();
1578       // We have 3 types of predicates: signed, unsigned and equality
1579       // predicates. For equality, it's legal to widen icmp for either sign and
1580       // zero extend. For sign extend, we can also do so for signed predicates,
1581       // likeweise for zero extend we can widen icmp for unsigned predicates.
1582       if (ExtKind == ExtendKind::Zero && ICmpInst::isSigned(Pred))
1583         return false;
1584       if (ExtKind == ExtendKind::Sign && ICmpInst::isUnsigned(Pred))
1585         return false;
1586       ICmpUsers.push_back(ICmp);
1587       continue;
1588     }
1589     if (ExtKind == ExtendKind::Sign)
1590       User = dyn_cast<SExtInst>(User);
1591     else
1592       User = dyn_cast<ZExtInst>(User);
1593     if (!User || User->getType() != WideType)
1594       return false;
1595     ExtUsers.push_back(User);
1596   }
1597   if (ExtUsers.empty()) {
1598     DeadInsts.emplace_back(NarrowUse);
1599     return true;
1600   }
1601
1602   // We'll prove some facts that should be true in the context of ext users. If
1603   // there is no users, we are done now. If there are some, pick their common
1604   // dominator as context.
1605   const Instruction *CtxI = findCommonDominator(ExtUsers, *DT);
1606
1607   if (!CanSignExtend && !CanZeroExtend) {
1608     // Because InstCombine turns 'sub nuw' to 'add' losing the no-wrap flag, we
1609     // will most likely not see it. Let's try to prove it.
1610     if (OpCode != Instruction::Add)
1611       return false;
1612     if (ExtKind != ExtendKind::Zero)
1613       return false;
1614     const SCEV *LHS = SE->getSCEV(OBO->getOperand(0));
1615     const SCEV *RHS = SE->getSCEV(OBO->getOperand(1));
1616     // TODO: Support case for NarrowDef = NarrowUse->getOperand(1).
1617     if (NarrowUse->getOperand(0) != NarrowDef)
1618       return false;
1619     if (!SE->isKnownNegative(RHS))
1620       return false;
1621     bool ProvedSubNUW = SE->isKnownPredicateAt(ICmpInst::ICMP_UGE, LHS,
1622                                                SE->getNegativeSCEV(RHS), CtxI);
1623     if (!ProvedSubNUW)
1624       return false;
1625     // In fact, our 'add' is 'sub nuw'. We will need to widen the 2nd operand as
1626     // neg(zext(neg(op))), which is basically sext(op).
1627     AnotherOpExtKind = ExtendKind::Sign;
1628   }
1629
1630   // Verifying that Defining operand is an AddRec
1631   const SCEV *Op1 = SE->getSCEV(WideDef);
1632   const SCEVAddRecExpr *AddRecOp1 = dyn_cast<SCEVAddRecExpr>(Op1);
1633   if (!AddRecOp1 || AddRecOp1->getLoop() != L)
1634     return false;
1635
1636   LLVM_DEBUG(dbgs() << "Cloning arithmetic IVUser: " << *NarrowUse << "\n");
1637
1638   // Generating a widening use instruction.
1639   Value *LHS =
1640       (NarrowUse->getOperand(0) == NarrowDef)
1641           ? WideDef
1642           : createExtendInst(NarrowUse->getOperand(0), WideType,
1643                              AnotherOpExtKind == ExtendKind::Sign, NarrowUse);
1644   Value *RHS =
1645       (NarrowUse->getOperand(1) == NarrowDef)
1646           ? WideDef
1647           : createExtendInst(NarrowUse->getOperand(1), WideType,
1648                              AnotherOpExtKind == ExtendKind::Sign, NarrowUse);
1649
1650   auto *NarrowBO = cast<BinaryOperator>(NarrowUse);
1651   auto *WideBO = BinaryOperator::Create(NarrowBO->getOpcode(), LHS, RHS,
1652                                         NarrowBO->getName());
1653   IRBuilder<> Builder(NarrowUse);
1654   Builder.Insert(WideBO);
1655   WideBO->copyIRFlags(NarrowBO);
1656   ExtendKindMap[NarrowUse] = ExtKind;
1657
1658   for (Instruction *User : ExtUsers) {
1659     assert(User->getType() == WideType && "Checked before!");
1660     LLVM_DEBUG(dbgs() << "INDVARS: eliminating " << *User << " replaced by "
1661                       << *WideBO << "\n");
1662     ++NumElimExt;
1663     User->replaceAllUsesWith(WideBO);
1664     DeadInsts.emplace_back(User);
1665   }
1666
1667   for (PHINode *User : LCSSAPhiUsers) {
1668     assert(User->getNumOperands() == 1 && "Checked before!");
1669     Builder.SetInsertPoint(User);
1670     auto *WidePN =
1671         Builder.CreatePHI(WideBO->getType(), 1, User->getName() + ".wide");
1672     BasicBlock *LoopExitingBlock = User->getParent()->getSinglePredecessor();
1673     assert(LoopExitingBlock && L->contains(LoopExitingBlock) &&
1674            "Not a LCSSA Phi?");
1675     WidePN->addIncoming(WideBO, LoopExitingBlock);
1676     Builder.SetInsertPoint(User->getParent(),
1677                            User->getParent()->getFirstInsertionPt());
1678     auto *TruncPN = Builder.CreateTrunc(WidePN, User->getType());
1679     User->replaceAllUsesWith(TruncPN);
1680     DeadInsts.emplace_back(User);
1681   }
1682
1683   for (ICmpInst *User : ICmpUsers) {
1684     Builder.SetInsertPoint(User);
1685     auto ExtendedOp = [&](Value * V)->Value * {
1686       if (V == NarrowUse)
1687         return WideBO;
1688       if (ExtKind == ExtendKind::Zero)
1689         return Builder.CreateZExt(V, WideBO->getType());
1690       else
1691         return Builder.CreateSExt(V, WideBO->getType());
1692     };
1693     auto Pred = User->getPredicate();
1694     auto *LHS = ExtendedOp(User->getOperand(0));
1695     auto *RHS = ExtendedOp(User->getOperand(1));
1696     auto *WideCmp =
1697         Builder.CreateICmp(Pred, LHS, RHS, User->getName() + ".wide");
1698     User->replaceAllUsesWith(WideCmp);
1699     DeadInsts.emplace_back(User);
1700   }
1701
1702   return true;
1703 }
1704
1705 /// Determine whether an individual user of the narrow IV can be widened. If so,
1706 /// return the wide clone of the user.
1707 Instruction *WidenIV::widenIVUse(WidenIV::NarrowIVDefUse DU, SCEVExpander &Rewriter) {
1708   assert(ExtendKindMap.count(DU.NarrowDef) &&
1709          "Should already know the kind of extension used to widen NarrowDef");
1710
1711   // Stop traversing the def-use chain at inner-loop phis or post-loop phis.
1712   if (PHINode *UsePhi = dyn_cast<PHINode>(DU.NarrowUse)) {
1713     if (LI->getLoopFor(UsePhi->getParent()) != L) {
1714       // For LCSSA phis, sink the truncate outside the loop.
1715       // After SimplifyCFG most loop exit targets have a single predecessor.
1716       // Otherwise fall back to a truncate within the loop.
1717       if (UsePhi->getNumOperands() != 1)
1718         truncateIVUse(DU, DT, LI);
1719       else {
1720         // Widening the PHI requires us to insert a trunc.  The logical place
1721         // for this trunc is in the same BB as the PHI.  This is not possible if
1722         // the BB is terminated by a catchswitch.
1723         if (isa<CatchSwitchInst>(UsePhi->getParent()->getTerminator()))
1724           return nullptr;
1725
1726         PHINode *WidePhi =
1727           PHINode::Create(DU.WideDef->getType(), 1, UsePhi->getName() + ".wide",
1728                           UsePhi);
1729         WidePhi->addIncoming(DU.WideDef, UsePhi->getIncomingBlock(0));
1730         BasicBlock *WidePhiBB = WidePhi->getParent();
1731         IRBuilder<> Builder(WidePhiBB, WidePhiBB->getFirstInsertionPt());
1732         Value *Trunc = Builder.CreateTrunc(WidePhi, DU.NarrowDef->getType());
1733         UsePhi->replaceAllUsesWith(Trunc);
1734         DeadInsts.emplace_back(UsePhi);
1735         LLVM_DEBUG(dbgs() << "INDVARS: Widen lcssa phi " << *UsePhi << " to "
1736                           << *WidePhi << "\n");
1737       }
1738       return nullptr;
1739     }
1740   }
1741
1742   // This narrow use can be widened by a sext if it's non-negative or its narrow
1743   // def was widended by a sext. Same for zext.
1744   auto canWidenBySExt = [&]() {
1745     return DU.NeverNegative || getExtendKind(DU.NarrowDef) == ExtendKind::Sign;
1746   };
1747   auto canWidenByZExt = [&]() {
1748     return DU.NeverNegative || getExtendKind(DU.NarrowDef) == ExtendKind::Zero;
1749   };
1750
1751   // Our raison d'etre! Eliminate sign and zero extension.
1752   if ((isa<SExtInst>(DU.NarrowUse) && canWidenBySExt()) ||
1753       (isa<ZExtInst>(DU.NarrowUse) && canWidenByZExt())) {
1754     Value *NewDef = DU.WideDef;
1755     if (DU.NarrowUse->getType() != WideType) {
1756       unsigned CastWidth = SE->getTypeSizeInBits(DU.NarrowUse->getType());
1757       unsigned IVWidth = SE->getTypeSizeInBits(WideType);
1758       if (CastWidth < IVWidth) {
1759         // The cast isn't as wide as the IV, so insert a Trunc.
1760         IRBuilder<> Builder(DU.NarrowUse);
1761         NewDef = Builder.CreateTrunc(DU.WideDef, DU.NarrowUse->getType());
1762       }
1763       else {
1764         // A wider extend was hidden behind a narrower one. This may induce
1765         // another round of IV widening in which the intermediate IV becomes
1766         // dead. It should be very rare.
1767         LLVM_DEBUG(dbgs() << "INDVARS: New IV " << *WidePhi
1768                           << " not wide enough to subsume " << *DU.NarrowUse
1769                           << "\n");
1770         DU.NarrowUse->replaceUsesOfWith(DU.NarrowDef, DU.WideDef);
1771         NewDef = DU.NarrowUse;
1772       }
1773     }
1774     if (NewDef != DU.NarrowUse) {
1775       LLVM_DEBUG(dbgs() << "INDVARS: eliminating " << *DU.NarrowUse
1776                         << " replaced by " << *DU.WideDef << "\n");
1777       ++NumElimExt;
1778       DU.NarrowUse->replaceAllUsesWith(NewDef);
1779       DeadInsts.emplace_back(DU.NarrowUse);
1780     }
1781     // Now that the extend is gone, we want to expose it's uses for potential
1782     // further simplification. We don't need to directly inform SimplifyIVUsers
1783     // of the new users, because their parent IV will be processed later as a
1784     // new loop phi. If we preserved IVUsers analysis, we would also want to
1785     // push the uses of WideDef here.
1786
1787     // No further widening is needed. The deceased [sz]ext had done it for us.
1788     return nullptr;
1789   }
1790
1791   // Does this user itself evaluate to a recurrence after widening?
1792   WidenedRecTy WideAddRec = getExtendedOperandRecurrence(DU);
1793   if (!WideAddRec.first)
1794     WideAddRec = getWideRecurrence(DU);
1795
1796   assert((WideAddRec.first == nullptr) ==
1797          (WideAddRec.second == ExtendKind::Unknown));
1798   if (!WideAddRec.first) {
1799     // If use is a loop condition, try to promote the condition instead of
1800     // truncating the IV first.
1801     if (widenLoopCompare(DU))
1802       return nullptr;
1803
1804     // We are here about to generate a truncate instruction that may hurt
1805     // performance because the scalar evolution expression computed earlier
1806     // in WideAddRec.first does not indicate a polynomial induction expression.
1807     // In that case, look at the operands of the use instruction to determine
1808     // if we can still widen the use instead of truncating its operand.
1809     if (widenWithVariantUse(DU))
1810       return nullptr;
1811
1812     // This user does not evaluate to a recurrence after widening, so don't
1813     // follow it. Instead insert a Trunc to kill off the original use,
1814     // eventually isolating the original narrow IV so it can be removed.
1815     truncateIVUse(DU, DT, LI);
1816     return nullptr;
1817   }
1818
1819   // Reuse the IV increment that SCEVExpander created as long as it dominates
1820   // NarrowUse.
1821   Instruction *WideUse = nullptr;
1822   if (WideAddRec.first == WideIncExpr &&
1823       Rewriter.hoistIVInc(WideInc, DU.NarrowUse))
1824     WideUse = WideInc;
1825   else {
1826     WideUse = cloneIVUser(DU, WideAddRec.first);
1827     if (!WideUse)
1828       return nullptr;
1829   }
1830   // Evaluation of WideAddRec ensured that the narrow expression could be
1831   // extended outside the loop without overflow. This suggests that the wide use
1832   // evaluates to the same expression as the extended narrow use, but doesn't
1833   // absolutely guarantee it. Hence the following failsafe check. In rare cases
1834   // where it fails, we simply throw away the newly created wide use.
1835   if (WideAddRec.first != SE->getSCEV(WideUse)) {
1836     LLVM_DEBUG(dbgs() << "Wide use expression mismatch: " << *WideUse << ": "
1837                       << *SE->getSCEV(WideUse) << " != " << *WideAddRec.first
1838                       << "\n");
1839     DeadInsts.emplace_back(WideUse);
1840     return nullptr;
1841   }
1842
1843   // if we reached this point then we are going to replace
1844   // DU.NarrowUse with WideUse. Reattach DbgValue then.
1845   replaceAllDbgUsesWith(*DU.NarrowUse, *WideUse, *WideUse, *DT);
1846
1847   ExtendKindMap[DU.NarrowUse] = WideAddRec.second;
1848   // Returning WideUse pushes it on the worklist.
1849   return WideUse;
1850 }
1851
1852 /// Add eligible users of NarrowDef to NarrowIVUsers.
1853 void WidenIV::pushNarrowIVUsers(Instruction *NarrowDef, Instruction *WideDef) {
1854   const SCEV *NarrowSCEV = SE->getSCEV(NarrowDef);
1855   bool NonNegativeDef =
1856       SE->isKnownPredicate(ICmpInst::ICMP_SGE, NarrowSCEV,
1857                            SE->getZero(NarrowSCEV->getType()));
1858   for (User *U : NarrowDef->users()) {
1859     Instruction *NarrowUser = cast<Instruction>(U);
1860
1861     // Handle data flow merges and bizarre phi cycles.
1862     if (!Widened.insert(NarrowUser).second)
1863       continue;
1864
1865     bool NonNegativeUse = false;
1866     if (!NonNegativeDef) {
1867       // We might have a control-dependent range information for this context.
1868       if (auto RangeInfo = getPostIncRangeInfo(NarrowDef, NarrowUser))
1869         NonNegativeUse = RangeInfo->getSignedMin().isNonNegative();
1870     }
1871
1872     NarrowIVUsers.emplace_back(NarrowDef, NarrowUser, WideDef,
1873                                NonNegativeDef || NonNegativeUse);
1874   }
1875 }
1876
1877 /// Process a single induction variable. First use the SCEVExpander to create a
1878 /// wide induction variable that evaluates to the same recurrence as the
1879 /// original narrow IV. Then use a worklist to forward traverse the narrow IV's
1880 /// def-use chain. After widenIVUse has processed all interesting IV users, the
1881 /// narrow IV will be isolated for removal by DeleteDeadPHIs.
1882 ///
1883 /// It would be simpler to delete uses as they are processed, but we must avoid
1884 /// invalidating SCEV expressions.
1885 PHINode *WidenIV::createWideIV(SCEVExpander &Rewriter) {
1886   // Is this phi an induction variable?
1887   const SCEVAddRecExpr *AddRec = dyn_cast<SCEVAddRecExpr>(SE->getSCEV(OrigPhi));
1888   if (!AddRec)
1889     return nullptr;
1890
1891   // Widen the induction variable expression.
1892   const SCEV *WideIVExpr = getExtendKind(OrigPhi) == ExtendKind::Sign
1893                                ? SE->getSignExtendExpr(AddRec, WideType)
1894                                : SE->getZeroExtendExpr(AddRec, WideType);
1895
1896   assert(SE->getEffectiveSCEVType(WideIVExpr->getType()) == WideType &&
1897          "Expect the new IV expression to preserve its type");
1898
1899   // Can the IV be extended outside the loop without overflow?
1900   AddRec = dyn_cast<SCEVAddRecExpr>(WideIVExpr);
1901   if (!AddRec || AddRec->getLoop() != L)
1902     return nullptr;
1903
1904   // An AddRec must have loop-invariant operands. Since this AddRec is
1905   // materialized by a loop header phi, the expression cannot have any post-loop
1906   // operands, so they must dominate the loop header.
1907   assert(
1908       SE->properlyDominates(AddRec->getStart(), L->getHeader()) &&
1909       SE->properlyDominates(AddRec->getStepRecurrence(*SE), L->getHeader()) &&
1910       "Loop header phi recurrence inputs do not dominate the loop");
1911
1912   // Iterate over IV uses (including transitive ones) looking for IV increments
1913   // of the form 'add nsw %iv, <const>'. For each increment and each use of
1914   // the increment calculate control-dependent range information basing on
1915   // dominating conditions inside of the loop (e.g. a range check inside of the
1916   // loop). Calculated ranges are stored in PostIncRangeInfos map.
1917   //
1918   // Control-dependent range information is later used to prove that a narrow
1919   // definition is not negative (see pushNarrowIVUsers). It's difficult to do
1920   // this on demand because when pushNarrowIVUsers needs this information some
1921   // of the dominating conditions might be already widened.
1922   if (UsePostIncrementRanges)
1923     calculatePostIncRanges(OrigPhi);
1924
1925   // The rewriter provides a value for the desired IV expression. This may
1926   // either find an existing phi or materialize a new one. Either way, we
1927   // expect a well-formed cyclic phi-with-increments. i.e. any operand not part
1928   // of the phi-SCC dominates the loop entry.
1929   Instruction *InsertPt = &*L->getHeader()->getFirstInsertionPt();
1930   Value *ExpandInst = Rewriter.expandCodeFor(AddRec, WideType, InsertPt);
1931   // If the wide phi is not a phi node, for example a cast node, like bitcast,
1932   // inttoptr, ptrtoint, just skip for now.
1933   if (!(WidePhi = dyn_cast<PHINode>(ExpandInst))) {
1934     // if the cast node is an inserted instruction without any user, we should
1935     // remove it to make sure the pass don't touch the function as we can not
1936     // wide the phi.
1937     if (ExpandInst->hasNUses(0) &&
1938         Rewriter.isInsertedInstruction(cast<Instruction>(ExpandInst)))
1939       DeadInsts.emplace_back(ExpandInst);
1940     return nullptr;
1941   }
1942
1943   // Remembering the WideIV increment generated by SCEVExpander allows
1944   // widenIVUse to reuse it when widening the narrow IV's increment. We don't
1945   // employ a general reuse mechanism because the call above is the only call to
1946   // SCEVExpander. Henceforth, we produce 1-to-1 narrow to wide uses.
1947   if (BasicBlock *LatchBlock = L->getLoopLatch()) {
1948     WideInc =
1949         dyn_cast<Instruction>(WidePhi->getIncomingValueForBlock(LatchBlock));
1950     if (WideInc) {
1951       WideIncExpr = SE->getSCEV(WideInc);
1952       // Propagate the debug location associated with the original loop
1953       // increment to the new (widened) increment.
1954       auto *OrigInc =
1955           cast<Instruction>(OrigPhi->getIncomingValueForBlock(LatchBlock));
1956       WideInc->setDebugLoc(OrigInc->getDebugLoc());
1957     }
1958   }
1959
1960   LLVM_DEBUG(dbgs() << "Wide IV: " << *WidePhi << "\n");
1961   ++NumWidened;
1962
1963   // Traverse the def-use chain using a worklist starting at the original IV.
1964   assert(Widened.empty() && NarrowIVUsers.empty() && "expect initial state" );
1965
1966   Widened.insert(OrigPhi);
1967   pushNarrowIVUsers(OrigPhi, WidePhi);
1968
1969   while (!NarrowIVUsers.empty()) {
1970     WidenIV::NarrowIVDefUse DU = NarrowIVUsers.pop_back_val();
1971
1972     // Process a def-use edge. This may replace the use, so don't hold a
1973     // use_iterator across it.
1974     Instruction *WideUse = widenIVUse(DU, Rewriter);
1975
1976     // Follow all def-use edges from the previous narrow use.
1977     if (WideUse)
1978       pushNarrowIVUsers(DU.NarrowUse, WideUse);
1979
1980     // widenIVUse may have removed the def-use edge.
1981     if (DU.NarrowDef->use_empty())
1982       DeadInsts.emplace_back(DU.NarrowDef);
1983   }
1984
1985   // Attach any debug information to the new PHI.
1986   replaceAllDbgUsesWith(*OrigPhi, *WidePhi, *WidePhi, *DT);
1987
1988   return WidePhi;
1989 }
1990
1991 /// Calculates control-dependent range for the given def at the given context
1992 /// by looking at dominating conditions inside of the loop
1993 void WidenIV::calculatePostIncRange(Instruction *NarrowDef,
1994                                     Instruction *NarrowUser) {
1995   using namespace llvm::PatternMatch;
1996
1997   Value *NarrowDefLHS;
1998   const APInt *NarrowDefRHS;
1999   if (!match(NarrowDef, m_NSWAdd(m_Value(NarrowDefLHS),
2000                                  m_APInt(NarrowDefRHS))) ||
2001       !NarrowDefRHS->isNonNegative())
2002     return;
2003
2004   auto UpdateRangeFromCondition = [&] (Value *Condition,
2005                                        bool TrueDest) {
2006     CmpInst::Predicate Pred;
2007     Value *CmpRHS;
2008     if (!match(Condition, m_ICmp(Pred, m_Specific(NarrowDefLHS),
2009                                  m_Value(CmpRHS))))
2010       return;
2011
2012     CmpInst::Predicate P =
2013             TrueDest ? Pred : CmpInst::getInversePredicate(Pred);
2014
2015     auto CmpRHSRange = SE->getSignedRange(SE->getSCEV(CmpRHS));
2016     auto CmpConstrainedLHSRange =
2017             ConstantRange::makeAllowedICmpRegion(P, CmpRHSRange);
2018     auto NarrowDefRange = CmpConstrainedLHSRange.addWithNoWrap(
2019         *NarrowDefRHS, OverflowingBinaryOperator::NoSignedWrap);
2020
2021     updatePostIncRangeInfo(NarrowDef, NarrowUser, NarrowDefRange);
2022   };
2023
2024   auto UpdateRangeFromGuards = [&](Instruction *Ctx) {
2025     if (!HasGuards)
2026       return;
2027
2028     for (Instruction &I : make_range(Ctx->getIterator().getReverse(),
2029                                      Ctx->getParent()->rend())) {
2030       Value *C = nullptr;
2031       if (match(&I, m_Intrinsic<Intrinsic::experimental_guard>(m_Value(C))))
2032         UpdateRangeFromCondition(C, /*TrueDest=*/true);
2033     }
2034   };
2035
2036   UpdateRangeFromGuards(NarrowUser);
2037
2038   BasicBlock *NarrowUserBB = NarrowUser->getParent();
2039   // If NarrowUserBB is statically unreachable asking dominator queries may
2040   // yield surprising results. (e.g. the block may not have a dom tree node)
2041   if (!DT->isReachableFromEntry(NarrowUserBB))
2042     return;
2043
2044   for (auto *DTB = (*DT)[NarrowUserBB]->getIDom();
2045        L->contains(DTB->getBlock());
2046        DTB = DTB->getIDom()) {
2047     auto *BB = DTB->getBlock();
2048     auto *TI = BB->getTerminator();
2049     UpdateRangeFromGuards(TI);
2050
2051     auto *BI = dyn_cast<BranchInst>(TI);
2052     if (!BI || !BI->isConditional())
2053       continue;
2054
2055     auto *TrueSuccessor = BI->getSuccessor(0);
2056     auto *FalseSuccessor = BI->getSuccessor(1);
2057
2058     auto DominatesNarrowUser = [this, NarrowUser] (BasicBlockEdge BBE) {
2059       return BBE.isSingleEdge() &&
2060              DT->dominates(BBE, NarrowUser->getParent());
2061     };
2062
2063     if (DominatesNarrowUser(BasicBlockEdge(BB, TrueSuccessor)))
2064       UpdateRangeFromCondition(BI->getCondition(), /*TrueDest=*/true);
2065
2066     if (DominatesNarrowUser(BasicBlockEdge(BB, FalseSuccessor)))
2067       UpdateRangeFromCondition(BI->getCondition(), /*TrueDest=*/false);
2068   }
2069 }
2070
2071 /// Calculates PostIncRangeInfos map for the given IV
2072 void WidenIV::calculatePostIncRanges(PHINode *OrigPhi) {
2073   SmallPtrSet<Instruction *, 16> Visited;
2074   SmallVector<Instruction *, 6> Worklist;
2075   Worklist.push_back(OrigPhi);
2076   Visited.insert(OrigPhi);
2077
2078   while (!Worklist.empty()) {
2079     Instruction *NarrowDef = Worklist.pop_back_val();
2080
2081     for (Use &U : NarrowDef->uses()) {
2082       auto *NarrowUser = cast<Instruction>(U.getUser());
2083
2084       // Don't go looking outside the current loop.
2085       auto *NarrowUserLoop = (*LI)[NarrowUser->getParent()];
2086       if (!NarrowUserLoop || !L->contains(NarrowUserLoop))
2087         continue;
2088
2089       if (!Visited.insert(NarrowUser).second)
2090         continue;
2091
2092       Worklist.push_back(NarrowUser);
2093
2094       calculatePostIncRange(NarrowDef, NarrowUser);
2095     }
2096   }
2097 }
2098
2099 PHINode *llvm::createWideIV(const WideIVInfo &WI,
2100     LoopInfo *LI, ScalarEvolution *SE, SCEVExpander &Rewriter,
2101     DominatorTree *DT, SmallVectorImpl<WeakTrackingVH> &DeadInsts,
2102     unsigned &NumElimExt, unsigned &NumWidened,
2103     bool HasGuards, bool UsePostIncrementRanges) {
2104   WidenIV Widener(WI, LI, SE, DT, DeadInsts, HasGuards, UsePostIncrementRanges);
2105   PHINode *WidePHI = Widener.createWideIV(Rewriter);
2106   NumElimExt = Widener.getNumElimExt();
2107   NumWidened = Widener.getNumWidened();
2108   return WidePHI;
2109 }