doxygen/html/ScalarEvolutionExpander_8cpp_source.html

//===- ScalarEvolutionExpander.cpp - Scalar Evolution Analysis ------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file contains the implementation of the scalar evolution expander,

// which is used to generate the code corresponding to a given scalar evolution

// expression.

//

//===----------------------------------------------------------------------===//


#include "llvm/Transforms/Utils/ScalarEvolutionExpander.h"

#include "llvm/ADT/STLExtras.h"

#include "llvm/ADT/ScopeExit.h"

#include "llvm/Analysis/InstructionSimplify.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/Analysis/ScalarEvolutionPatternMatch.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/IR/Dominators.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/raw_ostream.h"

#include "llvm/Transforms/Utils/Local.h"

#include "llvm/Transforms/Utils/LoopUtils.h"


// SCEV_DEBUG_WITH_TYPE(TYPE, X) forwards to DEBUG_WITH_TYPE(TYPE, X) when
// LLVM_ENABLE_ABI_BREAKING_CHECKS is enabled, and expands to nothing
// otherwise.
#if LLVM_ENABLE_ABI_BREAKING_CHECKS

#define SCEV_DEBUG_WITH_TYPE(TYPE, X) DEBUG_WITH_TYPE(TYPE, X)

#else

#define SCEV_DEBUG_WITH_TYPE(TYPE, X)

#endif


using namespace llvm;


// Hidden command-line option `scev-cheap-expansion-budget` (initial value 4).
// Per its description, it sets the budget that counts as "cheap" when SCEV
// expansion is only performed if it is cheap to do.
cl::opt<unsigned> llvm::SCEVCheapExpansionBudget(

    "scev-cheap-expansion-budget", cl::Hidden, cl::init(4),

    cl::desc("When performing SCEV expansion only if it is cheap to do, this "

             "controls the budget that is considered cheap (default = 4)"));


using namespace PatternMatch;

using namespace SCEVPatternMatch;


/// Snapshot the poison-generating flags carried by \p I. Every flag starts out
/// cleared and is only filled in when \p I is of an instruction/operator kind
/// that can carry that particular flag.
PoisonFlags::PoisonFlags(const Instruction *I) {
  // Begin from a clean slate.
  NUW = NSW = false;
  Exact = Disjoint = NNeg = SameSign = false;
  GEPNW = GEPNoWrapFlags::none();

  // nuw/nsw on overflowing binary operators.
  if (isa<OverflowingBinaryOperator>(I)) {
    const auto *Arith = cast<OverflowingBinaryOperator>(I);
    NUW = Arith->hasNoUnsignedWrap();
    NSW = Arith->hasNoSignedWrap();
  }

  // exact
  if (const auto *MaybeExact = dyn_cast<PossiblyExactOperator>(I))
    Exact = MaybeExact->isExact();

  // disjoint
  if (const auto *MaybeDisjoint = dyn_cast<PossiblyDisjointInst>(I))
    Disjoint = MaybeDisjoint->isDisjoint();

  // nneg
  if (const auto *MaybeNonNeg = dyn_cast<PossiblyNonNegInst>(I))
    NNeg = MaybeNonNeg->hasNonNeg();

  // nuw/nsw on trunc.
  if (isa<TruncInst>(I)) {
    const auto *Trunc = cast<TruncInst>(I);
    NUW = Trunc->hasNoUnsignedWrap();
    NSW = Trunc->hasNoSignedWrap();
  }

  // GEP no-wrap flags.
  if (const auto *Gep = dyn_cast<GetElementPtrInst>(I))
    GEPNW = Gep->getNoWrapFlags();

  // samesign on integer compares.
  if (const auto *Cmp = dyn_cast<ICmpInst>(I))
    SameSign = Cmp->hasSameSign();
}


/// Write the recorded flags back onto \p I. Each flag is only written when
/// \p I is of a kind that can carry it.
void PoisonFlags::apply(Instruction *I) {
  // nuw/nsw are carried both by overflowing binary operators and by trunc;
  // the setters are invoked on the instruction itself in either case.
  const bool CarriesWrapFlags =
      isa<OverflowingBinaryOperator>(I) || isa<TruncInst>(I);
  if (CarriesWrapFlags) {
    I->setHasNoUnsignedWrap(NUW);
    I->setHasNoSignedWrap(NSW);
  }

  if (isa<PossiblyExactOperator>(I))
    I->setIsExact(Exact);

  if (isa<PossiblyDisjointInst>(I))
    cast<PossiblyDisjointInst>(I)->setIsDisjoint(Disjoint);

  if (isa<PossiblyNonNegInst>(I))
    cast<PossiblyNonNegInst>(I)->setNonNeg(NNeg);

  if (isa<GetElementPtrInst>(I))
    cast<GetElementPtrInst>(I)->setNoWrapFlags(GEPNW);

  if (isa<ICmpInst>(I))
    cast<ICmpInst>(I)->setSameSign(SameSign);
}


/// ReuseOrCreateCast - Produce a cast of \p V to \p Ty with opcode \p Op that
/// is available at \p IP. An existing cast among the users of \p V is reused
/// when it sits in IP's block at or before IP; otherwise a fresh cast is
/// inserted at \p IP.
Value *SCEVExpander::ReuseOrCreateCast(Value *V, Type *Ty,
                                       Instruction::CastOps Op,
                                       BasicBlock::iterator IP) {
  // Precondition: the builder has a valid insertion point. That point need
  // not be where the users of the returned cast end up, but it must dominate
  // that location. We rely on this to hand back a cast that dominates all of
  // its uses, which matters most when the builder's insertion point *is* the
  // place we were asked to put the cast. Because we only know that the
  // builder's insertion point dominates the eventual uses, we must not move
  // it.
  BasicBlock::iterator BuilderPt = Builder.GetInsertPoint();

  // A user of V qualifies when it is a cast with the requested type and
  // opcode, lives in IP's block at or before IP, and is not itself the
  // builder's insertion point (it has to properly dominate that point).
  auto AsReusableCast = [&](User *Candidate) -> CastInst * {
    if (Candidate->getType() != Ty)
      return nullptr;
    auto *Existing = dyn_cast<CastInst>(Candidate);
    if (!Existing || Existing->getOpcode() != Op)
      return nullptr;
    if (IP->getParent() == Existing->getParent() && &*BuilderPt != Existing &&
        (&*IP == Existing || Existing->comesBefore(&*IP)))
      return Existing;
    return nullptr;
  };

  Value *Result = nullptr;

  // Constants are not scanned for existing casts.
  if (!isa<Constant>(V)) {
    for (User *Candidate : V->users()) {
      if (CastInst *Found = AsReusableCast(Candidate)) {
        Result = Found;
        break;
      }
    }
  }

  // Nothing suitable exists: emit a new cast at IP, restoring the builder's
  // insertion point afterwards.
  if (!Result) {
    SCEVInsertPointGuard Guard(Builder, this);
    Builder.SetInsertPoint(&*IP);
    Result = Builder.CreateCast(Op, V, Ty, V->getName());
  }

  // The check is deferred to the end because IP may name an instruction whose
  // dominance properties differ from those of a cast (an invoke, for
  // example) and which therefore does not dominate the builder's insertion
  // point even though the cast does.
  assert(!isa<Instruction>(Result) ||
         SE.DT.dominates(cast<Instruction>(Result), &*BuilderPt));

  return Result;
}


/// Pick an insertion point following the definition of \p I. When \p I does
/// not provide an insertion point after its definition, fall back to
/// \p MustDominate (which \p I is asserted to dominate). The result is then
/// advanced past instructions inserted by this expander, without ever moving
/// beyond \p MustDominate.
BasicBlock::iterator
SCEVExpander::findInsertPointAfter(Instruction *I,
                                   Instruction *MustDominate) const {
  BasicBlock::iterator Pos;
  auto AfterDef = I->getInsertionPointAfterDef();
  if (!AfterDef) {
    assert(SE.DT.dominates(I, MustDominate) &&
           "instruction must dominate the insertion point");
    Pos = MustDominate->getIterator();
  } else {
    Pos = *AfterDef;
  }

  // Step over instructions the expander itself inserted so that they can be
  // re-used. Stop at MustDominate even if it is an inserted instruction.
  for (; isInsertedInstruction(&*Pos) && &*Pos != MustDominate; ++Pos) {
  }

  return Pos;
}


/// Erase expander-inserted instructions that are trivially dead, walking from
/// every inserted instruction down through the operands of each instruction
/// that gets erased. \p Root is never erased.
void SCEVExpander::eraseDeadInstructions(Value *Root) {
  SmallVector<Value *> Pending;
  SmallPtrSet<Value *, 8> Erased;
  append_range(Pending, getAllInsertedInstructions());

  while (!Pending.empty()) {
    Value *Cur = Pending.pop_back_val();

    // Values already erased may still be queued; never touch them again.
    if (Erased.contains(Cur))
      continue;

    auto *Inst = dyn_cast<Instruction>(Cur);
    if (!Inst)
      continue;
    if (Inst == Root)
      continue;
    if (!isInsertedInstruction(Inst))
      continue;
    if (!isInstructionTriviallyDead(Inst))
      continue;

    // Queue the operands before erasing: they may become dead as a result.
    for (Value *Operand : Inst->operands())
      Pending.push_back(Operand);

    InsertedValues.erase(Inst);
    InsertedPostIncValues.erase(Inst);
    Erased.insert(Inst);
    Inst->eraseFromParent();
  }
}


/// Choose where a cast of \p V should be placed: for arguments, near the top
/// of the entry block; for instructions, right after the instruction; for
/// anything else (asserted to be a constant), at the first insertion point of
/// the entry block of the function being built.
BasicBlock::iterator
SCEVExpander::GetOptimalInsertionPointForCastOf(Value *V) const {
  if (auto *Arg = dyn_cast<Argument>(V)) {
    // Start at the top of the entry block and step over bitcasts whose
    // operand is some *other* argument.
    BasicBlock::iterator Pos = Arg->getParent()->getEntryBlock().begin();
    for (;;) {
      auto *BC = dyn_cast<BitCastInst>(Pos);
      if (!BC)
        break;
      Value *Src = BC->getOperand(0);
      if (!isa<Argument>(Src) || Src == Arg)
        break;
      ++Pos;
    }
    return Pos;
  }

  // An instruction is cast immediately after its definition.
  if (auto *Def = dyn_cast<Instruction>(V))
    return findInsertPointAfter(Def, &*Builder.GetInsertPoint());

  // What remains must be some kind of constant; put the cast into the
  // function's entry block.
  assert(isa<Constant>(V) &&
         "Expected the cast argument to be a global/constant");
  Function *F = Builder.GetInsertBlock()->getParent();
  return F->getEntryBlock().getFirstInsertionPt();
}


/// InsertNoopCastOfTo - Cast \p V to \p Ty, where the conversion is asserted
/// to be a no-op cast (bitcast, ptrtoint or inttoptr between equally sized
/// types). Existing casts are shared where possible and redundant cast pairs
/// are looked through.
Value *SCEVExpander::InsertNoopCastOfTo(Value *V, Type *Ty) {
  const Instruction::CastOps Op = CastInst::getCastOpcode(V, false, Ty, false);
  assert((Op == Instruction::BitCast ||
          Op == Instruction::PtrToInt ||
          Op == Instruction::IntToPtr) &&
         "InsertNoopCastOfTo cannot perform non-noop casts!");
  assert(SE.getTypeSizeInBits(V->getType()) == SE.getTypeSizeInBits(Ty) &&
         "InsertNoopCastOfTo cannot change sizes!");

  const bool IsPtrIntCast =
      Op == Instruction::PtrToInt || Op == Instruction::IntToPtr;

  // inttoptr is only usable for integral pointers. For a non-integral pointer
  // type, build a GEP on null indexed by the integer value instead. This is
  // safe because only expressions that were already based on a GEP of null
  // should be turned into pointers during expansion.
  if (Op == Instruction::IntToPtr) {
    auto *PtrTy = cast<PointerType>(Ty);
    if (DL.isNonIntegralPointerType(PtrTy))
      return Builder.CreatePtrAdd(Constant::getNullValue(PtrTy), V, "scevgep");
  }

  // Bitcasts that would be redundant are skipped entirely.
  if (Op == Instruction::BitCast) {
    if (V->getType() == Ty)
      return V;
    if (auto *Inner = dyn_cast<CastInst>(V);
        Inner && Inner->getOperand(0)->getType() == Ty)
      return Inner->getOperand(0);
  }

  // Look through an existing size-preserving inttoptr/ptrtoint, be it an
  // instruction or a constant expression.
  if (IsPtrIntCast &&
      SE.getTypeSizeInBits(Ty) == SE.getTypeSizeInBits(V->getType())) {
    auto IsWidthPreservingPtrIntCast = [this](const auto *C) {
      const auto Opc = C->getOpcode();
      if (Opc != Instruction::PtrToInt && Opc != Instruction::IntToPtr)
        return false;
      return SE.getTypeSizeInBits(C->getType()) ==
             SE.getTypeSizeInBits(C->getOperand(0)->getType());
    };

    if (auto *CI = dyn_cast<CastInst>(V))
      if (IsWidthPreservingPtrIntCast(CI))
        return CI->getOperand(0);
    if (auto *CE = dyn_cast<ConstantExpr>(V))
      if (IsWidthPreservingPtrIntCast(CE))
        return CE->getOperand(0);
  }

  // A cast of a constant folds to a constant expression.
  if (auto *C = dyn_cast<Constant>(V))
    return ConstantExpr::getCast(Op, C, Ty);

  // Otherwise reuse an existing cast or materialize a new one.
  BasicBlock::iterator CastPt = GetOptimalInsertionPointForCastOf(V);
  return ReuseOrCreateCast(V, Ty, Op, CastPt);
}


/// InsertBinop - Emit `LHS <Opcode> RHS`. Constant operands are folded, an
/// identical nearby instruction with compatible flags is reused, and when
/// \p IsSafeToHoist is set the new instruction is placed in the preheader of
/// the outermost enclosing loop in which both operands are invariant.
Value *SCEVExpander::InsertBinop(Instruction::BinaryOps Opcode,
                                 Value *LHS, Value *RHS,
                                 SCEV::NoWrapFlags Flags, bool IsSafeToHoist) {
  const bool WantNUW = any(Flags & SCEV::FlagNUW);
  const bool WantNSW = any(Flags & SCEV::FlagNSW);

  // Both operands constant: try to fold.
  if (auto *ConstL = dyn_cast<Constant>(LHS))
    if (auto *ConstR = dyn_cast<Constant>(RHS))
      if (Constant *Folded =
              ConstantFoldBinaryOpOperands(Opcode, ConstL, ConstR, DL))
        return Folded;

  // An existing instruction may only be reused if it cannot yield poison in
  // cases where the requested operation would not.
  auto MayProduceDifferentPoison = [WantNUW, WantNSW](Instruction *Cand) {
    // No-wrap flags have to match exactly.
    if (isa<OverflowingBinaryOperator>(Cand) &&
        (Cand->hasNoSignedWrap() != WantNSW ||
         Cand->hasNoUnsignedWrap() != WantNUW))
      return true;
    // Conservatively reject anything carrying the exact flag.
    return isa<PossiblyExactOperator>(Cand) && Cand->isExact();
  };

  // Look at up to six instructions immediately preceding the insertion point
  // (never leaving the block) for an identical binop.
  BasicBlock::iterator BlockBegin = Builder.GetInsertBlock()->begin();
  BasicBlock::iterator Scan = Builder.GetInsertPoint();
  for (unsigned Budget = 6; Budget != 0 && Scan != BlockBegin; --Budget) {
    --Scan;
    if (Scan->getOpcode() == static_cast<unsigned>(Opcode) &&
        Scan->getOperand(0) == LHS && Scan->getOperand(1) == RHS &&
        !MayProduceDifferentPoison(&*Scan))
      return &*Scan;
  }

  // Capture the debug location of the current insertion point, then guard
  // the insertion point so it is restored when we return.
  DebugLoc Loc = Builder.GetInsertPoint()->getDebugLoc();
  SCEVInsertPointGuard Guard(Builder, this);

  if (IsSafeToHoist) {
    // Climb out of every loop in which both operands are invariant and which
    // has a preheader.
    while (const Loop *L = SE.LI.getLoopFor(Builder.GetInsertBlock())) {
      const bool OperandsInvariant =
          L->isLoopInvariant(LHS) && L->isLoopInvariant(RHS);
      if (!OperandsInvariant)
        break;
      BasicBlock *Preheader = L->getLoopPreheader();
      if (!Preheader)
        break;
      Builder.SetInsertPoint(Preheader->getTerminator());
    }
  }

  // No existing binop found: create it.
  Builder.SetCurrentDebugLocation(Loc);

  // In LSRMode, when expanding post-inc rewrites outside of all post-inc
  // loops, bypass the builder's folder so the rewrites are preserved.
  const bool BypassFolder =
      LSRMode && !PostIncLoops.empty() &&
      all_of(PostIncLoops, [&](const Loop *L) {
        return !L->contains(Builder.GetInsertBlock());
      });
  if (!BypassFolder)
    return Builder.CreateNoWrapBinOp(Opcode, LHS, RHS, WantNUW, WantNSW);

  auto *BO = BinaryOperator::Create(Opcode, LHS, RHS);
  if (WantNUW)
    BO->setHasNoUnsignedWrap();
  if (WantNSW)
    BO->setHasNoSignedWrap();
  return Builder.Insert(BO);
}


/// expandAddToGEP - Expand a pointer-typed addition as a getelementptr rather
/// than as ptrtoint + arithmetic + inttoptr, which helps BasicAliasAnalysis
/// and other passes reason about the result. See the rules for getelementptr
/// vs. inttoptr in
/// http://llvm.org/docs/LangRef.html#pointeraliasing
/// for details.
///
/// Design note: using getelementptr here is only correct because
/// ScalarEvolution does not recognize inttoptr and ptrtoint operators; those
/// may introduce pointer arithmetic that cannot safely be converted into a
/// getelementptr.
///
/// Design note: it may look attractive to make this function more loop-aware
/// and emit several GEPs so that loop-invariant indices stay outside the
/// loop. That is deliberately not done. Hoisting simple arithmetic is a
/// low-level optimization that usually only matters late in the pipeline.
/// Passes like InstructionCombining will merge GEPs even if that pushes
/// loop-invariant computation into loops, so a split made here would quickly
/// be undone. LoopStrengthReduction, which usually runs quite late (after the
/// last InstructionCombining pass), handles hoisting the loop-invariant
/// portions of expressions once it has considered what can be folded into
/// target addressing modes.
///
Value *SCEVExpander::expandAddToGEP(const SCEV *Offset, Value *V,
                                    SCEV::NoWrapFlags Flags) {
  assert(!isa<Instruction>(V) ||
         SE.DT.dominates(cast<Instruction>(V), &*Builder.GetInsertPoint()));

  Value *Idx = expand(Offset);

  // Only nuw is carried over from the SCEV flags onto the GEP.
  GEPNoWrapFlags NW = GEPNoWrapFlags::none();
  if (any(Flags & SCEV::FlagNUW))
    NW = GEPNoWrapFlags::noUnsignedWrap();

  // Constant base and constant index: let the builder fold the GEP.
  if (auto *ConstBase = dyn_cast<Constant>(V))
    if (auto *ConstIdx = dyn_cast<Constant>(Idx))
      return Builder.CreatePtrAdd(ConstBase, ConstIdx, "", NW);

  // Look at up to six instructions immediately preceding the insertion point
  // (never leaving the block) for an identical i8 GEP.
  BasicBlock::iterator BlockBegin = Builder.GetInsertBlock()->begin();
  BasicBlock::iterator Scan = Builder.GetInsertPoint();
  for (unsigned Budget = 6; Budget != 0 && Scan != BlockBegin; --Budget) {
    --Scan;
    auto *GEP = dyn_cast<GetElementPtrInst>(Scan);
    if (!GEP)
      continue;
    if (GEP->getPointerOperand() != V ||
        GEP->getSourceElementType() != Builder.getInt8Ty() ||
        GEP->getOperand(1) != Idx)
      continue;
    // Record the flags the GEP had before narrowing them to the intersection
    // with what this expansion is allowed to claim.
    rememberFlags(GEP);
    GEP->setNoWrapFlags(GEP->getNoWrapFlags() & NW);
    return &*Scan;
  }

  // Guard the insertion point so it is restored when we return.
  SCEVInsertPointGuard Guard(Builder, this);

  // Climb out of every loop in which both the base and the index are
  // invariant and which has a preheader.
  while (const Loop *L = SE.LI.getLoopFor(Builder.GetInsertBlock())) {
    const bool OperandsInvariant =
        L->isLoopInvariant(V) && L->isLoopInvariant(Idx);
    if (!OperandsInvariant)
      break;
    BasicBlock *Preheader = L->getLoopPreheader();
    if (!Preheader)
      break;
    Builder.SetInsertPoint(Preheader->getTerminator());
  }

  // Emit the GEP.
  return Builder.CreatePtrAdd(V, Idx, "scevgep", NW);
}


/// PickMostRelevantLoop - Given two loops pick the one that's most relevant for
/// SCEV expansion. If they are nested, this is the most nested. If they are
/// neighboring, pick the later.
///
/// \param A   First candidate; may be null.
/// \param B   Second candidate; may be null.
/// \param DT  Dominator tree used to order loops that do not nest.
/// \returns The other loop when one of them is null; the inner loop when one
///          contains the other; \p B when the header of \p A dominates the
///          header of \p B; and \p A in every remaining case.
static const Loop *PickMostRelevantLoop(const Loop *A, const Loop *B,
                                        DominatorTree &DT) {
  // A missing loop never wins.
  if (!A)
    return B;
  if (!B)
    return A;

  // Nested loops: prefer the inner one.
  if (A->contains(B))
    return B;
  if (B->contains(A))
    return A;

  // Neither loop contains the other. B is the later loop only when A's header
  // dominates B's header. Whether B's header dominates A's or the two are
  // unordered, the answer is A, so a second dominance query is unnecessary.
  return DT.dominates(A->getHeader(), B->getHeader()) ? B : A;
}


/// getRelevantLoop - Return the most relevant loop for \p S as ranked by
/// PickMostRelevantLoop. Results are memoized in RelevantLoops.
const Loop *SCEVExpander::getRelevantLoop(const SCEV *S) {
  // Reserve a cache slot; if one already existed, its value is the answer.
  auto [Slot, IsNew] = RelevantLoops.try_emplace(S);
  if (!IsNew)
    return Slot->second;

  switch (S->getSCEVType()) {
  case scCouldNotCompute:
    llvm_unreachable("Attempt to use a SCEVCouldNotCompute object!");

  case scConstant:
  case scVScale:
    // Constants are not tied to any loop.
    return nullptr;

  case scUnknown: {
    const auto *Unknown = cast<SCEVUnknown>(S);
    // An instruction's relevant loop is the loop of its parent block.
    if (const auto *Def = dyn_cast<Instruction>(Unknown->getValue()))
      return Slot->second = SE.LI.getLoopFor(Def->getParent());
    // Non-instructions are not tied to any loop.
    return nullptr;
  }

  case scTruncate:
  case scZeroExtend:
  case scSignExtend:
  case scPtrToAddr:
  case scPtrToInt:
  case scAddExpr:
  case scMulExpr:
  case scUDivExpr:
  case scAddRecExpr:
  case scUMaxExpr:
  case scSMaxExpr:
  case scUMinExpr:
  case scSMinExpr:
  case scSequentialUMinExpr: {
    // An addrec starts from its own loop; everything else starts from none.
    const Loop *Best =
        isa<SCEVAddRecExpr>(S) ? cast<SCEVAddRecExpr>(S)->getLoop() : nullptr;
    // Fold in the relevant loop of every operand.
    for (const SCEV *Operand : S->operands())
      Best = PickMostRelevantLoop(Best, getRelevantLoop(Operand), SE.DT);
    // The recursive calls above may have modified the map, so the slot is
    // looked up again instead of reusing the earlier iterator.
    return RelevantLoops[S] = Best;
  }
  }

  llvm_unreachable("Unexpected SCEV type!");
}


namespace {


/// LoopCompare - Compare loops by PickMostRelevantLoop.

class LoopCompare {

  DominatorTree &DT;

public:

  explicit LoopCompare(DominatorTree &dt) : DT(dt) {}


  bool operator()(std::pair<const Loop *, const SCEV *> LHS,

                  std::pair<const Loop *, const SCEV *> RHS) const {

    // Keep pointer operands sorted at the end.

    if (LHS.second->getType()->isPointerTy() !=

        RHS.second->getType()->isPointerTy())

      return LHS.second->getType()->isPointerTy();


    // Compare loops with PickMostRelevantLoop.

    if (LHS.first != RHS.first)

      return PickMostRelevantLoop(LHS.first, RHS.first, DT) != LHS.first;


    // If one operand is a non-constant negative and the other is not,

    // put the non-constant negative on the right so that a sub can

    // be used instead of a negate and add.

    if (LHS.second->isNonConstantNegative()) {

      if (!RHS.second->isNonConstantNegative())

        return false;

    } else if (RHS.second->isNonConstantNegative())

      return true;


    // Otherwise they are equivalent according to this comparison.

    return false;

  }

};


}


/// Expand an add expression. The canonical form of an unsimplified urem is
/// emitted as a single urem; otherwise the operands are grouped by relevant
/// loop and summed, using a GEP while the running sum is a pointer and a sub
/// for non-constant negative operands.
Value *SCEVExpander::visitAddExpr(SCEVUseT<const SCEVAddExpr *> S) {
  // Recognize the canonical representation of an unsimplified urem.
  const SCEV *Dividend = nullptr;
  const SCEV *Divisor = nullptr;
  if (match(S, m_scev_URem(m_SCEV(Dividend), m_SCEV(Divisor), SE))) {
    Value *Num = expand(Dividend);
    Value *Den = expand(Divisor);
    return InsertBinop(Instruction::URem, Num, Den, SCEV::FlagAnyWrap,
                       /*IsSafeToHoist*/ false);
  }

  // Pair every operand with its relevant loop. Walking the operands in
  // reverse means that, all else equal, constants are emitted last and
  // pointer operands are inserted first, which the GEP formation below
  // depends on.
  using LoopAndOp = std::pair<const Loop *, const SCEV *>;
  SmallVector<LoopAndOp, 8> Terms;
  for (const SCEV *Operand : reverse(S->operands()))
    Terms.emplace_back(getRelevantLoop(Operand), Operand);

  // Order by loop. The sort is stable so that constants keep following
  // non-constants and pointer operands keep preceding non-pointer operands.
  llvm::stable_sort(Terms, LoopCompare(SE.DT));

  // Add the operands together, hoisting as much as possible out of loops and
  // forming meaningful getelementptrs where possible.
  Value *Sum = nullptr;
  auto It = Terms.begin();
  const auto End = Terms.end();
  while (It != End) {
    const Loop *GroupLoop = It->first;
    const SCEV *Term = It->second;

    // The very first operand is simply expanded.
    if (!Sum) {
      Sum = expand(Term);
      ++It;
      continue;
    }

    assert(!Term->getType()->isPointerTy() && "Only first op can be pointer");

    if (isa<PointerType>(Sum->getType())) {
      // The running sum is a pointer: gather every remaining operand that
      // belongs to the same loop and fold them into one GEP on top of it.
      SmallVector<SCEVUse, 4> Offsets;
      while (It != End && It->first == GroupLoop) {
        // Peek through a SCEVUnknown that is not an instruction so that more
        // of it can be folded into the GEP.
        const SCEV *X = It->second;
        if (const auto *Unknown = dyn_cast<SCEVUnknown>(X))
          if (!isa<Instruction>(Unknown->getValue()))
            X = SE.getSCEV(Unknown->getValue());
        Offsets.push_back(X);
        ++It;
      }
      Sum = expandAddToGEP(SE.getAddExpr(Offsets), Sum, S.getNoWrapFlags());
      continue;
    }

    if (Term->isNonConstantNegative()) {
      // Subtract the negation rather than negating and adding.
      Value *Negated = expand(SE.getNegativeSCEV(Term));
      Sum = InsertBinop(Instruction::Sub, Sum, Negated, SCEV::FlagAnyWrap,
                        /*IsSafeToHoist*/ true);
      ++It;
      continue;
    }

    // Plain addition, with a constant canonicalized to the right-hand side.
    Value *Addend = expand(Term);
    if (isa<Constant>(Sum))
      std::swap(Sum, Addend);
    Sum = InsertBinop(Instruction::Add, Sum, Addend, S.getNoWrapFlags(),
                      /*IsSafeToHoist*/ true);
    ++It;
  }

  return Sum;
}


/// Expand a mul expression. Operands are grouped by relevant loop; runs of
/// identical operands are expanded as a power via repeated squaring, a
/// multiplication by all-ones becomes a negation, and a multiplication by a
/// power of two becomes a shift.
Value *SCEVExpander::visitMulExpr(SCEVUseT<const SCEVMulExpr *> S) {
  Type *Ty = S->getType();

  // Pair every operand with its relevant loop. Walking the operands in
  // reverse means that, all else equal, constants are emitted last.
  using LoopAndOp = std::pair<const Loop *, const SCEV *>;
  SmallVector<LoopAndOp, 8> Factors;
  for (const SCEV *Operand : reverse(S->operands()))
    Factors.emplace_back(getRelevantLoop(Operand), Operand);

  // Order by loop. The sort is stable so constants keep following
  // non-constants.
  llvm::stable_sort(Factors, LoopCompare(SE.DT));

  // Multiply the operands together, hoisting as much as possible out of
  // loops.
  Value *Prod = nullptr;
  auto Cursor = Factors.begin();

  // Expands X pow N, where N is the length of the run of entries equal to
  // *Cursor, and advances Cursor past that run. With
  // N = P1 + P2 + ... + PK, all P being powers of two:
  //   X pow N = (X pow P1) * (X pow P2) * ... * (X pow PK).
  const auto ExpandRunAsPower = [this, &Cursor, &Factors]() {
    // Count how many times the same operand from the same loop occurs. The
    // count is capped at UINT64_MAX / 2 so that the power of two probed in
    // the loop below can exceed the exponent without overflowing 64 bits.
    // No one sane will ever need exponents that large.
    const uint64_t MaxExponent = UINT64_MAX >> 1;
    uint64_t Exponent = 0;
    auto RunEnd = Cursor;
    for (; RunEnd != Factors.end() && *Cursor == *RunEnd &&
           Exponent != MaxExponent;
         ++RunEnd)
      ++Exponent;
    assert(Exponent > 0 && "Trying to calculate a zeroth exponent of operand?");

    // Build the powers with exponents 1, 2, 4, 8, ... by squaring and
    // multiply those selected by the bits of Exponent into the result.
    Value *Power = expand(Cursor->second);
    Value *Result = (Exponent & 1) ? Power : nullptr;
    for (uint64_t Bit = 2; Bit <= Exponent; Bit <<= 1) {
      Power = InsertBinop(Instruction::Mul, Power, Power, SCEV::FlagAnyWrap,
                          /*IsSafeToHoist*/ true);
      if (!(Exponent & Bit))
        continue;
      Result = Result ? InsertBinop(Instruction::Mul, Result, Power,
                                    SCEV::FlagAnyWrap,
                                    /*IsSafeToHoist*/ true)
                      : Power;
    }

    Cursor = RunEnd;
    assert(Result && "Nothing was expanded?");
    return Result;
  };

  while (Cursor != Factors.end()) {
    // The first operand (run) is simply expanded.
    if (!Prod) {
      Prod = ExpandRunAsPower();
      continue;
    }

    // Multiplying by negative one is emitted as a negation.
    if (Cursor->second->isAllOnesValue()) {
      Prod = InsertBinop(Instruction::Sub, Constant::getNullValue(Ty), Prod,
                         SCEV::FlagAnyWrap, /*IsSafeToHoist*/ true);
      ++Cursor;
      continue;
    }

    // Plain multiplication, with a constant canonicalized to the right-hand
    // side.
    Value *W = ExpandRunAsPower();
    if (isa<Constant>(Prod))
      std::swap(Prod, W);

    const APInt *RHS;
    if (!match(W, m_Power2(RHS))) {
      Prod = InsertBinop(Instruction::Mul, Prod, W, S.getNoWrapFlags(),
                         /*IsSafeToHoist*/ true);
      continue;
    }

    // Canonicalize Prod*(1<<C) to Prod<<C.
    assert(!Ty->isVectorTy() && "vector types are not SCEVable");
    auto NWFlags = S.getNoWrapFlags();
    // Drop nsw when the shift amount is bitwidth - 1, since the shl would
    // produce a poison value.
    if (RHS->logBase2() == RHS->getBitWidth() - 1)
      NWFlags = ScalarEvolution::clearFlags(NWFlags, SCEV::FlagNSW);
    Prod = InsertBinop(Instruction::Shl, Prod,
                       ConstantInt::get(Ty, RHS->logBase2()), NWFlags,
                       /*IsSafeToHoist*/ true);
  }

  return Prod;
}


/// Expand an unsigned division. A constant power-of-two divisor becomes a
/// logical shift right. In SafeUDivMode the divisor is frozen and/or clamped
/// to at least 1 when it is not known to be non-zero and poison-free.
Value *SCEVExpander::visitUDivExpr(SCEVUseT<const SCEVUDivExpr *> S) {
  Value *LHS = expand(S->getLHS());

  // udiv by 2^k  ==>  lshr by k.
  if (const auto *SC = dyn_cast<SCEVConstant>(S->getRHS())) {
    const APInt &Divisor = SC->getAPInt();
    if (Divisor.isPowerOf2()) {
      Constant *ShiftAmt = ConstantInt::get(SC->getType(), Divisor.logBase2());
      return InsertBinop(Instruction::LShr, LHS, ShiftAmt, SCEV::FlagAnyWrap,
                         /*IsSafeToHoist*/ true);
    }
  }

  const SCEV *RHSExpr = S->getRHS();
  Value *RHS = expand(RHSExpr);

  if (SafeUDivMode) {
    const bool NeverPoison =
        ScalarEvolution::isGuaranteedNotToBePoison(RHSExpr);
    if (!NeverPoison)
      RHS = Builder.CreateFreeze(RHS);

    // A umax with 1 is needed if RHSExpr is not known to be non-zero, or if
    // it is not guaranteed to be non-poison. In the latter case, the frozen
    // poison may be 0.
    if (!SE.isKnownNonZero(RHSExpr) || !NeverPoison) {
      Type *RHSTy = RHS->getType();
      RHS = Builder.CreateIntrinsic(RHSTy, Intrinsic::umax,
                                    {RHS, ConstantInt::get(RHSTy, 1)});
    }
  }

  // The division is only hoisted when the divisor is known to be non-zero.
  const bool CanHoist = SE.isKnownNonZero(S->getRHS());
  return InsertBinop(Instruction::UDiv, LHS, RHS, SCEV::FlagAnyWrap,
                     /*IsSafeToHoist*/ CanHoist);
}


/// Check whether following operand 0 from \p IncV leads back to \p PN through
/// a well-behaved chain of instructions. If so, the chain may be reused by
/// expanded expressions.
bool SCEVExpander::isNormalAddRecExprPHI(PHINode *PN, Instruction *IncV,
                                         const Loop *L) {
  // Walk the chain one link at a time until it reaches PN or is rejected.
  for (;;) {
    // Reject operand-less instructions, PHIs, and any cast other than a
    // bitcast.
    const bool IsNonBitCast = isa<CastInst>(IncV) && !isa<BitCastInst>(IncV);
    if (IncV->getNumOperands() == 0 || isa<PHINode>(IncV) || IsNonBitCast)
      return false;

    // Bail if any operand other than the first fails to dominate the insert
    // position. Addrec operands are always loop-invariant, so this can only
    // happen if there are instructions which haven't been hoisted.
    if (L == IVIncInsertLoop) {
      for (Use &Op : llvm::drop_begin(IncV->operands())) {
        auto *OInst = dyn_cast<Instruction>(Op);
        if (OInst && !SE.DT.dominates(OInst, IVIncInsertPos))
          return false;
      }
    }

    // Move on to the next link of the chain.
    IncV = dyn_cast<Instruction>(IncV->getOperand(0));
    if (!IncV || IncV->mayHaveSideEffects())
      return false;

    if (IncV == PN)
      return true;
  }
}


/// getIVIncOperand returns an induction variable increment's induction
/// variable operand, or null when \p IncV is not a recognized increment.
///
/// With allowScale set, any kind of GEP is accepted as long as its non-IV
/// operands dominate InsertPos.
///
/// Without allowScale, a GEP increment must additionally conform to one of
/// the simple patterns generated by getAddRecExprPHILiterally and
/// expandAddToGEP; if the pattern isn't recognized, null is returned.
Instruction *SCEVExpander::getIVIncOperand(Instruction *IncV,
                                           Instruction *InsertPos,
                                           bool allowScale) {
  if (IncV == InsertPos)
    return nullptr;

  const unsigned Opc = IncV->getOpcode();

  // A bitcast simply forwards its operand.
  if (Opc == Instruction::BitCast)
    return dyn_cast<Instruction>(IncV->getOperand(0));

  // Simple add/sub: the step (operand 1) must be a non-instruction or
  // dominate InsertPos.
  if (Opc == Instruction::Add || Opc == Instruction::Sub) {
    auto *Step = dyn_cast<Instruction>(IncV->getOperand(1));
    if (Step && !SE.DT.dominates(Step, InsertPos))
      return nullptr;
    return dyn_cast<Instruction>(IncV->getOperand(0));
  }

  // Everything that is not a GEP is rejected.
  if (Opc != Instruction::GetElementPtr)
    return nullptr;

  for (Use &U : llvm::drop_begin(IncV->operands())) {
    if (isa<Constant>(U))
      continue;

    if (auto *OInst = dyn_cast<Instruction>(U))
      if (!SE.DT.dominates(OInst, InsertPos))
        return nullptr;

    if (!allowScale) {
      // GEPs produced by SCEVExpander use i8 element type.
      if (!cast<GEPOperator>(IncV)->getSourceElementType()->isIntegerTy(8))
        return nullptr;
      // The scan stops after the first non-constant operand in this mode.
      break;
    }
    // With allowScale, any kind of GEP is fine as long as it can be hoisted;
    // keep checking the remaining operands.
  }

  return dyn_cast<Instruction>(IncV->getOperand(0));
}


/// Re-point any insertion point that currently refers to \p I at the
/// instruction following \p I. This covers both the current builder and
/// every guard on the stack of saved insertion points, and is meant to be
/// called when \p I is about to be moved. Without the fixup, moving \p I to
/// a different block would leave an inconsistent insertion point (with a
/// mismatched Instruction and Block), which can lead to an instruction being
/// inserted in a block other than its parent.
void SCEVExpander::fixupInsertPoints(Instruction *I) {
  BasicBlock::iterator OldPt(*I);
  BasicBlock::iterator Successor = std::next(OldPt);

  // The live builder.
  if (Builder.GetInsertPoint() == OldPt)
    Builder.SetInsertPoint(&*Successor);

  // Every saved insertion point.
  for (auto *Guard : InsertPointGuards) {
    if (Guard->GetInsertPoint() != OldPt)
      continue;
    Guard->SetInsertPoint(Successor);
  }
}


/// hoistIVInc - Attempt to hoist a simple IV increment above InsertPos to make
/// it available to other uses in this loop. The operands feeding the increment
/// are hoisted along with it, following the chain until a value that already
/// dominates InsertPos is reached.
///
/// When RecomputePoisonFlags is set, the poison-generating flags of every
/// affected instruction are dropped and the no-wrap flags are re-inferred.
///
/// Returns true if IncV dominates InsertPos on exit. Returns false, without
/// moving anything, if the increment cannot be hoisted.
bool SCEVExpander::hoistIVInc(Instruction *IncV, Instruction *InsertPos,
                              bool RecomputePoisonFlags) {
  // Drop flags that are potentially inferred from the old context and infer
  // flags in the new context.
  auto RefreshFlags = [this](Instruction *Inst) {
    rememberFlags(Inst);
    Inst->dropPoisonGeneratingFlags();

    auto *OBO = dyn_cast<OverflowingBinaryOperator>(Inst);
    if (!OBO)
      return;
    auto Flags = SE.getStrengthenedNoWrapFlagsFromBinOp(OBO);
    if (!Flags)
      return;

    auto *BinOp = cast<BinaryOperator>(Inst);
    BinOp->setHasNoUnsignedWrap(
        ScalarEvolution::maskFlags(*Flags, SCEV::FlagNUW) == SCEV::FlagNUW);
    BinOp->setHasNoSignedWrap(
        ScalarEvolution::maskFlags(*Flags, SCEV::FlagNSW) == SCEV::FlagNSW);
  };

  // Nothing to move if the increment is already available at InsertPos.
  if (SE.DT.dominates(IncV, InsertPos)) {
    if (RecomputePoisonFlags)
      RefreshFlags(IncV);
    return true;
  }

  // InsertPos must itself dominate IncV so that IncV's new position satisfies
  // its existing users.
  if (isa<PHINode>(InsertPos))
    return false;
  if (!SE.DT.dominates(InsertPos->getParent(), IncV->getParent()))
    return false;
  if (!SE.LI.movementPreservesLCSSAForm(IncV, InsertPos))
    return false;

  // Check that the chain of IV operands leading back to Phi can be hoisted,
  // collecting the instructions that need to move.
  SmallVector<Instruction *, 4> Chain;
  Instruction *Cur = IncV;
  do {
    Instruction *Next = getIVIncOperand(Cur, InsertPos, /*allowScale*/ true);
    if (!Next)
      return false;
    // Cur is safe to hoist.
    Chain.push_back(Cur);
    Cur = Next;
  } while (!SE.DT.dominates(Cur, InsertPos));

  // Move the chain in reverse collection order, so that operands are placed
  // before the instructions that use them.
  for (Instruction *ToMove : llvm::reverse(Chain)) {
    fixupInsertPoints(ToMove);
    ToMove->moveBefore(InsertPos->getIterator());
    if (RecomputePoisonFlags)
      RefreshFlags(ToMove);
  }
  return true;
}


/// Return true when OrigInc is a binary operator with OrigPhi as one of its
/// operands (in either position), WideInc is a binary operator with WidePhi as
/// one of its operands, and both increments have the same opcode.
bool SCEVExpander::canReuseFlagsFromOriginalIVInc(PHINode *OrigPhi,
                                                  PHINode *WidePhi,
                                                  Instruction *OrigInc,
                                                  Instruction *WideInc) {
  if (!match(OrigInc, m_c_BinOp(m_Specific(OrigPhi), m_Value())))
    return false;
  if (!match(WideInc, m_c_BinOp(m_Specific(WidePhi), m_Value())))
    return false;
  return OrigInc->getOpcode() == WideInc->getOpcode();
}


/// Determine if this cyclic phi is in a form that would have been generated by
/// LSR. Whether the phi was actually expanded in this pass does not matter, as
/// long as it is in a low-cost form (for example, no implied multiplication).
/// This should match any patterns generated by getAddRecExprPHILiterally and
/// expandAddtoGEP.
///
/// The check follows the operand chain starting at IncV, using the preheader
/// terminator of L as the reference position, and succeeds when PN is reached.
bool SCEVExpander::isExpandedAddRecExprPHI(PHINode *PN, Instruction *IncV,
                                           const Loop *L) {
  Instruction *PreheaderTerm = L->getLoopPreheader()->getTerminator();
  Instruction *Cur = IncV;
  while (true) {
    Cur = getIVIncOperand(Cur, PreheaderTerm, /*allowScale=*/false);
    // The chain ended (or hit an unrecognized pattern) before reaching PN.
    if (!Cur)
      return false;
    if (Cur == PN)
      return true;
  }
}


/// expandIVInc - Expand an IV increment at Builder's current InsertPos.
/// Typically this is the LatchBlock terminator or IVIncInsertPos, but we may
/// need to materialize IV increments elsewhere to handle difficult situations.
///
/// A pointer-typed PHI is advanced with a pointer add; any other PHI gets a
/// sub (when useSubtract is set) or an add.
Value *SCEVExpander::expandIVInc(PHINode *PN, Value *StepV, const Loop *L,
                                 bool useSubtract) {
  if (PN->getType()->isPointerTy()) {
    // TODO: Change name to IVName.iv.next.
    return Builder.CreatePtrAdd(PN, StepV, "scevgep");
  }

  if (useSubtract)
    return Builder.CreateSub(PN, StepV, Twine(IVName) + ".iv.next");
  return Builder.CreateAdd(PN, StepV, Twine(IVName) + ".iv.next");
}


/// Check whether we can cheaply express the requested SCEV in terms of
/// the available PHI SCEV by truncation and/or inversion of the step.
///
/// On success, InvertStep reports whether the step has to be inverted. It is
/// left untouched when the function returns false.
static bool canBeCheaplyTransformed(ScalarEvolution &SE,
                                    const SCEVAddRecExpr *Phi,
                                    const SCEVAddRecExpr *Requested,
                                    bool &InvertStep) {
  Type *AvailableTy = Phi->getType();
  Type *WantedTy = Requested->getType();

  // We can't transform to match a pointer PHI.
  if (PhiTyIsPointer(AvailableTy, WantedTy))
    return false;

  // Only truncation is supported; the PHI must be at least as wide.
  if (WantedTy->getIntegerBitWidth() > AvailableTy->getIntegerBitWidth())
    return false;

  // Try to truncate it if necessary.
  const SCEVAddRecExpr *Narrowed =
      dyn_cast<SCEVAddRecExpr>(SE.getTruncateOrNoop(Phi, WantedTy));
  if (!Narrowed)
    return false;

  // Check whether truncation alone is enough.
  if (Narrowed == Requested) {
    InvertStep = false;
    return true;
  }

  // Check whether inverting will help: {R,+,-1} == R - {0,+,1}.
  if (SE.getMinusSCEV(Requested->getStart(), Requested) == Narrowed) {
    InvertStep = true;
    return true;
  }

  return false;
}


/// Return true if sign-extending AR and its step to twice the bit width and
/// then adding them yields the same SCEV as adding first and sign-extending
/// the sum. Non-integer addrecs always yield false.
static bool IsIncrementNSW(ScalarEvolution &SE, const SCEVAddRecExpr *AR) {
  auto *NarrowTy = dyn_cast<IntegerType>(AR->getType());
  if (!NarrowTy)
    return false;

  Type *WideTy =
      IntegerType::get(NarrowTy->getContext(), NarrowTy->getBitWidth() * 2);
  const SCEV *Step = AR->getStepRecurrence(SE);

  // sext(Step) + sext(AR)
  const SCEV *WideStep = SE.getSignExtendExpr(Step, WideTy);
  const SCEV *WideAR = SE.getSignExtendExpr(AR, WideTy);
  const SCEV *OpAfterExtend = SE.getAddExpr(WideStep, WideAR);

  // sext(AR + Step)
  const SCEV *NarrowSum = SE.getAddExpr(AR, Step);
  const SCEV *ExtendAfterOp = SE.getSignExtendExpr(NarrowSum, WideTy);

  return ExtendAfterOp == OpAfterExtend;
}


/// Return true if zero-extending AR and its step to twice the bit width and
/// then adding them yields the same SCEV as adding first and zero-extending
/// the sum. Non-integer addrecs always yield false.
static bool IsIncrementNUW(ScalarEvolution &SE, const SCEVAddRecExpr *AR) {
  auto *NarrowTy = dyn_cast<IntegerType>(AR->getType());
  if (!NarrowTy)
    return false;

  Type *WideTy =
      IntegerType::get(NarrowTy->getContext(), NarrowTy->getBitWidth() * 2);
  const SCEV *Step = AR->getStepRecurrence(SE);

  // zext(Step) + zext(AR)
  const SCEV *WideStep = SE.getZeroExtendExpr(Step, WideTy);
  const SCEV *WideAR = SE.getZeroExtendExpr(AR, WideTy);
  const SCEV *OpAfterExtend = SE.getAddExpr(WideStep, WideAR);

  // zext(AR + Step)
  const SCEV *NarrowSum = SE.getAddExpr(AR, Step);
  const SCEV *ExtendAfterOp = SE.getZeroExtendExpr(NarrowSum, WideTy);

  return ExtendAfterOp == OpAfterExtend;
}


/// getAddRecExprPHILiterally - Helper for expandAddRecExprLiterally. Expand

/// the base addrec, which is the addrec without any non-loop-dominating

/// values, and return the PHI.

///

/// An existing header PHI of \p L is reused when its SCEV equals \p Normalized

/// or, where permitted, when canBeCheaplyTransformed accepts it. Otherwise a

/// new PHI and its increment(s) are created.

///

/// \p TruncTy and \p InvertStep are outputs that describe the adjustment the

/// caller has to apply to a reused PHI. They are only written by this function

/// when \p L has a latch block.

PHINode *

SCEVExpander::getAddRecExprPHILiterally(const SCEVAddRecExpr *Normalized,

                                        const Loop *L, Type *&TruncTy,

                                        bool &InvertStep) {

  assert((!IVIncInsertLoop || IVIncInsertPos) &&

         "Uninitialized insert position");


  // Reuse a previously-inserted PHI, if present.

  BasicBlock *LatchBlock = L->getLoopLatch();

  if (LatchBlock) {

    PHINode *AddRecPhiMatch = nullptr;

    Instruction *IncV = nullptr;

    TruncTy = nullptr;

    InvertStep = false;


    // Only try partially matching scevs that need truncation and/or

    // step-inversion if we know this loop is outside the current loop.

    bool TryNonMatchingSCEV =

        IVIncInsertLoop &&

        SE.DT.properlyDominates(LatchBlock, IVIncInsertLoop->getHeader());


    for (PHINode &PN : L->getHeader()->phis()) {

      if (!SE.isSCEVable(PN.getType()))

        continue;


      // We should not look for an incomplete PHI. Getting SCEV for an

      // incomplete PHI has no meaning at all.

      if (!PN.isComplete()) {

        SCEV_DEBUG_WITH_TYPE(

            DebugType, dbgs() << "One incomplete PHI is found: " << PN << "\n");

        continue;

      }


      const SCEVAddRecExpr *PhiSCEV = dyn_cast<SCEVAddRecExpr>(SE.getSCEV(&PN));

      if (!PhiSCEV)

        continue;


      bool IsMatchingSCEV = PhiSCEV == Normalized;

      // We only handle truncation and inversion of phi recurrences for the

      // expanded expression if the expanded expression's loop dominates the

      // loop we insert to. Check now, so we can bail out early.

      if (!IsMatchingSCEV && !TryNonMatchingSCEV)

          continue;


      // TODO: this possibly can be reworked to avoid this cast at all.

      Instruction *TempIncV =

          dyn_cast<Instruction>(PN.getIncomingValueForBlock(LatchBlock));

      if (!TempIncV)

        continue;


      // Check whether we can reuse this PHI node.

      if (LSRMode) {

        if (!isExpandedAddRecExprPHI(&PN, TempIncV, L))

          continue;

      } else {

        if (!isNormalAddRecExprPHI(&PN, TempIncV, L))

          continue;

      }


      // Stop if we have found an exact match SCEV.

      if (IsMatchingSCEV) {

        IncV = TempIncV;

        TruncTy = nullptr;

        InvertStep = false;

        AddRecPhiMatch = &PN;

        break;

      }


      // Try whether the phi can be translated into the requested form

      // (truncated and/or offset by a constant). A new partial match is only

      // considered while none has been recorded yet (TruncTy is still null) or

      // while the recorded one requires step inversion.

      if ((!TruncTy || InvertStep) &&

          canBeCheaplyTransformed(SE, PhiSCEV, Normalized, InvertStep)) {

        // Record the phi node. But don't stop; we might find an exact match

        // later.

        AddRecPhiMatch = &PN;

        IncV = TempIncV;

        TruncTy = Normalized->getType();

      }

    }


    if (AddRecPhiMatch) {

      // Ok, the add recurrence looks usable.

      // Remember this PHI, even in post-inc mode.

      InsertedValues.insert(AddRecPhiMatch);

      // Remember the increment.

      rememberInstruction(IncV);

      // Those values were not actually inserted but re-used.

      ReusedValues.insert(AddRecPhiMatch);

      ReusedValues.insert(IncV);

      return AddRecPhiMatch;

    }

  }


  // Save the original insertion point so we can restore it when we're done.

  SCEVInsertPointGuard Guard(Builder, this);


  // Another AddRec may need to be recursively expanded below. For example, if

  // this AddRec is quadratic, the StepV may itself be an AddRec in this

  // loop. Remove this loop from the PostIncLoops set before expanding such

  // AddRecs. Otherwise, we cannot find a valid position for the step

  // (i.e. StepV can never dominate its loop header).  Ideally, we could do

  // SavedIncLoops.swap(PostIncLoops), but we generally have a single element,

  // so it's not worth implementing SmallPtrSet::swap.

  PostIncLoopSet SavedPostIncLoops = PostIncLoops;

  PostIncLoops.clear();


  // Expand code for the start value into the loop preheader.

  assert(L->getLoopPreheader() &&

         "Can't expand add recurrences without a loop preheader!");

  Value *StartV =

      expand(Normalized->getStart(), L->getLoopPreheader()->getTerminator());


  // StartV must have been inserted into L's preheader to dominate the new

  // phi.

  assert(!isa<Instruction>(StartV) ||

         SE.DT.properlyDominates(cast<Instruction>(StartV)->getParent(),

                                 L->getHeader()));


  // Expand code for the step value. Do this before creating the PHI so that PHI

  // reuse code doesn't see an incomplete PHI.

  const SCEV *Step = Normalized->getStepRecurrence(SE);

  Type *ExpandTy = Normalized->getType();

  // If the stride is negative, insert a sub instead of an add for the increment

  // (unless it's a constant, because subtracts of constants are canonicalized

  // to adds).

  bool useSubtract = !ExpandTy->isPointerTy() && Step->isNonConstantNegative();

  if (useSubtract)

    Step = SE.getNegativeSCEV(Step);

  // Expand the step somewhere that dominates the loop header.

  Value *StepV = expand(Step, L->getHeader()->getFirstInsertionPt());


  // The no-wrap behavior proved by IsIncrement(NUW|NSW) is only applicable if

  // we actually do emit an addition.  It does not apply if we emit a

  // subtraction.

  bool IncrementIsNUW = !useSubtract && IsIncrementNUW(SE, Normalized);

  bool IncrementIsNSW = !useSubtract && IsIncrementNSW(SE, Normalized);


  // Create the PHI.

  BasicBlock *Header = L->getHeader();

  Builder.SetInsertPoint(Header, Header->begin());

  PHINode *PN =

      Builder.CreatePHI(ExpandTy, pred_size(Header), Twine(IVName) + ".iv");


  // Create the step instructions and populate the PHI.

  for (BasicBlock *Pred : predecessors(Header)) {

    // Add a start value for every predecessor outside the loop.

    if (!L->contains(Pred)) {

      PN->addIncoming(StartV, Pred);

      continue;

    }


    // Create a step value and add it to the PHI.

    // If IVIncInsertLoop is non-null and equal to the addrec's loop, insert the

    // instructions at IVIncInsertPos.

    Instruction *InsertPos = L == IVIncInsertLoop ?

      IVIncInsertPos : Pred->getTerminator();

    Builder.SetInsertPoint(InsertPos);

    Value *IncV = expandIVInc(PN, StepV, L, useSubtract);


    // Only attach the no-wrap flags when the increment is an overflowing

    // binary operator.

    if (isa<OverflowingBinaryOperator>(IncV)) {

      if (IncrementIsNUW)

        cast<BinaryOperator>(IncV)->setHasNoUnsignedWrap();

      if (IncrementIsNSW)

        cast<BinaryOperator>(IncV)->setHasNoSignedWrap();

    }

    PN->addIncoming(IncV, Pred);

  }


  // After expanding subexpressions, restore the PostIncLoops set so the caller

  // can ensure that IVIncrement dominates the current uses.

  PostIncLoops = SavedPostIncLoops;


  // Remember this PHI, even in post-inc mode. LSR SCEV-based salvaging is most

  // effective when we are able to use an IV inserted here, so record it.

  InsertedValues.insert(PN);

  InsertedIVs.push_back(PN);

  return PN;

}


/// Expand the addrec \p S by obtaining a PHI for its normalized form from

/// getAddRecExprPHILiterally and then applying, as needed, the post-increment

/// adjustment, a truncation to the requested type and an inversion of the

/// step. Returns the value that represents \p S at the builder's current

/// insert point.

Value *

SCEVExpander::expandAddRecExprLiterally(SCEVUseT<const SCEVAddRecExpr *> S) {

  const Loop *L = S->getLoop();


  // Determine a normalized form of this expression, which is the expression

  // before any post-inc adjustment is made.

  const SCEVAddRecExpr *Normalized = S;

  if (PostIncLoops.count(L)) {

    PostIncLoopSet Loops;

    Loops.insert(L);

    Normalized = cast<SCEVAddRecExpr>(

        normalizeForPostIncUse(S, Loops, SE, /*CheckInvertible=*/false));

  }


  // Start is only referenced by the assertion below.

  [[maybe_unused]] const SCEV *Start = Normalized->getStart();

  const SCEV *Step = Normalized->getStepRecurrence(SE);

  assert(SE.properlyDominates(Start, L->getHeader()) &&

         "Start does not properly dominate loop header");

  assert(SE.dominates(Step, L->getHeader()) && "Step not dominate loop header");


  // In some cases, we decide to reuse an existing phi node but need to truncate

  // it and/or invert the step.

  Type *TruncTy = nullptr;

  bool InvertStep = false;

  PHINode *PN = getAddRecExprPHILiterally(Normalized, L, TruncTy, InvertStep);


  // Accommodate post-inc mode, if necessary.

  Value *Result;

  if (!PostIncLoops.count(L))

    Result = PN;

  else {

    // In PostInc mode, use the post-incremented value.

    BasicBlock *LatchBlock = L->getLoopLatch();

    assert(LatchBlock && "PostInc mode requires a unique loop latch!");

    Result = PN->getIncomingValueForBlock(LatchBlock);


    // We might be introducing a new use of the post-inc IV that is not poison

    // safe, in which case we should drop poison generating flags. Only keep

    // those flags for which SCEV has proven that they always hold.

    if (isa<OverflowingBinaryOperator>(Result)) {

      auto *I = cast<Instruction>(Result);

      if (!S->hasNoUnsignedWrap())

        I->setHasNoUnsignedWrap(false);

      if (!S->hasNoSignedWrap())

        I->setHasNoSignedWrap(false);

    }


    // For an expansion to use the postinc form, the client must call

    // expandCodeFor with an InsertPoint that is either outside the PostIncLoop

    // or dominated by IVIncInsertPos.

    if (isa<Instruction>(Result) &&

        !SE.DT.dominates(cast<Instruction>(Result),

                         &*Builder.GetInsertPoint())) {

      // The induction variable's postinc expansion does not dominate this use.

      // IVUsers tries to prevent this case, so it is rare. However, it can

      // happen when an IVUser outside the loop is not dominated by the latch

      // block. Adjusting IVIncInsertPos before expansion begins cannot handle

      // all cases. Consider a phi outside whose operand is replaced during

      // expansion with the value of the postinc user. Without fundamentally

      // changing the way postinc users are tracked, the only remedy is

      // inserting an extra IV increment. StepV might fold into PostLoopOffset,

      // but hopefully expandCodeFor handles that.

      bool useSubtract =

          !S->getType()->isPointerTy() && Step->isNonConstantNegative();

      if (useSubtract)

        Step = SE.getNegativeSCEV(Step);

      Value *StepV;

      {

        // Expand the step somewhere that dominates the loop header. The guard

        // is scoped so that the extra increment below is emitted at the

        // original insert point.

        SCEVInsertPointGuard Guard(Builder, this);

        StepV = expand(Step, L->getHeader()->getFirstInsertionPt());

      }

      Result = expandIVInc(PN, StepV, L, useSubtract);

    }

  }


  // We have decided to reuse an induction variable of a dominating loop. Apply

  // truncation and/or inversion of the step.

  if (TruncTy) {

    // Truncate the result.

    if (TruncTy != Result->getType())

      Result = Builder.CreateTrunc(Result, TruncTy);


    // Invert the result: Start - Result.

    if (InvertStep)

      Result = Builder.CreateSub(expand(Normalized->getStart()), Result);

  }


  return Result;

}


/// Try to express the addrec S in terms of a phi in the exit block of its loop
/// plus a simple offset. Returns the resulting value, or nullptr when the loop
/// has no suitable exit block or no phi qualifies.
Value *SCEVExpander::tryToReuseLCSSAPhi(SCEVUseT<const SCEVAddRecExpr *> S) {
  Type *STy = S->getType();
  const Loop *L = S->getLoop();

  // The loop needs an exit block with a single predecessor, and that block has
  // to dominate the block we are currently inserting into.
  BasicBlock *EB = L->getExitBlock();
  if (!EB)
    return nullptr;
  if (!EB->getSinglePredecessor())
    return nullptr;
  if (!SE.DT.dominates(EB, Builder.GetInsertBlock()))
    return nullptr;

  // Helper to check if the diff between S and ExitSCEV is simple enough to
  // allow reusing the LCSSA phi. Yields the diff if so, nullptr otherwise.
  auto CanReuse = [&](const SCEV *ExitSCEV) -> const SCEV * {
    if (isa<SCEVCouldNotCompute>(ExitSCEV))
      return nullptr;

    const SCEV *Diff = SE.getMinusSCEV(S, ExitSCEV);

    // Peel, in this order: a constant addend, a multiplication by all-ones,
    // and a ptrtoaddr (or else ptrtoint) wrapper. Each successful match
    // rebinds Core to the inner expression.
    const SCEV *Core = Diff;
    match(Core, m_scev_Add(m_SCEVConstant(), m_SCEV(Core)));
    match(Core, m_scev_Mul(m_scev_AllOnes(), m_SCEV(Core)));
    if (!match(Core, m_scev_PtrToAddr(m_SCEV(Core))))
      match(Core, m_scev_PtrToInt(m_SCEV(Core)));

    // Whatever remains has to be a constant or an unknown.
    if (isa<SCEVConstant, SCEVUnknown>(Core))
      return Diff;
    return nullptr;
  };

  for (auto &PN : EB->phis()) {
    if (!SE.isSCEVable(PN.getType()))
      continue;
    auto *ExitSCEV = SE.getSCEV(&PN);
    if (!isa<SCEVAddRecExpr>(ExitSCEV))
      continue;

    Type *PhiTy = PN.getType();
    const bool IntFromPtr = STy->isIntegerTy() && PhiTy->isPointerTy() &&
                            DL.getAddressType(PhiTy) == STy;

    const SCEV *Diff = nullptr;
    if (IntFromPtr) {
      // Prefer ptrtoaddr over ptrtoint.
      Diff = CanReuse(SE.getPtrToAddrExpr(ExitSCEV));
      if (!Diff)
        Diff = CanReuse(SE.getPtrToIntExpr(ExitSCEV, STy));
    } else if (STy == PhiTy) {
      Diff = CanReuse(ExitSCEV);
    }
    if (!Diff)
      continue;

    assert(Diff->getType()->isIntegerTy() &&
           "difference must be of integer type");
    Value *DiffV = expand(Diff);
    Value *BaseV = fixupLCSSAFormFor(&PN);

    // Non-pointer phi: a plain integer add.
    if (!PhiTy->isPointerTy())
      return Builder.CreateAdd(BaseV, DiffV);
    // Pointer phi and pointer result: offset the pointer.
    if (STy->isPointerTy())
      return Builder.CreatePtrAdd(BaseV, DiffV);
    // Pointer phi and integer result: convert the phi, then add.
    BaseV = Builder.CreatePtrToAddr(BaseV);
    return Builder.CreateAdd(BaseV, DiffV);
  }

  return nullptr;
}


/// Expand the addrec \p S. Outside canonical mode, and for addrecs with more

/// than two operands, this defers to expandAddRecExprLiterally. Otherwise the

/// addrec is rewritten in terms of a canonical induction variable of its loop,

/// which is created here if no suitable one exists.

Value *SCEVExpander::visitAddRecExpr(SCEVUseT<const SCEVAddRecExpr *> S) {

  // In canonical mode we compute the addrec as an expression of a canonical IV

  // using evaluateAtIteration and expand the resulting SCEV expression. This

  // way we avoid introducing new IVs to carry on the computation of the addrec

  // throughout the loop.

  //

  // For nested addrecs evaluateAtIteration might need a canonical IV of a

  // type wider than the addrec itself. Emitting a canonical IV of the

  // proper type might produce non-legal types, for example expanding an i64

  // {0,+,2,+,1} addrec would need an i65 canonical IV. To avoid this just fall

  // back to non-canonical mode for nested addrecs.

  if (!CanonicalMode || (S->getNumOperands() > 2))

    return expandAddRecExprLiterally(S);


  Type *Ty = SE.getEffectiveSCEVType(S->getType());

  const Loop *L = S->getLoop();


  // First check for an existing canonical IV in a suitable type, i.e. one that

  // is at least as wide as Ty.

  PHINode *CanonicalIV = nullptr;

  if (PHINode *PN = L->getCanonicalInductionVariable())

    if (SE.getTypeSizeInBits(PN->getType()) >= SE.getTypeSizeInBits(Ty))

      CanonicalIV = PN;


  // Rewrite an AddRec in terms of the canonical induction variable, if

  // its type is more narrow.

  if (CanonicalIV &&

      SE.getTypeSizeInBits(CanonicalIV->getType()) > SE.getTypeSizeInBits(Ty) &&

      !S->getType()->isPointerTy()) {

    SmallVector<SCEVUse, 4> NewOps(S->getNumOperands());

    for (unsigned i = 0, e = S->getNumOperands(); i != e; ++i)

      NewOps[i] = SE.getAnyExtendExpr(S->getOperand(i), CanonicalIV->getType());

    Value *V = expand(

        SE.getAddRecExpr(NewOps, S->getLoop(), S.getNoWrapFlags(SCEV::FlagNW)));

    // Emit the truncation after V when V is an instruction; otherwise at the

    // current insert point.

    BasicBlock::iterator NewInsertPt =

        isa<Instruction>(V) ? findInsertPointAfter(cast<Instruction>(V),

                                                   &*Builder.GetInsertPoint())

                            : Builder.GetInsertPoint();

    V = expand(SE.getTruncateExpr(SE.getUnknown(V), Ty), NewInsertPt);

    return V;

  }


  // If S is expanded outside the defining loop, check if there is a

  // matching LCSSA phi node for it.

  if (Value *V = tryToReuseLCSSAPhi(S))

    return V;


  // {X,+,F} --> X + {0,+,F}

  if (!S->getStart()->isZero()) {

    if (isa<PointerType>(S->getType())) {

      Value *StartV = expand(SE.getPointerBase(S));

      return expandAddToGEP(SE.removePointerBase(S), StartV,

                            S.getNoWrapFlags(SCEV::FlagNUW));

    }


    SmallVector<SCEVUse, 4> NewOps(S->operands());

    NewOps[0] = SE.getConstant(Ty, 0);

    const SCEV *Rest =

        SE.getAddRecExpr(NewOps, L, S.getNoWrapFlags(SCEV::FlagNW));


    // Just do a normal add. Pre-expand the operands to suppress folding.

    //

    // The LHS and RHS values are factored out of the expand call to make the

    // output independent of the argument evaluation order.

    const SCEV *AddExprLHS = SE.getUnknown(expand(S->getStart()));

    const SCEV *AddExprRHS = SE.getUnknown(expand(Rest));

    return expand(SE.getAddExpr(AddExprLHS, AddExprRHS));

  }


  // If we don't yet have a canonical IV, create one.

  if (!CanonicalIV) {

    // Create and insert the PHI node for the induction variable in the

    // specified loop.

    BasicBlock *Header = L->getHeader();

    pred_iterator HPB = pred_begin(Header), HPE = pred_end(Header);

    CanonicalIV = PHINode::Create(Ty, std::distance(HPB, HPE), "indvar");

    CanonicalIV->insertBefore(Header->begin());

    rememberInstruction(CanonicalIV);


    // Tracks predecessors that already received an incoming value.

    SmallPtrSet<BasicBlock *, 4> PredSeen;

    Constant *One = ConstantInt::get(Ty, 1);

    for (pred_iterator HPI = HPB; HPI != HPE; ++HPI) {

      BasicBlock *HP = *HPI;

      if (!PredSeen.insert(HP).second) {

        // There must be an incoming value for each predecessor, even the

        // duplicates!

        CanonicalIV->addIncoming(CanonicalIV->getIncomingValueForBlock(HP), HP);

        continue;

      }


      if (L->contains(HP)) {

        // Insert a unit add instruction right before the terminator

        // corresponding to the back-edge.

        Instruction *Add = BinaryOperator::CreateAdd(CanonicalIV, One,

                                                     "indvar.next",

                                                     HP->getTerminator()->getIterator());

        Add->setDebugLoc(HP->getTerminator()->getDebugLoc());

        rememberInstruction(Add);

        CanonicalIV->addIncoming(Add, HP);

      } else {

        // Entering the loop from outside: the IV starts at zero.

        CanonicalIV->addIncoming(Constant::getNullValue(Ty), HP);

      }

    }

  }


  // {0,+,1} --> Insert a canonical induction variable into the loop!

  if (S->isAffine() && S->getOperand(1)->isOne()) {

    assert(Ty == SE.getEffectiveSCEVType(CanonicalIV->getType()) &&

           "IVs with types different from the canonical IV should "

           "already have been handled!");

    return CanonicalIV;

  }


  // {0,+,F} --> {0,+,1} * F


  // If this is a simple linear addrec, emit it now as a special case.

  if (S->isAffine())    // {0,+,F} --> i*F

    return

      expand(SE.getTruncateOrNoop(

        SE.getMulExpr(SE.getUnknown(CanonicalIV),

                      SE.getNoopOrAnyExtend(S->getOperand(1),

                                            CanonicalIV->getType())),

        Ty));


  // If this is a chain of recurrences, turn it into a closed form, using the

  // folders, then expandCodeFor the closed form.  This allows the folders to

  // simplify the expression without having to build a bunch of special code

  // into this folder.

  const SCEV *IH = SE.getUnknown(CanonicalIV);   // Get I as a "symbolic" SCEV.


  // Promote S up to the canonical IV type, if the cast is foldable.

  const SCEV *NewS = S;

  const SCEV *Ext = SE.getNoopOrAnyExtend(S, CanonicalIV->getType());

  if (isa<SCEVAddRecExpr>(Ext))

    NewS = Ext;


  const SCEV *V = cast<SCEVAddRecExpr>(NewS)->evaluateAtIteration(IH, SE);


  // Truncate the result down to the original type, if needed.

  const SCEV *T = SE.getTruncateOrNoop(V, Ty);

  return expand(T);

}


/// Expand a ptrtoaddr SCEV. An existing ptrtoaddr or ptrtoint cast of the
/// expanded operand is returned when it has the right type and dominates the
/// insert point; otherwise a ptrtoaddr cast is reused or created through
/// ReuseOrCreateCast.
Value *SCEVExpander::visitPtrToAddrExpr(SCEVUseT<const SCEVPtrToAddrExpr *> S) {
  Value *Ptr = expand(S->getOperand());
  Type *AddrTy = S->getType();

  // ptrtoaddr and ptrtoint produce the same value, so try to reuse either.
  if (!isa<Constant>(Ptr)) {
    BasicBlock::iterator InsertIt = Builder.GetInsertPoint();
    for (User *U : Ptr->users()) {
      auto *Existing = dyn_cast<CastInst>(U);
      if (!Existing || Existing->getType() != AddrTy)
        continue;

      const auto Opc = Existing->getOpcode();
      if (Opc != CastInst::PtrToAddr && Opc != CastInst::PtrToInt)
        continue;

      // The cast must not be the insert position itself and has to dominate
      // it.
      if (&*InsertIt != Existing && SE.DT.dominates(Existing, &*InsertIt))
        return Existing;
    }
  }

  return ReuseOrCreateCast(Ptr, AddrTy, CastInst::PtrToAddr,
                           GetOptimalInsertionPointForCastOf(Ptr));
}


/// Expand a ptrtoint SCEV: expand the operand, then reuse or create a ptrtoint
/// cast of it at the insertion point chosen for casts of that value.
Value *SCEVExpander::visitPtrToIntExpr(SCEVUseT<const SCEVPtrToIntExpr *> S) {
  Value *Ptr = expand(S->getOperand());
  Type *IntTy = S->getType();
  return ReuseOrCreateCast(Ptr, IntTy, CastInst::PtrToInt,
                           GetOptimalInsertionPointForCastOf(Ptr));
}


/// Expand a truncate SCEV: expand the operand and truncate it to S's type.
Value *SCEVExpander::visitTruncateExpr(SCEVUseT<const SCEVTruncateExpr *> S) {
  Value *Wide = expand(S->getOperand());
  Type *NarrowTy = S->getType();
  return Builder.CreateTrunc(Wide, NarrowTy);
}


/// Expand a zero-extend SCEV: expand the operand and zero-extend it to S's
/// type, passing along whether the operand is known to be non-negative.
Value *
SCEVExpander::visitZeroExtendExpr(SCEVUseT<const SCEVZeroExtendExpr *> S) {
  Value *Narrow = expand(S->getOperand());
  const bool OperandIsNonNeg = SE.isKnownNonNegative(S->getOperand());
  return Builder.CreateZExt(Narrow, S->getType(), "", OperandIsNonNeg);
}


/// Expand a sign-extend SCEV: expand the operand and sign-extend it to S's
/// type.
Value *
SCEVExpander::visitSignExtendExpr(SCEVUseT<const SCEVSignExtendExpr *> S) {
  Value *Narrow = expand(S->getOperand());
  Type *WideTy = S->getType();
  return Builder.CreateSExt(Narrow, WideTy);
}


/// Expand an n-ary min/max SCEV into a chain of two-operand min/max
/// operations, working from the last operand towards the first. Integer-typed
/// values use the intrinsic IntrinID; other types use an icmp + select pair.
///
/// For sequential expressions, every operand except operand 0 is frozen, and
/// SafeUDivMode is enabled while those operands are expanded. SafeUDivMode is
/// restored to its incoming value before returning.
Value *SCEVExpander::expandMinMaxExpr(SCEVUseT<const SCEVNAryExpr *> S,
                                      Intrinsic::ID IntrinID, Twine Name,
                                      bool IsSequential) {
  const bool SavedSafeMode = SafeUDivMode;
  SafeUDivMode |= IsSequential;

  // Seed the accumulator with the last operand.
  Value *Acc = expand(S->getOperand(S->getNumOperands() - 1));
  Type *Ty = Acc->getType();
  if (IsSequential)
    Acc = Builder.CreateFreeze(Acc);

  const bool UseIntrinsic = Ty->isIntegerTy();
  for (int Idx = S->getNumOperands() - 2; Idx >= 0; --Idx) {
    // Operand 0 of a sequential expression is neither frozen nor expanded in
    // safe-udiv mode (unless that mode was already on at entry).
    const bool NeedsGuard = IsSequential && Idx != 0;
    SafeUDivMode = NeedsGuard || SavedSafeMode;

    Value *Next = expand(S->getOperand(Idx));
    if (NeedsGuard)
      Next = Builder.CreateFreeze(Next);

    if (UseIntrinsic) {
      Acc = Builder.CreateIntrinsic(IntrinID, {Ty}, {Acc, Next},
                                    /*FMFSource=*/nullptr, Name);
      continue;
    }

    Value *Cmp =
        Builder.CreateICmp(MinMaxIntrinsic::getPredicate(IntrinID), Acc, Next);
    Acc = Builder.CreateSelect(Cmp, Acc, Next, Name);
  }

  SafeUDivMode = SavedSafeMode;
  return Acc;
}


/// Expand a signed-max SCEV through expandMinMaxExpr.
Value *SCEVExpander::visitSMaxExpr(SCEVUseT<const SCEVSMaxExpr *> S) {
  const Intrinsic::ID ID = Intrinsic::smax;
  return expandMinMaxExpr(S, ID, "smax");
}


/// Expand an unsigned-max SCEV through expandMinMaxExpr.
Value *SCEVExpander::visitUMaxExpr(SCEVUseT<const SCEVUMaxExpr *> S) {
  const Intrinsic::ID ID = Intrinsic::umax;
  return expandMinMaxExpr(S, ID, "umax");
}


/// Expand a signed-min SCEV through expandMinMaxExpr.
Value *SCEVExpander::visitSMinExpr(SCEVUseT<const SCEVSMinExpr *> S) {
  const Intrinsic::ID ID = Intrinsic::smin;
  return expandMinMaxExpr(S, ID, "smin");
}


/// Expand an unsigned-min SCEV through expandMinMaxExpr.
Value *SCEVExpander::visitUMinExpr(SCEVUseT<const SCEVUMinExpr *> S) {
  const Intrinsic::ID ID = Intrinsic::umin;
  return expandMinMaxExpr(S, ID, "umin");
}


/// Expand a sequential unsigned-min SCEV through expandMinMaxExpr with the
/// sequential handling turned on.
Value *SCEVExpander::visitSequentialUMinExpr(
    SCEVUseT<const SCEVSequentialUMinExpr *> S) {
  const Intrinsic::ID ID = Intrinsic::umin;
  return expandMinMaxExpr(S, ID, "umin", /*IsSequential*/ true);
}


/// Expand a vscale SCEV by asking the builder for a vscale value of S's type.
Value *SCEVExpander::visitVScale(SCEVUseT<const SCEVVScale *> S) {
  Type *Ty = S->getType();
  return Builder.CreateVScale(Ty);
}


/// Set the insert point to IP, then expand SH (optionally cast to Ty) there.
Value *SCEVExpander::expandCodeFor(SCEVUse SH, Type *Ty,
                                   BasicBlock::iterator IP) {
  setInsertPoint(IP);
  Value *Expanded = expandCodeFor(SH, Ty);
  return Expanded;
}


/// Expand SH at the current insert point. When Ty is non-null and differs from
/// the type of the expanded value, a no-op cast to Ty is inserted; the two
/// types are asserted to have the same size in bits.
Value *SCEVExpander::expandCodeFor(SCEVUse SH, Type *Ty) {
  // Expand the code for this SCEV.
  Value *Expanded = expand(SH);

  // No requested type, or already the right type: nothing more to do.
  if (!Ty || Ty == Expanded->getType())
    return Expanded;

  assert(SE.getTypeSizeInBits(Ty) == SE.getTypeSizeInBits(SH->getType()) &&
         "non-trivial casts should be done with the SCEVs directly!");
  return InsertNoopCastOfTo(Expanded, Ty);
}


/// Look for an existing instruction that already computes S and can be used at
/// InsertPt. Returns that value, or nullptr if none qualifies.
///
/// On success, DropPoisonGeneratingInsts holds whatever canReuseInstruction
/// recorded for the returned value; it is cleared after each rejected
/// candidate.
Value *SCEVExpander::FindValueInExprValueMap(
    SCEVUse S, const Instruction *InsertPt,
    SmallVectorImpl<Instruction *> &DropPoisonGeneratingInsts) {
  // If the expansion is not in CanonicalMode, and the SCEV contains any
  // sub scAddRecExpr type SCEV, it is required to expand the SCEV literally.
  if (!CanonicalMode && SE.containsAddRecurrence(S))
    return nullptr;

  // If S is a constant or unknown, it may be worse to reuse an existing Value.
  if (isa<SCEVConstant>(S) || isa<SCEVUnknown>(S))
    return nullptr;

  for (Value *Candidate : SE.getSCEVValues(S)) {
    auto *CandInst = dyn_cast<Instruction>(Candidate);
    if (!CandInst)
      continue;

    // Choose a Value from the set which dominates the InsertPt.
    // InsertPt should be inside the Value's parent loop so as not to break
    // the LCSSA form.
    assert(CandInst->getFunction() == InsertPt->getFunction());
    if (S->getType() != Candidate->getType())
      continue;
    if (!SE.DT.dominates(CandInst, InsertPt))
      continue;
    if (const Loop *DefLoop = SE.LI.getLoopFor(CandInst->getParent()))
      if (!DefLoop->contains(InsertPt))
        continue;

    // Make sure reusing the instruction is poison-safe.
    if (SE.canReuseInstruction(S, CandInst, DropPoisonGeneratingInsts))
      return Candidate;
    DropPoisonGeneratingInsts.clear();
  }
  return nullptr;
}


// The expansion of SCEV will either reuse a previous Value in ExprValueMap,
// or expand the SCEV literally. Specifically, if the expansion is not in
// CanonicalMode and the SCEV contains any sub scAddRecExpr type SCEV, it will
// be expanded literally (FindValueInExprValueMap refuses to reuse a value in
// that case), to prevent LSR's transformed SCEV from being reverted.
// Otherwise, the expansion will try to reuse Value from ExprValueMap, and only
// when it fails, expand the SCEV literally.
//
// The steps performed are:
//   1. Pick an insertion point, starting from the builder's current one and
//      hoisting out of enclosing loops where that is allowed.
//   2. Return the cached value if S was already expanded at that point.
//   3. Otherwise reuse an existing value or visit(S), and cache the result.
Value *SCEVExpander::expand(SCEVUse S) {
  // Compute an insertion point for this SCEV object. Hoist the instructions
  // as far out in the loop nest as possible.
  BasicBlock::iterator InsertPt = Builder.GetInsertPoint();

  // We can move insertion point only if there is no div or rem operations
  // otherwise we are risky to move it over the check for zero denominator.
  // The inner predicate flags a udiv whose divisor is either the constant zero
  // or not a constant at all; SafeToHoist is true when no such udiv occurs
  // anywhere in the expression.
  auto SafeToHoist = [](const SCEV *S) {
    return !SCEVExprContains(S, [](const SCEV *S) {
              if (const auto *D = dyn_cast<SCEVUDivExpr>(S)) {
                if (const auto *SC = dyn_cast<SCEVConstant>(D->getRHS()))
                  // Division by non-zero constants can be hoisted.
                  return SC->getValue()->isZero();
                // All other divisions should not be moved as they may be
                // divisions by zero and should be kept within the
                // conditions of the surrounding loops that guard their
                // execution (see PR35406).
                return true;
              }
              return false;
            });
  };
  if (SafeToHoist(S)) {
    // Walk outwards from the loop containing the current insert block. The
    // loop has no exit condition of its own: both branches below break once L
    // is null, so L->getParentLoop() is never evaluated on a null loop.
    for (Loop *L = SE.LI.getLoopFor(Builder.GetInsertBlock());;
         L = L->getParentLoop()) {
      if (SE.isLoopInvariant(S, L)) {
        // Invariant and no enclosing loop left: nothing more to hoist out of.
        if (!L) break;
        if (BasicBlock *Preheader = L->getLoopPreheader()) {
          // Hoist to just before the preheader's terminator and keep walking
          // outwards.
          InsertPt = Preheader->getTerminator()->getIterator();
        } else {
          // LSR sets the insertion point for AddRec start/step values to the
          // block start to simplify value reuse, even though it's an invalid
          // position. SCEVExpander must correct for this in all cases.
          InsertPt = L->getHeader()->getFirstInsertionPt();
        }
      } else {
        // If the SCEV is computable at this level, insert it into the header
        // after the PHIs (and after any other instructions that we've inserted
        // there) so that it is guaranteed to dominate any user inside the loop.
        if (L && SE.hasComputableLoopEvolution(S, L) && !PostIncLoops.count(L))
          InsertPt = L->getHeader()->getFirstInsertionPt();

        // Step over instructions this expander inserted itself, but never
        // past the builder's current insertion point.
        while (InsertPt != Builder.GetInsertPoint() &&
               (isInsertedInstruction(&*InsertPt))) {
          InsertPt = std::next(InsertPt);
        }
        break;
      }
    }
  }

  // Check to see if we already expanded this here.
  // The cache key is the pair (expression, instruction at the insert point).
  auto I = InsertedExpressions.find(std::make_pair(S, &*InsertPt));
  if (I != InsertedExpressions.end())
    return I->second;

  // NOTE(review): the guard presumably restores the builder's insertion point
  // when this function returns -- confirm against SCEVInsertPointGuard.
  SCEVInsertPointGuard Guard(Builder, this);
  Builder.SetInsertPoint(InsertPt->getParent(), InsertPt);

  // Expand the expression into instructions.
  SmallVector<Instruction *> DropPoisonGeneratingInsts;
  Value *V = FindValueInExprValueMap(S, &*InsertPt, DropPoisonGeneratingInsts);
  if (!V) {
    // Nothing to reuse: expand literally, then repair LCSSA form for the new
    // use if required.
    V = visit(S);
    V = fixupLCSSAFormFor(V);
  } else {
    // An existing value is reused. Record the original flags of every
    // instruction reported by FindValueInExprValueMap before they are dropped
    // (and possibly re-inferred).
    for (Instruction *I : DropPoisonGeneratingInsts) {
      rememberFlags(I);
      dropPoisonGeneratingAnnotationsAndReinfer(SE, I);
    }
  }
  // Remember the expanded value for this SCEV at this location.
  //
  // This is independent of PostIncLoops. The mapped value simply materializes
  // the expression at this insertion point. If the mapped value happened to be
  // a postinc expansion, it could be reused by a non-postinc user, but only if
  // its insertion point was already at the head of the loop.
  InsertedExpressions[std::make_pair(S, &*InsertPt)] = V;
  return V;
}


/// Record \p I as a value created by this expander.
///
/// Values recorded while any post-increment loop is registered go into
/// InsertedPostIncValues; all others go into InsertedValues.
void SCEVExpander::rememberInstruction(Value *I) {
  if (PostIncLoops.empty())
    InsertedValues.insert(I);
  else
    InsertedPostIncValues.insert(I);
}


/// Save the poison-generating flags currently set on \p I in OrigFlags.
///
/// Only the first snapshot per instruction is kept: try_emplace leaves an
/// already existing entry untouched.
void SCEVExpander::rememberFlags(Instruction *I) {
  PoisonFlags CurrentFlags(I);
  OrigFlags.try_emplace(I, CurrentFlags);
}


/// Strip all poison-generating annotations from \p I, then put back those
/// that can be proven again from first principles.
///
/// \param SE analysis used to re-derive no-wrap flags and to obtain the data
///        layout for the dominating-condition query.
/// \param I instruction whose annotations are dropped and re-inferred.
void SCEVExpander::dropPoisonGeneratingAnnotationsAndReinfer(
    ScalarEvolution &SE, Instruction *I) {
  I->dropPoisonGeneratingAnnotations();

  // nuw/nsw: ask ScalarEvolution which wrap flags it can establish for the
  // operation and set exactly those.
  if (auto *OBO = dyn_cast<OverflowingBinaryOperator>(I)) {
    if (auto Flags = SE.getStrengthenedNoWrapFlagsFromBinOp(OBO)) {
      auto *BO = cast<BinaryOperator>(I);
      const bool ProvenNUW =
          ScalarEvolution::maskFlags(*Flags, SCEV::FlagNUW) == SCEV::FlagNUW;
      BO->setHasNoUnsignedWrap(ProvenNUW);
      const bool ProvenNSW =
          ScalarEvolution::maskFlags(*Flags, SCEV::FlagNSW) == SCEV::FlagNSW;
      BO->setHasNoSignedWrap(ProvenNSW);
    }
  }

  // nneg: restore it when a dominating condition implies that the operand is
  // signed-greater-or-equal to zero at I.
  if (auto *NNI = dyn_cast<PossiblyNonNegInst>(I)) {
    auto *Src = NNI->getOperand(0);
    const bool SrcKnownNonNegative =
        isImpliedByDomCondition(ICmpInst::ICMP_SGE, Src,
                                Constant::getNullValue(Src->getType()), I,
                                SE.getDataLayout())
            .value_or(false);
    if (SrcKnownNonNegative)
      NNI->setNonNeg(true);
  }
}


/// Given two congruent header phis, try to replace the latch increment of
/// \p Phi with the latch increment of \p OrigPhi.
///
/// \param Phi the phi that is a candidate for elimination. May be swapped with
///        \p OrigPhi (both are references) when it is the more canonical one.
/// \param OrigPhi the phi that is kept.
/// \param L the loop whose header contains both phis.
/// \param DT unused in this function body.
/// \param DeadInsts receives the replaced increment so the caller can delete
///        it.
void SCEVExpander::replaceCongruentIVInc(
    PHINode *&Phi, PHINode *&OrigPhi, Loop *L, const DominatorTree *DT,
    SmallVectorImpl<WeakTrackingVH> &DeadInsts) {
  // Both increments are located through the loop latch; bail out when the
  // loop does not have one.
  BasicBlock *Latch = L->getLoopLatch();
  if (!Latch)
    return;

  auto *OrigInc =
      dyn_cast<Instruction>(OrigPhi->getIncomingValueForBlock(Latch));
  auto *IsomorphicInc =
      dyn_cast<Instruction>(Phi->getIncomingValueForBlock(Latch));
  if (!(OrigInc && IsomorphicInc))
    return;

  // For phis of the same width, keep whichever is more canonical. A prior
  // decision to use an IV chain is respected as part of that determination.
  if (OrigPhi->getType() == Phi->getType()) {
    const bool PhiIsChained = ChainedPhis.contains(Phi);
    const bool KeepOrig =
        PhiIsChained || isExpandedAddRecExprPHI(OrigPhi, OrigInc, L);
    if (!KeepOrig &&
        (PhiIsChained || isExpandedAddRecExprPHI(Phi, IsomorphicInc, L))) {
      std::swap(OrigPhi, Phi);
      std::swap(OrigInc, IsomorphicInc);
    }
  }

  // Replacing the congruent phi alone would be sufficient, since acyclic
  // redundancy elimination (CSE/GVN) should take care of the rest. But a phi
  // that SCEV proved congruent is often the head of an IV user cycle that is
  // isomorphic with the original phi, so the common case of a single IV
  // increment is cleaned up eagerly; that lets DeleteDeadPHIs remove cycles
  // that had postinc uses.
  // A new use of OrigIV may be introduced at a point where none existed
  // before, so its poison flags need readjustment.
  const SCEV *TruncExpr =
      SE.getTruncateOrNoop(SE.getSCEV(OrigInc), IsomorphicInc->getType());
  if (OrigInc == IsomorphicInc)
    return;
  if (TruncExpr != SE.getSCEV(IsomorphicInc))
    return;
  if (!SE.LI.replacementPreservesLCSSAForm(IsomorphicInc, OrigInc))
    return;

  // Capture which wrap flags the two increments share before hoistIVInc runs,
  // because it is asked to recompute poison flags.
  auto *OBOIncV = dyn_cast<OverflowingBinaryOperator>(OrigInc);
  auto *OBOIsomorphic = dyn_cast<OverflowingBinaryOperator>(IsomorphicInc);
  const bool BothOverflowing = OBOIncV && OBOIsomorphic;
  const bool BothHaveNUW = BothOverflowing && OBOIncV->hasNoUnsignedWrap() &&
                           OBOIsomorphic->hasNoUnsignedWrap();
  const bool BothHaveNSW = BothOverflowing && OBOIncV->hasNoSignedWrap() &&
                           OBOIsomorphic->hasNoSignedWrap();

  const bool Hoisted = hoistIVInc(OrigInc, IsomorphicInc,
                                  /*RecomputePoisonFlags*/ true);
  if (!Hoisted)
    return;

  // The replacement increment is at least as wide as the replaced one. When
  // both increments are NUW/NSW the flags can stay on the wider increment: the
  // narrower IsomorphicInc would wrap before the wider OrigInc, so the uses of
  // IsomorphicInc do not become more poisonous.
  assert(OrigInc->getType()->getScalarSizeInBits() >=
             IsomorphicInc->getType()->getScalarSizeInBits() &&
         "Should only replace an increment with a wider one.");
  if (BothHaveNUW || BothHaveNSW) {
    OrigInc->setHasNoUnsignedWrap(OBOIncV->hasNoUnsignedWrap() || BothHaveNUW);
    OrigInc->setHasNoSignedWrap(OBOIncV->hasNoSignedWrap() || BothHaveNSW);
  }

  SCEV_DEBUG_WITH_TYPE(DebugType,
                       dbgs() << "INDVARS: Eliminated congruent iv.inc: "
                              << *IsomorphicInc << '\n');

  // With differing types, the kept increment is converted to the replaced
  // increment's type right after its definition (or at the first insertion
  // point of its block when it is a phi).
  Value *Replacement = OrigInc;
  if (OrigInc->getType() != IsomorphicInc->getType()) {
    BasicBlock::iterator CastPos;
    if (auto *IncAsPhi = dyn_cast<PHINode>(OrigInc))
      CastPos = IncAsPhi->getParent()->getFirstInsertionPt();
    else
      CastPos = OrigInc->getNextNode()->getIterator();

    IRBuilder<> Builder(CastPos->getParent(), CastPos);
    Builder.SetCurrentDebugLocation(IsomorphicInc->getDebugLoc());
    Replacement =
        Builder.CreateTruncOrBitCast(OrigInc, IsomorphicInc->getType(), IVName);
  }

  IsomorphicInc->replaceAllUsesWith(Replacement);
  DeadInsts.emplace_back(IsomorphicInc);
}


/// replaceCongruentIVs - Check for congruent phis in this loop header and
/// replace them with their most canonical representative. Return the number of
/// phis eliminated.
///
/// \param L loop whose header phis are examined.
/// \param DT forwarded to replaceCongruentIVInc.
/// \param DeadInsts receives every phi (and increment) whose uses were
///        replaced, so the caller can delete them.
/// \param TTI optional; when non-null the phis are sorted by type first and
///        wide phis may be registered as a source for narrower ones.
///
/// NOTE(review): the historical comment stated that this does not depend on
/// any SCEVExpander state, but the body reads members such as SE, DL and
/// IVName, so that statement looks stale. It should still be used in the same
/// context that SCEVExpander is used.
unsigned
SCEVExpander::replaceCongruentIVs(Loop *L, const DominatorTree *DT,
                                  SmallVectorImpl<WeakTrackingVH> &DeadInsts,
                                  const TargetTransformInfo *TTI) {
  // Collect the header phis. When TTI is available they are sorted below so
  // that wider integer phis come before narrower ones.
  SmallVector<PHINode *, 8> Phis(
      llvm::make_pointer_range(L->getHeader()->phis()));

  if (TTI)
    // Use stable_sort to preserve order of equivalent PHIs, so the order
    // of the sorted Phis is the same from run to run on the same loop.
    llvm::stable_sort(Phis, [](Value *LHS, Value *RHS) {
      // Keep non-integer phis apart from integer ones and make sure
      // pointer < pointer = false.
      // NOTE(review): as written, a non-integer LHS compares less than an
      // integer RHS, which orders non-integer phis before the integer ones
      // rather than at the back -- confirm the intent.
      if (!LHS->getType()->isIntegerTy() || !RHS->getType()->isIntegerTy())
        return RHS->getType()->isIntegerTy() && !LHS->getType()->isIntegerTy();
      // Among integers, the wider type sorts first.
      return RHS->getType()->getPrimitiveSizeInBits().getFixedValue() <
             LHS->getType()->getPrimitiveSizeInBits().getFixedValue();
    });

  unsigned NumElim = 0;
  // Maps an expression to the first phi seen that computes it.
  DenseMap<const SCEV *, PHINode *> ExprToIVMap;
  // Process phis from wide to narrow. Map wide phis to their truncation
  // so narrow phis can reuse them.
  for (PHINode *Phi : Phis) {
    // Returns a value the phi folds to: either what simplifyInstruction
    // yields, or the constant that SCEV computes for it; nullptr otherwise.
    auto SimplifyPHINode = [&](PHINode *PN) -> Value * {
      if (Value *V = simplifyInstruction(PN, {DL, &SE.TLI, &SE.DT, &SE.AC}))
        return V;
      if (!SE.isSCEVable(PN->getType()))
        return nullptr;
      auto *Const = dyn_cast<SCEVConstant>(SE.getSCEV(PN));
      if (!Const)
        return nullptr;
      return Const->getValue();
    };

    // Fold constant phis. They may be congruent to other constant phis and
    // would confuse the logic below that expects proper IVs.
    if (Value *V = SimplifyPHINode(Phi)) {
      // A simplified value of a different type cannot replace the phi; the
      // phi is then skipped entirely.
      if (V->getType() != Phi->getType())
        continue;
      SE.forgetValue(Phi);
      Phi->replaceAllUsesWith(V);
      DeadInsts.emplace_back(Phi);
      ++NumElim;
      SCEV_DEBUG_WITH_TYPE(DebugType,
                           dbgs() << "INDVARS: Eliminated constant iv: " << *Phi
                                  << '\n');
      continue;
    }

    if (!SE.isSCEVable(Phi->getType()))
      continue;

    // operator[] default-inserts a null entry the first time an expression is
    // seen.
    PHINode *&OrigPhiRef = ExprToIVMap[SE.getSCEV(Phi)];
    if (!OrigPhiRef) {
      // First phi with this expression: it becomes the representative.
      OrigPhiRef = Phi;
      if (Phi->getType()->isIntegerTy() && TTI &&
          TTI->isTruncateFree(Phi->getType(), Phis.back()->getType())) {
        // Make sure we only rewrite using simple induction variables;
        // otherwise, we can make the trip count of a loop unanalyzable
        // to SCEV.
        const SCEV *PhiExpr = SE.getSCEV(Phi);
        if (isa<SCEVAddRecExpr>(PhiExpr)) {
          // This phi can be freely truncated to the narrowest phi type. Map the
          // truncated expression to it so it will be reused for narrow types.
          const SCEV *TruncExpr =
              SE.getTruncateExpr(PhiExpr, Phis.back()->getType());
          // OrigPhiRef is not used again after this insertion into the map.
          ExprToIVMap[TruncExpr] = Phi;
        }
      }
      continue;
    }

    // Replacing a pointer phi with an integer phi or vice-versa doesn't make
    // sense.
    if (OrigPhiRef->getType()->isPointerTy() != Phi->getType()->isPointerTy())
      continue;

    // May swap Phi and OrigPhiRef (both are passed by reference) so that the
    // more canonical phi is the one that is kept.
    replaceCongruentIVInc(Phi, OrigPhiRef, L, DT, DeadInsts);
    SCEV_DEBUG_WITH_TYPE(DebugType,
                         dbgs() << "INDVARS: Eliminated congruent iv: " << *Phi
                                << '\n');
    SCEV_DEBUG_WITH_TYPE(
        DebugType, dbgs() << "INDVARS: Original iv: " << *OrigPhiRef << '\n');
    ++NumElim;
    Value *NewIV = OrigPhiRef;
    if (OrigPhiRef->getType() != Phi->getType()) {
      // The kept phi has a different type: convert it to the eliminated
      // phi's type at the first insertion point of the header.
      IRBuilder<> Builder(L->getHeader(),
                          L->getHeader()->getFirstInsertionPt());
      Builder.SetCurrentDebugLocation(Phi->getDebugLoc());
      NewIV = Builder.CreateTruncOrBitCast(OrigPhiRef, Phi->getType(), IVName);
    }
    Phi->replaceAllUsesWith(NewIV);
    DeadInsts.emplace_back(Phi);
  }
  return NumElim;
}


bool SCEVExpander::hasRelatedExistingExpansion(const SCEV *S,

                                               const Instruction *At,

                                               Loop *L) {

  using namespace llvm::PatternMatch;


  SmallVector<BasicBlock *, 4> ExitingBlocks;

  L->getExitingBlocks(ExitingBlocks);


  // Look for suitable value in simple conditions at the loop exits.

  for (BasicBlock *BB : ExitingBlocks) {

    CmpPredicate Pred;

    Instruction *LHS, *RHS;


    if (!match(BB->getTerminator(),

               m_Br(m_ICmp(Pred, m_Instruction(LHS), m_Instruction(RHS)),

                    m_BasicBlock(), m_BasicBlock())))

      continue;


    if (SE.getSCEV(LHS) == S && SE.DT.dominates(LHS, At))

      return true;


    if (SE.getSCEV(RHS) == S && SE.DT.dominates(RHS, At))

      return true;

  }


  // Use expand's logic which is used for reusing a previous Value in

  // ExprValueMap.  Note that we don't currently model the cost of

  // needing to drop poison generating flags on the instruction if we

  // want to reuse it.  We effectively assume that has zero cost.

  SmallVector<Instruction *> DropPoisonGeneratingInsts;

  return FindValueInExprValueMap(S, At, DropPoisonGeneratingInsts) != nullptr;

}


/// Compute the cost of the IR instructions needed to expand the expression in
/// \p WorkItem itself (not its operands), and queue its operands for costing.
///
/// \tparam T the SCEV class that WorkItem.S is cast to.
/// \param WorkItem the expression to cost.
/// \param TTI target hooks used to query instruction costs.
/// \param CostKind the kind of cost that is requested from \p TTI.
/// \param Worklist receives one entry per (generated operation, operand) pair;
///        each entry records the opcode of the user instruction and the
///        operand index the SCEV operand will occupy in it.
/// \returns the accumulated cost. Unknowns, constants and vscale return 0
///          without queueing anything.
template<typename T> static InstructionCost costAndCollectOperands(
  const SCEVOperand &WorkItem, const TargetTransformInfo &TTI,
  TargetTransformInfo::TargetCostKind CostKind,
  SmallVectorImpl<SCEVOperand> &Worklist) {

  const T *S = cast<T>(WorkItem.S);
  InstructionCost Cost = 0;
  // Object to help map SCEV operands to expanded IR instructions.
  // MinIdx/MaxIdx bound the operand index that is reported for a SCEV operand
  // (see the clamping loop at the end of this function).
  struct OperationIndices {
    OperationIndices(unsigned Opc, size_t min, size_t max) :
      Opcode(Opc), MinIdx(min), MaxIdx(max) { }
    unsigned Opcode;
    size_t MinIdx;
    size_t MaxIdx;
  };

  // Collect the operations of all the instructions that will be needed to
  // expand the SCEVExpr. This is so that when we come to cost the operands,
  // we know what the generated user(s) will be.
  SmallVector<OperationIndices, 2> Operations;

  // Cost of a single cast from the type of operand 0 to the type of S. The
  // operand is always reported at index 0.
  auto CastCost = [&](unsigned Opcode) -> InstructionCost {
    Operations.emplace_back(Opcode, 0, 0);
    return TTI.getCastInstrCost(Opcode, S->getType(),
                                S->getOperand(0)->getType(),
                                TTI::CastContextHint::None, CostKind);
  };

  // Cost of NumRequired arithmetic instructions of the given opcode on the
  // type of S.
  auto ArithCost = [&](unsigned Opcode, unsigned NumRequired,
                       unsigned MinIdx = 0,
                       unsigned MaxIdx = 1) -> InstructionCost {
    Operations.emplace_back(Opcode, MinIdx, MaxIdx);
    return NumRequired *
      TTI.getArithmeticInstrCost(Opcode, S->getType(), CostKind);
  };

  // Cost of NumRequired compare or select instructions on the type of S. No
  // specific predicate is supplied (BAD_ICMP_PREDICATE).
  auto CmpSelCost = [&](unsigned Opcode, unsigned NumRequired, unsigned MinIdx,
                        unsigned MaxIdx) -> InstructionCost {
    Operations.emplace_back(Opcode, MinIdx, MaxIdx);
    Type *OpType = S->getType();
    return NumRequired * TTI.getCmpSelInstrCost(
                             Opcode, OpType, CmpInst::makeCmpResultType(OpType),
                             CmpInst::BAD_ICMP_PREDICATE, CostKind);
  };

  switch (S->getSCEVType()) {
  case scCouldNotCompute:
    llvm_unreachable("Attempt to use a SCEVCouldNotCompute object!");
  case scUnknown:
  case scConstant:
  case scVScale:
    return 0;
  case scPtrToAddr:
    Cost = CastCost(Instruction::PtrToAddr);
    break;
  case scPtrToInt:
    Cost = CastCost(Instruction::PtrToInt);
    break;
  case scTruncate:
    Cost = CastCost(Instruction::Trunc);
    break;
  case scZeroExtend:
    Cost = CastCost(Instruction::ZExt);
    break;
  case scSignExtend:
    Cost = CastCost(Instruction::SExt);
    break;
  case scUDivExpr: {
    // A division by a constant power of two is costed as a logical shift
    // right instead of a udiv.
    unsigned Opcode = Instruction::UDiv;
    if (auto *SC = dyn_cast<SCEVConstant>(S->getOperand(1)))
      if (SC->getAPInt().isPowerOf2())
        Opcode = Instruction::LShr;
    Cost = ArithCost(Opcode, 1);
    break;
  }
  case scAddExpr:
    // An N-operand add is costed as N - 1 add instructions.
    Cost = ArithCost(Instruction::Add, S->getNumOperands() - 1);
    break;
  case scMulExpr: {
    // Match the actual expansion in visitMulExpr: multiply by -1 is
    // expanded as a negate (sub 0, x), and multiply by a power of 2 is
    // expanded as a shift.  Only handle the common two-operand case with a
    // constant LHS; for everything else fall back to the pessimistic
    // all-multiplies estimate.
    // TODO: this is still pessimistic for the general case because of the
    // Bin Pow algorithm actually used by the expander, see
    // SCEVExpander::visitMulExpr(), ExpandOpBinPowN().
    unsigned OpCode = Instruction::Mul;
    if (S->getNumOperands() == 2)
      if (auto *SC = dyn_cast<SCEVConstant>(S->getOperand(0))) {
        if (SC->getAPInt().isAllOnes()) // -1
          OpCode = Instruction::Sub;
        else if (SC->getAPInt().isPowerOf2())
          OpCode = Instruction::Shl;
      }
    Cost = ArithCost(OpCode, S->getNumOperands() - 1);
    break;
  }
  case scSMaxExpr:
  case scUMaxExpr:
  case scSMinExpr:
  case scUMinExpr:
  case scSequentialUMinExpr: {
    // FIXME: should this ask the cost for Intrinsic's?
    // The reduction tree.
    // Each of the N - 1 reduction steps is costed as one icmp plus one select.
    Cost += CmpSelCost(Instruction::ICmp, S->getNumOperands() - 1, 0, 1);
    Cost += CmpSelCost(Instruction::Select, S->getNumOperands() - 1, 0, 2);
    switch (S->getSCEVType()) {
    case scSequentialUMinExpr: {
      // The safety net against poison.
      // FIXME: this is broken.
      Cost += CmpSelCost(Instruction::ICmp, S->getNumOperands() - 1, 0, 0);
      Cost += ArithCost(Instruction::Or,
                        S->getNumOperands() > 2 ? S->getNumOperands() - 2 : 0);
      Cost += CmpSelCost(Instruction::Select, 1, 0, 1);
      break;
    }
    default:
      assert(!isa<SCEVSequentialMinMaxExpr>(S) &&
             "Unhandled SCEV expression type?");
      break;
    }
    break;
  }
  case scAddRecExpr: {
    // Addrec expands to a phi and add per recurrence.
    unsigned NumRecurrences = S->getNumOperands() - 1;
    Cost += TTI.getCFInstrCost(Instruction::PHI, CostKind) * NumRecurrences;
    Cost +=
        TTI.getArithmeticInstrCost(Instruction::Add, S->getType(), CostKind) *
        NumRecurrences;
    // The operands are queued directly here; Operations stays empty for this
    // case, so the generic loop below adds nothing further.
    // AR start is used in phi.
    Worklist.emplace_back(Instruction::PHI, 0, S->getOperand(0));
    // Other operands are used in add.
    for (const SCEV *Op : S->operands().drop_front())
      Worklist.emplace_back(Instruction::Add, 1, Op);
    break;
  }
  }

  // Queue every SCEV operand once per recorded operation, tagged with the
  // opcode of that operation and the operand position it occupies.
  for (auto &CostOp : Operations) {
    for (auto SCEVOp : enumerate(S->operands())) {
      // Clamp the index to account for multiple IR operations being chained.
      size_t MinIdx = std::max(SCEVOp.index(), CostOp.MinIdx);
      size_t OpIdx = std::min(MinIdx, CostOp.MaxIdx);
      Worklist.emplace_back(CostOp.Opcode, OpIdx, SCEVOp.value());
    }
  }
  return Cost;
}


bool SCEVExpander::isHighCostExpansionHelper(

    const SCEVOperand &WorkItem, Loop *L, const Instruction &At,

    InstructionCost &Cost, unsigned Budget, const TargetTransformInfo &TTI,

    SmallPtrSetImpl<const SCEV *> &Processed,

    SmallVectorImpl<SCEVOperand> &Worklist) {

  if (Cost > Budget)

    return true; // Already run out of budget, give up.


  const SCEV *S = WorkItem.S;

  // Was the cost of expansion of this expression already accounted for?

  if (!isa<SCEVConstant>(S) && !Processed.insert(S).second)

    return false; // We have already accounted for this expression.


  // If we can find an existing value for this scev available at the point "At"

  // then consider the expression cheap.

  if (hasRelatedExistingExpansion(S, &At, L))

    return false; // Consider the expression to be free.


  TargetTransformInfo::TargetCostKind CostKind =

      L->getHeader()->getParent()->hasMinSize()

          ? TargetTransformInfo::TCK_CodeSize

          : TargetTransformInfo::TCK_RecipThroughput;


  switch (S->getSCEVType()) {

  case scCouldNotCompute:

    llvm_unreachable("Attempt to use a SCEVCouldNotCompute object!");

  case scUnknown:

  case scVScale:

    // Assume to be zero-cost.

    return false;

  case scConstant: {

    // Only evalulate the costs of constants when optimizing for size.

    if (CostKind != TargetTransformInfo::TCK_CodeSize)

      return false;

    const APInt &Imm = cast<SCEVConstant>(S)->getAPInt();

    Type *Ty = S->getType();

    Cost += TTI.getIntImmCostInst(

        WorkItem.ParentOpcode, WorkItem.OperandIdx, Imm, Ty, CostKind);

    return Cost > Budget;

  }

  case scTruncate:

  case scPtrToAddr:

  case scPtrToInt:

  case scZeroExtend:

  case scSignExtend: {

    Cost +=

        costAndCollectOperands<SCEVCastExpr>(WorkItem, TTI, CostKind, Worklist);

    return false; // Will answer upon next entry into this function.

  }

  case scUDivExpr: {

    // UDivExpr is very likely a UDiv that ScalarEvolution's HowFarToZero or

    // HowManyLessThans produced to compute a precise expression, rather than a

    // UDiv from the user's code. If we can't find a UDiv in the code with some

    // simple searching, we need to account for it's cost.


    // At the beginning of this function we already tried to find existing

    // value for plain 'S'. Now try to lookup 'S + 1' since it is common

    // pattern involving division. This is just a simple search heuristic.

    if (hasRelatedExistingExpansion(

            SE.getAddExpr(S, SE.getConstant(S->getType(), 1)), &At, L))

      return false; // Consider it to be free.


    Cost +=

        costAndCollectOperands<SCEVUDivExpr>(WorkItem, TTI, CostKind, Worklist);

    return false; // Will answer upon next entry into this function.

  }

  case scAddExpr:

  case scMulExpr:

  case scUMaxExpr:

  case scSMaxExpr:

  case scUMinExpr:

  case scSMinExpr:

  case scSequentialUMinExpr: {

    assert(cast<SCEVNAryExpr>(S)->getNumOperands() > 1 &&

           "Nary expr should have more than 1 operand.");

    // The simple nary expr will require one less op (or pair of ops)

    // than the number of it's terms.

    Cost +=

        costAndCollectOperands<SCEVNAryExpr>(WorkItem, TTI, CostKind, Worklist);

    return Cost > Budget;

  }

  case scAddRecExpr: {

    assert(cast<SCEVAddRecExpr>(S)->getNumOperands() >= 2 &&

           "Polynomial should be at least linear");

    Cost += costAndCollectOperands<SCEVAddRecExpr>(

        WorkItem, TTI, CostKind, Worklist);

    return Cost > Budget;

  }

  }

  llvm_unreachable("Unknown SCEV kind!");

}


/// Emit the run-time check for \p Pred at \p IP by dispatching on the kind of
/// predicate.
///
/// \param Pred the predicate to expand.
/// \param IP the instruction to emit the check at; must not be null.
/// \returns the value produced by the kind-specific expansion routine.
Value *SCEVExpander::expandCodeForPredicate(const SCEVPredicate *Pred,
                                            Instruction *IP) {
  assert(IP);

  switch (Pred->getKind()) {
  case SCEVPredicate::P_Union: {
    const auto *UnionPred = cast<SCEVUnionPredicate>(Pred);
    return expandUnionPredicate(UnionPred, IP);
  }
  case SCEVPredicate::P_Compare: {
    const auto *ComparePred = cast<SCEVComparePredicate>(Pred);
    return expandComparePredicate(ComparePred, IP);
  }
  case SCEVPredicate::P_Wrap: {
    const auto *WrapPred = cast<SCEVWrapPredicate>(Pred);
    return expandWrapPredicate(WrapPred, IP);
  }
  }

  llvm_unreachable("Unknown SCEV predicate type");
}


/// Emit the run-time check for a compare predicate at \p IP.
///
/// Both sides of the predicate are expanded and then compared with the
/// inverse of the predicate's comparison, so the emitted "ident.check" value
/// is true when the predicate does not hold.
Value *SCEVExpander::expandComparePredicate(const SCEVComparePredicate *Pred,
                                            Instruction *IP) {
  Value *LHSVal = expand(Pred->getLHS(), IP);
  Value *RHSVal = expand(Pred->getRHS(), IP);

  // Position the builder at IP again before emitting the comparison.
  Builder.SetInsertPoint(IP);
  const auto InversePred = ICmpInst::getInversePredicate(Pred->getPredicate());
  return Builder.CreateICmp(InversePred, LHSVal, RHSVal, "ident.check");
}


/// Emit, at \p Loc, a run-time check for whether the affine recurrence \p AR
/// wraps over the (predicated symbolic maximum) backedge-taken count of its
/// loop.
///
/// \param AR the affine add recurrence to check.
/// \param Loc the instruction to emit the check at.
/// \param Signed selects signed rather than unsigned comparisons of the end
///        value against the start value.
/// \returns a value that is true when a wrap was detected.
Value *SCEVExpander::generateOverflowCheck(const SCEVAddRecExpr *AR,
                                           Instruction *Loc, bool Signed) {
  assert(AR->isAffine() && "Cannot generate RT check for "
                           "non-affine expression");

  // FIXME: It is highly suspicious that we're ignoring the predicates here.
  SmallVector<const SCEVPredicate *, 4> Pred;
  const SCEV *ExitCount =
      SE.getPredicatedSymbolicMaxBackedgeTakenCount(AR->getLoop(), Pred);

  assert(!isa<SCEVCouldNotCompute>(ExitCount) && "Invalid loop count");

  const SCEV *Step = AR->getStepRecurrence(SE);
  const SCEV *Start = AR->getStart();

  Type *ARTy = AR->getType();
  // SrcBits is the width of the backedge-taken count, DstBits the width of
  // the recurrence.
  unsigned SrcBits = SE.getTypeSizeInBits(ExitCount->getType());
  unsigned DstBits = SE.getTypeSizeInBits(ARTy);

  // The expression {Start,+,Step} has nusw/nssw if
  //   Step < 0, Start - |Step| * Backedge <= Start
  //   Step >= 0, Start + |Step| * Backedge >= Start
  // and |Step| * Backedge doesn't unsigned overflow.
  // The code below emits the negation of these conditions.

  Builder.SetInsertPoint(Loc);
  Value *TripCountVal = expand(ExitCount, Loc);

  // Integer type with the same width as the recurrence.
  IntegerType *Ty =
      IntegerType::get(Loc->getContext(), SE.getTypeSizeInBits(ARTy));

  Value *StepValue = expand(Step, Loc);
  Value *NegStepValue = expand(SE.getNegativeSCEV(Step), Loc);
  Value *StartValue = expand(Start, Loc);

  ConstantInt *Zero =
      ConstantInt::get(Loc->getContext(), APInt::getZero(DstBits));

  // Reset the insertion point to Loc before emitting the check itself.
  Builder.SetInsertPoint(Loc);
  // Compute |Step|
  Value *StepCompare = Builder.CreateICmp(ICmpInst::ICMP_SLT, StepValue, Zero);
  Value *AbsStep = Builder.CreateSelect(StepCompare, NegStepValue, StepValue);

  // Compute |Step| * Backedge
  // Compute:
  //   1. Start + |Step| * Backedge < Start
  //   2. Start - |Step| * Backedge > Start
  //
  // And select either 1. or 2. depending on whether step is positive or
  // negative. If Step is known to be positive or negative, only create
  // either 1. or 2.
  auto ComputeEndCheck = [&]() -> Value * {
    // Get the backedge taken count and truncate or extended to the AR type.
    Value *TruncTripCount = Builder.CreateZExtOrTrunc(TripCountVal, Ty);

    // The intrinsic yields both the product and an overflow bit.
    CallInst *Mul = Builder.CreateIntrinsic(Intrinsic::umul_with_overflow, Ty,
                                            {AbsStep, TruncTripCount},
                                            /*FMFSource=*/nullptr, "mul");
    Value *MulV = Builder.CreateExtractValue(Mul, 0, "mul.result");
    Value *OfMul = Builder.CreateExtractValue(Mul, 1, "mul.overflow");

    Value *Add = nullptr, *Sub = nullptr;
    // The positive-direction check is skipped only for a step known to be
    // negative, the negative-direction check only for a step known to be
    // positive.
    bool NeedPosCheck = !SE.isKnownNegative(Step);
    bool NeedNegCheck = !SE.isKnownPositive(Step);

    if (isa<PointerType>(ARTy)) {
      // For pointer recurrences the end values are formed with ptradd; the
      // subtraction is expressed by adding the negated product.
      Value *NegMulV = Builder.CreateNeg(MulV);
      if (NeedPosCheck)
        Add = Builder.CreatePtrAdd(StartValue, MulV);
      if (NeedNegCheck)
        Sub = Builder.CreatePtrAdd(StartValue, NegMulV);
    } else {
      if (NeedPosCheck)
        Add = Builder.CreateAdd(StartValue, MulV);
      if (NeedNegCheck)
        Sub = Builder.CreateSub(StartValue, MulV);
    }

    Value *EndCompareLT = nullptr;
    Value *EndCompareGT = nullptr;
    Value *EndCheck = nullptr;
    if (NeedPosCheck)
      EndCheck = EndCompareLT = Builder.CreateICmp(
          Signed ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_ULT, Add, StartValue);
    if (NeedNegCheck)
      EndCheck = EndCompareGT = Builder.CreateICmp(
          Signed ? ICmpInst::ICMP_SGT : ICmpInst::ICMP_UGT, Sub, StartValue);
    if (NeedPosCheck && NeedNegCheck) {
      // Select the answer based on the sign of Step.
      EndCheck = Builder.CreateSelect(StepCompare, EndCompareGT, EndCompareLT);
    }
    // An overflowing multiplication also counts as a wrap.
    return Builder.CreateOr(EndCheck, OfMul);
  };
  Value *EndCheck = ComputeEndCheck();

  // If the backedge taken count type is larger than the AR type,
  // check that we don't drop any bits by truncating it. If we are
  // dropping bits, then we have overflow (unless the step is zero).
  if (SrcBits > DstBits) {
    // Largest value representable in DstBits, widened to the count's type.
    auto MaxVal = APInt::getMaxValue(DstBits).zext(SrcBits);
    auto *BackedgeCheck =
        Builder.CreateICmp(ICmpInst::ICMP_UGT, TripCountVal,
                           ConstantInt::get(Loc->getContext(), MaxVal));
    BackedgeCheck = Builder.CreateAnd(
        BackedgeCheck, Builder.CreateICmp(ICmpInst::ICMP_NE, StepValue, Zero));

    EndCheck = Builder.CreateOr(EndCheck, BackedgeCheck);
  }

  return EndCheck;
}


/// Emit the run-time check for a wrap predicate at \p IP.
///
/// An overflow check is generated for each of the IncrementNUSW and
/// IncrementNSSW flags set on \p Pred (unsigned first, then signed); when both
/// are present the two checks are or'ed together.
///
/// \returns the combined check, or the constant false when neither flag is
///          set.
Value *SCEVExpander::expandWrapPredicate(const SCEVWrapPredicate *Pred,
                                         Instruction *IP) {
  const auto *AR = cast<SCEVAddRecExpr>(Pred->getExpr());

  Value *Check = nullptr;

  // Unsigned wrap check.
  if (Pred->getFlags() & SCEVWrapPredicate::IncrementNUSW)
    Check = generateOverflowCheck(AR, IP, false);

  // Signed wrap check, combined with the unsigned one when both exist.
  if (Pred->getFlags() & SCEVWrapPredicate::IncrementNSSW) {
    Value *SignedCheck = generateOverflowCheck(AR, IP, true);
    if (Check)
      return Builder.CreateOr(Check, SignedCheck);
    return SignedCheck;
  }

  if (Check)
    return Check;

  return ConstantInt::getFalse(IP->getContext());
}


/// Emit the run-time check for a union of predicates at \p IP.
///
/// Every member predicate is expanded in order and the resulting checks are
/// or'ed together.
///
/// \returns the combined check, or the constant false for an empty union.
Value *SCEVExpander::expandUnionPredicate(const SCEVUnionPredicate *Union,
                                          Instruction *IP) {
  SmallVector<Value *> MemberChecks;
  for (const auto *Member : Union->getPredicates()) {
    Value *MemberCheck = expandCodeForPredicate(Member, IP);
    MemberChecks.push_back(MemberCheck);
    // Put the builder back at IP after each member has been expanded.
    Builder.SetInsertPoint(IP);
  }

  if (!MemberChecks.empty())
    return Builder.CreateOr(MemberChecks);

  return ConstantInt::getFalse(IP->getContext());
}


/// Return a value that can be used for \p V at the builder's current
/// insertion point without breaking LCSSA form.
///
/// \p V itself is returned when LCSSA is not being preserved, when \p V is not
/// an instruction, or when its defining loop is absent, equal to, or contains
/// the loop of the insertion point. Otherwise LCSSA phis are formed for \p V
/// and the value feeding a temporary user at the insertion point is returned.
Value *SCEVExpander::fixupLCSSAFormFor(Value *V) {
  auto *DefI = dyn_cast<Instruction>(V);
  if (!PreserveLCSSA || !DefI)
    return V;

  BasicBlock::iterator InsertPt = Builder.GetInsertPoint();
  Loop *DefLoop = SE.LI.getLoopFor(DefI->getParent());
  Loop *UseLoop = SE.LI.getLoopFor(InsertPt->getParent());
  // No fix-up is needed unless the use is outside the defining loop.
  if (!DefLoop || UseLoop == DefLoop || DefLoop->contains(UseLoop))
    return V;

  // Create a temporary instruction at the current insertion point, so we
  // can hand it off to the helper to create LCSSA PHIs if required for the
  // new use.
  // FIXME: Ideally formLCSSAForInstructions (used in fixupLCSSAFormFor)
  // would accept an insertion point and return an LCSSA phi for that
  // insertion point, so there is no need to insert & remove the temporary
  // instruction.
  // The destination type only has to differ from DefI's type so that a cast
  // can be created: integers are cast to a pointer, everything else to i32.
  Type *ToTy;
  if (DefI->getType()->isIntegerTy())
    ToTy = PointerType::get(DefI->getContext(), 0);
  else
    ToTy = Type::getInt32Ty(DefI->getContext());
  Instruction *User =
      CastInst::CreateBitOrPointerCast(DefI, ToTy, "tmp.lcssa.user", InsertPt);
  // The temporary user is erased when this function returns, on every path.
  llvm::scope_exit RemoveUserOnExit([User]() { User->eraseFromParent(); });

  SmallVector<Instruction *, 1> ToUpdate;
  ToUpdate.push_back(DefI);
  SmallVector<PHINode *, 16> PHIsToRemove;
  SmallVector<PHINode *, 16> InsertedPHIs;
  formLCSSAForInstructions(ToUpdate, SE.DT, SE.LI, &SE, &PHIsToRemove,
                           &InsertedPHIs);
  // Track the new phis as values inserted by this expander.
  for (PHINode *PN : InsertedPHIs)
    rememberInstruction(PN);
  // Delete the phis reported for removal, but only those without uses, and
  // drop them from the expander's bookkeeping first.
  for (PHINode *PN : PHIsToRemove) {
    if (!PN->use_empty())
      continue;
    InsertedValues.erase(PN);
    InsertedPostIncValues.erase(PN);
    PN->eraseFromParent();
  }

  // The operand of the temporary user is read here, before the scope-exit
  // callback erases the user.
  return User->getOperand(0);
}


namespace {

// Search for a SCEV subexpression that is not safe to expand.  Any expression

// that may expand to a !isSafeToSpeculativelyExecute value is unsafe, namely

// UDiv expressions. We don't know if the UDiv is derived from an IR divide

// instruction, but the important thing is that we prove the denominator is

// nonzero before expansion.

//

// IVUsers already checks that IV-derived expressions are safe. So this check is

// only needed when the expression includes some subexpression that is not IV

// derived.

//

// Currently, we only allow division by a value provably non-zero here.

//

// We cannot generally expand recurrences unless the step dominates the loop

// header. The expander handles the special case of affine recurrences by

// scaling the recurrence outside the loop, but this technique isn't generally

// applicable. Expanding a nested recurrence outside a loop requires computing

// binomial coefficients. This could be done, but the recurrence has to be in a

// perfectly reduced form, which can't be guaranteed.

struct SCEVFindUnsafe {

  ScalarEvolution &SE;

  bool CanonicalMode;

  bool IsUnsafe = false;


  SCEVFindUnsafe(ScalarEvolution &SE, bool CanonicalMode)

      : SE(SE), CanonicalMode(CanonicalMode) {}


  bool follow(const SCEV *S) {

    if (const SCEVUDivExpr *D = dyn_cast<SCEVUDivExpr>(S)) {

      if (!SE.isKnownNonZero(D->getRHS()) ||

          !SE.isGuaranteedNotToBePoison(D->getRHS())) {

        IsUnsafe = true;

        return false;

      }

    }

    if (const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(S)) {

      // For non-affine addrecs or in non-canonical mode we need a preheader

      // to insert into.

      if (!AR->getLoop()->getLoopPreheader() &&

          (!CanonicalMode || !AR->isAffine())) {

        IsUnsafe = true;

        return false;

      }

    }

    return true;

  }

  bool isDone() const { return IsUnsafe; }

};

} // namespace


bool SCEVExpander::isSafeToExpand(const SCEV *S) const {

  SCEVFindUnsafe Search(SE, CanonicalMode);

  visitAll(S, Search);

  return !Search.IsUnsafe;

}


bool SCEVExpander::isSafeToExpandAt(const SCEV *S,

                                    const Instruction *InsertionPoint) const {

  if (!isSafeToExpand(S))

    return false;

  // We have to prove that the expanded site of S dominates InsertionPoint.

  // This is easy when not in the same block, but hard when S is an instruction

  // to be expanded somewhere inside the same block as our insertion point.

  // What we really need here is something analogous to an OrderedBasicBlock,

  // but for the moment, we paper over the problem by handling two common and

  // cheap to check cases.

  if (SE.properlyDominates(S, InsertionPoint->getParent()))

    return true;

  if (SE.dominates(S, InsertionPoint->getParent())) {

    if (InsertionPoint->getParent()->getTerminator() == InsertionPoint)

      return true;

    if (const SCEVUnknown *U = dyn_cast<SCEVUnknown>(S))

      if (llvm::is_contained(InsertionPoint->operand_values(), U->getValue()))

        return true;

  }

  return false;

}


void SCEVExpanderCleaner::cleanup() {

  // Result is used, nothing to remove.

  if (ResultUsed)

    return;


  // Restore original poison flags.

  for (auto [I, Flags] : Expander.OrigFlags)

    Flags.apply(I);


  auto InsertedInstructions = Expander.getAllInsertedInstructions();

#ifndef NDEBUG

  SmallPtrSet<Instruction *, 8> InsertedSet(llvm::from_range,

                                            InsertedInstructions);

  (void)InsertedSet;

#endif

  // Remove sets with value handles.

  Expander.clear();


  // Remove all inserted instructions.

  for (Instruction *I : reverse(InsertedInstructions)) {

#ifndef NDEBUG

    assert(all_of(I->users(),

                  [&InsertedSet](Value *U) {

                    return InsertedSet.contains(cast<Instruction>(U));

                  }) &&

           "removed instruction should only be used by instructions inserted "

           "during expansion");

#endif

    assert(!I->getType()->isVoidTy() &&

           "inserted instruction should have non-void types");

    I->replaceAllUsesWith(PoisonValue::get(I->getType()));

    I->eraseFromParent();

  }

}


assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

none
@ none
Definition AArch64StackTagging.cpp:75

X
#define X(NUM, ENUM, NAME)
Definition ELF.h:853

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

E
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

CommandLine.h

CostKind
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))

DataLayout.h

Dominators.h

GEP
Hexagon Common GEP
Definition HexagonCommonGEP.cpp:164

Loops
Hexagon Hardware Loops
Definition HexagonHardwareLoops.cpp:370

IntrinsicInst.h

InstructionSimplify.h

TemplateParamKind::Type
@ Type
Definition ItaniumDemangle.h:1243

LoopInfo.h

LoopUtils.h

I
#define I(x, y, z)
Definition MD5.cpp:57

T
#define T
Definition Mips16ISelLowering.cpp:282

OpIdx
MachineInstr unsigned OpIdx
Definition NVPTXPrologEpilogPass.cpp:56

P
#define P(N)

if
if(PassOpts->AAPipeline)
Definition PassBuilderBindings.cpp:64

PatternMatch.h

Opc
auto Opc
Definition RISCVRedundantCopyElimination.cpp:77

STLExtras.h
This file contains some templates that are useful if you are working with the STL at all.

IsIncrementNUW
static bool IsIncrementNUW(ScalarEvolution &SE, const SCEVAddRecExpr *AR)
Definition ScalarEvolutionExpander.cpp:965

PickMostRelevantLoop
static const Loop * PickMostRelevantLoop(const Loop *A, const Loop *B, DominatorTree &DT)
PickMostRelevantLoop - Given two loops pick the one that's most relevant for SCEV expansion.
Definition ScalarEvolutionExpander.cpp:436

costAndCollectOperands
static InstructionCost costAndCollectOperands(const SCEVOperand &WorkItem, const TargetTransformInfo &TTI, TargetTransformInfo::TargetCostKind CostKind, SmallVectorImpl< SCEVOperand > &Worklist)
Definition ScalarEvolutionExpander.cpp:1957

IsIncrementNSW
static bool IsIncrementNSW(ScalarEvolution &SE, const SCEVAddRecExpr *AR)
Definition ScalarEvolutionExpander.cpp:951

canBeCheaplyTransformed
static bool canBeCheaplyTransformed(ScalarEvolution &SE, const SCEVAddRecExpr *Phi, const SCEVAddRecExpr *Requested, bool &InvertStep)
Check whether we can cheaply express the requested SCEV in terms of the available PHI SCEV by truncat...
Definition ScalarEvolutionExpander.cpp:918

SCEV_DEBUG_WITH_TYPE
#define SCEV_DEBUG_WITH_TYPE(TYPE, X)
Definition ScalarEvolutionExpander.cpp:35

ScalarEvolutionExpander.h

ScalarEvolutionPatternMatch.h

ScopeExit.h
This file defines the make_scope_exit function, which executes user-defined cleanup logic at scope ex...

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

Local.h

ValueTracking.h

RHS
Value * RHS
Definition X86PartialReduction.cpp:81

LHS
Value * LHS
Definition X86PartialReduction.cpp:80

llvm::APInt::zext
LLVM_ABI APInt zext(unsigned width) const
Zero extend to a new width.
Definition APInt.cpp:1055

llvm::APInt::getMaxValue
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
Definition APInt.h:207

llvm::APInt::getZero
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition APInt.h:201

llvm::Argument
This class represents an incoming formal argument to a Function.
Definition Argument.h:32

llvm::BasicBlock
LLVM Basic Block Representation.
Definition BasicBlock.h:62

llvm::BasicBlock::phis
iterator_range< const_phi_iterator > phis() const
Returns a range that iterates over the phis in the basic block.
Definition BasicBlock.h:530

llvm::BasicBlock::getSinglePredecessor
LLVM_ABI const BasicBlock * getSinglePredecessor() const
Return the predecessor of this block if it has a single predecessor block.
Definition BasicBlock.cpp:401

llvm::BasicBlock::iterator
InstListType::iterator iterator
Instruction iterators...
Definition BasicBlock.h:170

llvm::BasicBlock::getTerminator
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction; assumes that the block is well-formed.
Definition BasicBlock.h:237

llvm::BinaryOperator::Create
static LLVM_ABI BinaryOperator * Create(BinaryOps Op, Value *S1, Value *S2, const Twine &Name=Twine(), InsertPosition InsertBefore=nullptr)
Construct a binary instruction, given the opcode and the two operands.
Definition Instructions.cpp:2738

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition Instructions.h:1531

llvm::CastInst
This is the base class for all instructions that perform data casts.
Definition InstrTypes.h:512

llvm::CastInst::getCastOpcode
static LLVM_ABI Instruction::CastOps getCastOpcode(const Value *Val, bool SrcIsSigned, Type *Ty, bool DstIsSigned)
Returns the opcode necessary to cast Val into Ty using usual casting rules.
Definition Instructions.cpp:3265

llvm::CastInst::getOpcode
Instruction::CastOps getOpcode() const
Return the opcode of this CastInst.
Definition InstrTypes.h:674

llvm::CastInst::CreateBitOrPointerCast
static LLVM_ABI CastInst * CreateBitOrPointerCast(Value *S, Type *Ty, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Create a BitCast, a PtrToInt, or an IntToPTr cast instruction.
Definition Instructions.cpp:3168

llvm::CmpInst::makeCmpResultType
static Type * makeCmpResultType(Type *opnd_type)
Create a result type for fcmp/icmp.
Definition InstrTypes.h:1049

llvm::CmpInst::BAD_ICMP_PREDICATE
@ BAD_ICMP_PREDICATE
Definition InstrTypes.h:773

llvm::CmpInst::ICMP_SLT
@ ICMP_SLT
signed less than
Definition InstrTypes.h:769

llvm::CmpInst::ICMP_UGT
@ ICMP_UGT
unsigned greater than
Definition InstrTypes.h:763

llvm::CmpInst::ICMP_SGT
@ ICMP_SGT
signed greater than
Definition InstrTypes.h:767

llvm::CmpInst::ICMP_ULT
@ ICMP_ULT
unsigned less than
Definition InstrTypes.h:765

llvm::CmpInst::ICMP_NE
@ ICMP_NE
not equal
Definition InstrTypes.h:762

llvm::CmpInst::ICMP_SGE
@ ICMP_SGE
signed greater or equal
Definition InstrTypes.h:768

llvm::CmpInst::getInversePredicate
Predicate getInversePredicate() const
For example, EQ -> NE, UGT -> ULE, SLT -> SGE, OEQ -> UNE, UGT -> OLE, OLT -> UGE,...
Definition InstrTypes.h:852

llvm::CmpPredicate
An abstraction over a floating-point predicate, and a pack of an integer predicate with samesign info...
Definition CmpPredicate.h:23

llvm::ConstantExpr::getCast
static LLVM_ABI Constant * getCast(unsigned ops, Constant *C, Type *Ty, bool OnlyIfReduced=false)
Convenience function for getting a Cast operation.
Definition Constants.cpp:2365

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition Constants.h:87

llvm::ConstantInt::getFalse
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
Definition Constants.cpp:904

llvm::Constant::getNullValue
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
Definition Constants.cpp:363

llvm::DenseMap
Definition DenseMap.h:834

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:151

llvm::DominatorTree::dominates
LLVM_ABI bool dominates(const BasicBlock *BB, const Use &U) const
Return true if the (end of the) basic block BB dominates the use U.
Definition Dominators.cpp:123

llvm::GEPNoWrapFlags::noUnsignedWrap
static GEPNoWrapFlags noUnsignedWrap()
Definition GEPNoWrapFlags.h:56

llvm::GEPNoWrapFlags::none
static GEPNoWrapFlags none()
Definition GEPNoWrapFlags.h:46

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition IRBuilder.h:2868

llvm::InstructionCost
Definition InstructionCost.h:30

llvm::Instruction
Definition Instruction.h:70

llvm::Instruction::setHasNoUnsignedWrap
LLVM_ABI void setHasNoUnsignedWrap(bool b=true)
Set or clear the nuw flag on this instruction, which must be an operator which supports this flag.
Definition Instruction.cpp:395

llvm::Instruction::setHasNoSignedWrap
LLVM_ABI void setHasNoSignedWrap(bool b=true)
Set or clear the nsw flag on this instruction, which must be an operator which supports this flag.
Definition Instruction.cpp:402

llvm::Instruction::getDebugLoc
const DebugLoc & getDebugLoc() const
Return the debug location for this node as a DebugLoc.
Definition Instruction.h:546

llvm::Instruction::insertBefore
LLVM_ABI void insertBefore(InstListType::iterator InsertPos)
Insert an unlinked instruction into a basic block immediately before the specified position.
Definition Instruction.cpp:123

llvm::Instruction::eraseFromParent
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
Definition Instruction.cpp:112

llvm::Instruction::getFunction
LLVM_ABI const Function * getFunction() const
Return the function this instruction belongs to.
Definition Instruction.cpp:90

llvm::Instruction::mayHaveSideEffects
LLVM_ABI bool mayHaveSideEffects() const LLVM_READONLY
Return true if the instruction may have side effects.
Definition Instruction.cpp:1345

llvm::Instruction::comesBefore
LLVM_ABI bool comesBefore(const Instruction *Other) const
Given an instruction Other in the same basic block as this instruction, return true if this instructi...
Definition Instruction.cpp:350

llvm::Instruction::getOpcode
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
Definition Instruction.h:344

llvm::Instruction::BinaryOps
BinaryOps
Definition Instruction.h:1056

llvm::Instruction::CastOps
CastOps
Definition Instruction.h:1070

llvm::IntegerType
Class to represent integer types.
Definition DerivedTypes.h:42

llvm::IntegerType::get
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:350

llvm::LoopBase::contains
bool contains(const LoopT *L) const
Return true if the specified loop is contained within this loop.
Definition GenericLoopInfo.h:124

llvm::LoopInfoBase::getLoopFor
LoopT * getLoopFor(const BlockT *BB) const
Return the inner most loop that BB lives in.
Definition GenericLoopInfo.h:630

llvm::Loop
Represents a single loop in the control flow graph.
Definition LoopInfo.h:40

llvm::MinMaxIntrinsic::getPredicate
ICmpInst::Predicate getPredicate() const
Returns the comparison predicate underlying the intrinsic.
Definition IntrinsicInst.h:807

llvm::PHINode
Definition Instructions.h:2661

llvm::PHINode::addIncoming
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
Definition Instructions.h:2795

llvm::PHINode::isComplete
bool isComplete() const
If the PHI node is complete which means all of its parent's predecessors have incoming value in this ...
Definition Instructions.h:2865

llvm::PHINode::getIncomingValueForBlock
Value * getIncomingValueForBlock(const BasicBlock *BB) const
Definition Instructions.h:2835

llvm::PHINode::Create
static PHINode * Create(Type *Ty, unsigned NumReservedValues, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Constructors - NumReservedValues is a hint for the number of incoming edges that this phi node will h...
Definition Instructions.h:2695

llvm::PointerType::get
static LLVM_ABI PointerType * get(Type *ElementType, unsigned AddressSpace)
This constructs a pointer to an object of the specified type in a numbered address space.

llvm::PoisonValue::get
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Definition Constants.cpp:2030

llvm::SCEVAddRecExpr
This node represents a polynomial recurrence on the trip count of the specified loop.
Definition ScalarEvolutionExpressions.h:365

llvm::SCEVAddRecExpr::getType
Type * getType() const
Definition ScalarEvolutionExpressions.h:375

llvm::SCEVAddRecExpr::isAffine
bool isAffine() const
Return true if this represents an expression A + B*x where A and B are loop invariant values.
Definition ScalarEvolutionExpressions.h:392

llvm::SCEVAddRecExpr::getLoop
const Loop * getLoop() const
Definition ScalarEvolutionExpressions.h:377

llvm::SCEVAddRecExpr::getStepRecurrence
SCEVUse getStepRecurrence(ScalarEvolution &SE) const
Constructs and returns the recurrence indicating how much this expression steps by.
Definition ScalarEvolutionExpressions.h:383

llvm::SCEVAddRecExpr::getStart
SCEVUse getStart() const
Definition ScalarEvolutionExpressions.h:376

llvm::SCEVComparePredicate
This class represents an assumption that the expression LHS Pred RHS evaluates to true,...
Definition ScalarEvolution.h:437

llvm::SCEVExpanderCleaner::cleanup
LLVM_ABI void cleanup()
Definition ScalarEvolutionExpander.cpp:2501

llvm::SCEVExpander::generateOverflowCheck
LLVM_ABI Value * generateOverflowCheck(const SCEVAddRecExpr *AR, Instruction *Loc, bool Signed)
Generates code that evaluates if the AR expression will overflow.
Definition ScalarEvolutionExpander.cpp:2227

llvm::SCEVExpander::hasRelatedExistingExpansion
LLVM_ABI bool hasRelatedExistingExpansion(const SCEV *S, const Instruction *At, Loop *L)
Determine whether there is an existing expansion of S that can be reused.
Definition ScalarEvolutionExpander.cpp:1924

llvm::SCEVExpander::getAllInsertedInstructions
SmallVector< Instruction *, 32 > getAllInsertedInstructions() const
Return a vector containing all instructions inserted during expansion.
Definition ScalarEvolutionExpander.h:225

llvm::SCEVExpander::isSafeToExpand
LLVM_ABI bool isSafeToExpand(const SCEV *S) const
Return true if the given expression is safe to expand in the sense that all materialized values are s...
Definition ScalarEvolutionExpander.cpp:2473

llvm::SCEVExpander::isSafeToExpandAt
LLVM_ABI bool isSafeToExpandAt(const SCEV *S, const Instruction *InsertionPoint) const
Return true if the given expression is safe to expand in the sense that all materialized values are d...
Definition ScalarEvolutionExpander.cpp:2479

llvm::SCEVExpander::replaceCongruentIVs
LLVM_ABI unsigned replaceCongruentIVs(Loop *L, const DominatorTree *DT, SmallVectorImpl< WeakTrackingVH > &DeadInsts, const TargetTransformInfo *TTI=nullptr)
replace congruent phis with their most canonical representative.
Definition ScalarEvolutionExpander.cpp:1827

llvm::SCEVExpander::dropPoisonGeneratingAnnotationsAndReinfer
static LLVM_ABI void dropPoisonGeneratingAnnotationsAndReinfer(ScalarEvolution &SE, Instruction *I)
Drop poison-generating flags from I, then try re-infer via SCEV.
Definition ScalarEvolutionExpander.cpp:1709

llvm::SCEVExpander::expandUnionPredicate
LLVM_ABI Value * expandUnionPredicate(const SCEVUnionPredicate *Pred, Instruction *Loc)
A specialized variant of expandCodeForPredicate, handling the case when we are expanding code for a S...
Definition ScalarEvolutionExpander.cpp:2363

llvm::SCEVExpander::hoistIVInc
LLVM_ABI bool hoistIVInc(Instruction *IncV, Instruction *InsertPos, bool RecomputePoisonFlags=false)
Utility for hoisting IncV (with all subexpressions required for its computation) before InsertPos.
Definition ScalarEvolutionExpander.cpp:820

llvm::SCEVExpander::isInsertedInstruction
bool isInsertedInstruction(Instruction *I) const
Return true if the specified instruction was inserted by the code rewriter.
Definition ScalarEvolutionExpander.h:419

llvm::SCEVExpander::expandCodeForPredicate
LLVM_ABI Value * expandCodeForPredicate(const SCEVPredicate *Pred, Instruction *Loc)
Generates a code sequence that evaluates this predicate.
Definition ScalarEvolutionExpander.cpp:2200

llvm::SCEVExpander::canReuseFlagsFromOriginalIVInc
static LLVM_ABI bool canReuseFlagsFromOriginalIVInc(PHINode *OrigPhi, PHINode *WidePhi, Instruction *OrigInc, Instruction *WideInc)
Return true if both increments directly increment the corresponding IV PHI nodes and have the same op...
Definition ScalarEvolutionExpander.cpp:873

llvm::SCEVExpander::expandCodeFor
LLVM_ABI Value * expandCodeFor(SCEVUse SH, Type *Ty, BasicBlock::iterator I)
Insert code to directly compute the specified SCEV expression into the program.
Definition ScalarEvolutionExpander.cpp:1555

llvm::SCEVExpander::expandComparePredicate
LLVM_ABI Value * expandComparePredicate(const SCEVComparePredicate *Pred, Instruction *Loc)
A specialized variant of expandCodeForPredicate, handling the case when we are expanding code for a S...
Definition ScalarEvolutionExpander.cpp:2216

llvm::SCEVExpander::expandWrapPredicate
LLVM_ABI Value * expandWrapPredicate(const SCEVWrapPredicate *P, Instruction *Loc)
A specialized variant of expandCodeForPredicate, handling the case when we are expanding code for a S...
Definition ScalarEvolutionExpander.cpp:2338

llvm::SCEVExpander::getIVIncOperand
LLVM_ABI Instruction * getIVIncOperand(Instruction *IncV, Instruction *InsertPos, bool allowScale)
Return the induction variable increment's IV operand.
Definition ScalarEvolutionExpander.cpp:760

llvm::SCEVExpander::eraseDeadInstructions
LLVM_ABI void eraseDeadInstructions(Value *Root)
Remove inserted instructions that are dead, e.g.
Definition ScalarEvolutionExpander.cpp:173

llvm::SCEVExpander::findInsertPointAfter
LLVM_ABI BasicBlock::iterator findInsertPointAfter(Instruction *I, Instruction *MustDominate) const
Returns a suitable insert point after I, that dominates MustDominate.
Definition ScalarEvolutionExpander.cpp:153

llvm::SCEVExpander::setInsertPoint
void setInsertPoint(Instruction *IP)
Set the current insertion point.
Definition ScalarEvolutionExpander.h:393

llvm::SCEVPredicate
This class represents an assumption made using SCEV expressions which can be checked at run-time.
Definition ScalarEvolution.h:374

llvm::SCEVPredicate::P_Compare
@ P_Compare
Definition ScalarEvolution.h:382

llvm::SCEVPredicate::P_Union
@ P_Union
Definition ScalarEvolution.h:382

llvm::SCEVPredicate::P_Wrap
@ P_Wrap
Definition ScalarEvolution.h:382

llvm::SCEVUnionPredicate
This class represents a composition of other SCEV predicates, and is the class that most clients will...
Definition ScalarEvolution.h:572

llvm::SCEVUnknown
This means that we are dealing with an entirely unknown SCEV value, and only represent it as its LLVM...
Definition ScalarEvolutionExpressions.h:599

llvm::SCEVWrapPredicate
This class represents an assumption made on an AddRec expression.
Definition ScalarEvolution.h:477

llvm::SCEVWrapPredicate::IncrementNUSW
@ IncrementNUSW
Definition ScalarEvolution.h:503

llvm::SCEVWrapPredicate::IncrementNSSW
@ IncrementNSSW
Definition ScalarEvolution.h:504

llvm::SCEV
This class represents an analyzed expression in the program.
Definition ScalarEvolution.h:249

llvm::SCEV::NoWrapFlags
SCEVNoWrapFlags NoWrapFlags
Definition ScalarEvolution.h:272

llvm::SCEV::FlagNUW
static constexpr auto FlagNUW
Definition ScalarEvolution.h:275

llvm::SCEV::FlagAnyWrap
static constexpr auto FlagAnyWrap
Definition ScalarEvolution.h:273

llvm::SCEV::isNonConstantNegative
LLVM_ABI bool isNonConstantNegative() const
Return true if the specified scev is negated, but not a constant.
Definition ScalarEvolution.cpp:533

llvm::SCEV::FlagNSW
static constexpr auto FlagNSW
Definition ScalarEvolution.h:276

llvm::SCEV::operands
LLVM_ABI ArrayRef< SCEVUse > operands() const
Return operands of this SCEV expression.
Definition ScalarEvolution.cpp:498

llvm::SCEV::getSCEVType
SCEVTypes getSCEVType() const
Definition ScalarEvolution.h:285

llvm::SCEV::FlagNW
static constexpr auto FlagNW
Definition ScalarEvolution.h:274

llvm::SCEV::getType
LLVM_ABI Type * getType() const
Return the LLVM type of this SCEV expression.
Definition ScalarEvolution.cpp:463

llvm::ScalarEvolution
The main scalar evolution driver.
Definition ScalarEvolution.h:616

llvm::ScalarEvolution::isKnownNonZero
LLVM_ABI bool isKnownNonZero(const SCEV *S)
Test if the given expression is known to be non-zero.
Definition ScalarEvolution.cpp:11307

llvm::ScalarEvolution::getMinusSCEV
LLVM_ABI const SCEV * getMinusSCEV(SCEVUse LHS, SCEVUse RHS, SCEV::NoWrapFlags Flags=SCEV::FlagAnyWrap, unsigned Depth=0)
Return LHS-RHS.
Definition ScalarEvolution.cpp:4842

llvm::ScalarEvolution::isGuaranteedNotToBePoison
static LLVM_ABI bool isGuaranteedNotToBePoison(const SCEV *Op)
Returns true if Op is guaranteed to not be poison.
Definition ScalarEvolution.cpp:7590

llvm::ScalarEvolution::getTruncateOrNoop
LLVM_ABI const SCEV * getTruncateOrNoop(const SCEV *V, Type *Ty)
Return a SCEV corresponding to a conversion of the input value to the specified type.
Definition ScalarEvolution.cpp:4953

llvm::ScalarEvolution::containsAddRecurrence
LLVM_ABI bool containsAddRecurrence(const SCEV *S)
Return true if the SCEV is a scAddRecExpr or it contains scAddRecExpr.
Definition ScalarEvolution.cpp:4693

llvm::ScalarEvolution::getZeroExtendExpr
LLVM_ABI const SCEV * getZeroExtendExpr(const SCEV *Op, Type *Ty, unsigned Depth=0)
Definition ScalarEvolution.cpp:1671

llvm::ScalarEvolution::clearFlags
static SCEV::NoWrapFlags clearFlags(SCEV::NoWrapFlags Flags, SCEV::NoWrapFlags OffFlags)
Definition ScalarEvolution.h:646

llvm::ScalarEvolution::maskFlags
static SCEV::NoWrapFlags maskFlags(SCEV::NoWrapFlags Flags, SCEV::NoWrapFlags Mask)
Convenient NoWrapFlags manipulation.
Definition ScalarEvolution.h:637

llvm::ScalarEvolution::getSignExtendExpr
LLVM_ABI const SCEV * getSignExtendExpr(const SCEV *Op, Type *Ty, unsigned Depth=0)
Definition ScalarEvolution.cpp:2019

llvm::ScalarEvolution::getAddExpr
LLVM_ABI const SCEV * getAddExpr(SmallVectorImpl< SCEVUse > &Ops, SCEV::NoWrapFlags Flags=SCEV::FlagAnyWrap, unsigned Depth=0)
Get a canonical add expression, or something simpler if possible.
Definition ScalarEvolution.cpp:2641

llvm::ScalarEvolution::canReuseInstruction
LLVM_ABI bool canReuseInstruction(const SCEV *S, Instruction *I, SmallVectorImpl< Instruction * > &DropPoisonGeneratingInsts)
Check whether it is poison-safe to represent the expression S using the instruction I.
Definition ScalarEvolution.cpp:4361

llvm::SmallPtrSetImplBase::clear
void clear()
Definition SmallPtrSet.h:102

llvm::SmallPtrSetImpl
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
Definition SmallPtrSet.h:366

llvm::SmallPtrSetImpl::insert
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
Definition SmallPtrSet.h:387

llvm::SmallPtrSetImpl::contains
bool contains(ConstPtrType Ptr) const
Definition SmallPtrSet.h:467

llvm::SmallPtrSet
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
Definition SmallPtrSet.h:533

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition SmallVector.h:581

llvm::SmallVectorImpl::pop_back_val
T pop_back_val()
Definition SmallVector.h:681

llvm::SmallVectorImpl::emplace_back
reference emplace_back(ArgTypes &&... Args)
Definition SmallVector.h:966

llvm::SmallVectorImpl::clear
void clear()
Definition SmallVector.h:618

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition SmallVector.h:423

llvm::SmallVectorTemplateCommon::end
iterator end()
Definition SmallVector.h:278

llvm::SmallVectorTemplateCommon::begin
iterator begin()
Definition SmallVector.h:276

llvm::SmallVectorTemplateCommon::back
reference back()
Definition SmallVector.h:317

llvm::SmallVectorTemplateCommon::empty
bool empty() const
Definition SmallVector.h:86

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1225

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition TargetTransformInfo.h:268

llvm::TargetTransformInfo::VectorInstrContext::None
@ None
The insert/extract is not used with a load/store.
Definition TargetTransformInfo.h:1069

llvm::TargetTransformInfo::getIntImmCostInst
LLVM_ABI InstructionCost getIntImmCostInst(unsigned Opc, unsigned Idx, const APInt &Imm, Type *Ty, TargetCostKind CostKind, Instruction *Inst=nullptr) const
Return the expected cost of materialization for the given integer immediate of the specified type for...
Definition TargetTransformInfo.cpp:778

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition TargetTransformInfo.h:331

llvm::TargetTransformInfo::TCK_RecipThroughput
@ TCK_RecipThroughput
Reciprocal throughput.
Definition TargetTransformInfo.h:332

llvm::TargetTransformInfo::TCK_CodeSize
@ TCK_CodeSize
Instruction code size.
Definition TargetTransformInfo.h:334

llvm::Twine
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46

llvm::Type::getIntegerBitWidth
LLVM_ABI unsigned getIntegerBitWidth() const
Definition DerivedTypes.h:107

llvm::Type::isVectorTy
bool isVectorTy() const
True if this is an instance of VectorType.
Definition Type.h:288

llvm::Type::getInt32Ty
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:309

llvm::Type::isPointerTy
bool isPointerTy() const
True if this is an instance of PointerType.
Definition Type.h:282

llvm::Type::getContext
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition Type.h:130

llvm::Type::getScalarSizeInBits
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Definition Type.cpp:232

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:257

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition Use.h:35

llvm::User
Definition User.h:44

llvm::User::operands
op_range operands()
Definition User.h:267

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition User.h:207

llvm::User::getNumOperands
unsigned getNumOperands() const
Definition User.h:229

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:255

llvm::Value::replaceAllUsesWith
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition Value.cpp:553

llvm::Value::getContext
LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.h:258

llvm::Value::users
iterator_range< user_iterator > users()
Definition Value.h:426

llvm::Value::use_empty
bool use_empty() const
Definition Value.h:346

llvm::cl::opt
Definition CommandLine.h:1449

llvm::ilist_detail::node_parent_access::getParent
const ParentTy * getParent() const
Definition ilist_node.h:34

llvm::ilist_node_impl::getIterator
self_iterator getIterator()
Definition ilist_node.h:123

llvm::ilist_node_with_parent::getNextNode
NodeTy * getNextNode()
Get the next node, or nullptr for the list tail.
Definition ilist_node.h:348

llvm::scope_exit
Definition ScopeExit.h:23

UINT64_MAX
#define UINT64_MAX
Definition DataTypes.h:77

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

llvm::AMDGPU::Imm
@ Imm
Definition AMDGPURegBankLegalizeRules.h:170

llvm::BitmaskEnumDetail::any
constexpr bool any(E Val)
Definition BitmaskEnum.h:147

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::GraphProgram::Name
Name
Definition GraphWriter.h:51

llvm::ISD::BasicBlock
@ BasicBlock
Various leaf nodes.
Definition ISDOpcodes.h:81

llvm::ISD::Constant
@ Constant
Definition ISDOpcodes.h:86

llvm::Intrinsic::ID
unsigned ID
Definition GenericSSAContext.h:28

llvm::Loc
Definition DwarfDebug.h:130

llvm::M68k::MemAddrModeKind::U
@ U
Definition M68kBaseInfo.h:60

llvm::M68k::MemAddrModeKind::V
@ V
Definition M68kBaseInfo.h:62

llvm::M68k::MemAddrModeKind::L
@ L
Definition M68kBaseInfo.h:69

llvm::PatternMatch
Definition PatternMatch.h:51

llvm::PatternMatch::m_Power2
cst_pred_ty< is_power2 > m_Power2()
Match an integer or vector power-of-2.
Definition PatternMatch.h:600

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition PatternMatch.h:53

llvm::PatternMatch::m_Instruction
match_bind< Instruction > m_Instruction(Instruction *&I)
Match an instruction, capturing it if we match.
Definition PatternMatch.h:826

llvm::PatternMatch::m_Specific
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
Definition PatternMatch.h:943

llvm::PatternMatch::m_BasicBlock
auto m_BasicBlock()
Match an arbitrary basic block value and ignore it.
Definition PatternMatch.h:216

llvm::PatternMatch::m_Value
auto m_Value()
Match an arbitrary value and ignore it.
Definition PatternMatch.h:135

llvm::PatternMatch::m_c_BinOp
AnyBinaryOp_match< LHS, RHS, true > m_c_BinOp(const LHS &L, const RHS &R)
Matches a BinaryOperator with LHS and RHS in either order.
Definition PatternMatch.h:3055

llvm::PatternMatch::m_ICmp
CmpClass_match< LHS, RHS, ICmpInst > m_ICmp(CmpPredicate &Pred, const LHS &L, const RHS &R)
Definition PatternMatch.h:1726

llvm::PatternMatch::m_Br
brc_match< Cond_t, match_bind< BasicBlock >, match_bind< BasicBlock > > m_Br(const Cond_t &C, BasicBlock *&T, BasicBlock *&F)
Definition PatternMatch.h:2438

llvm::RISCVFenceField::W
@ W
Definition RISCVBaseInfo.h:491

llvm::SCEVPatternMatch
Definition ScalarEvolutionPatternMatch.h:36

llvm::SCEVPatternMatch::m_scev_AllOnes
cst_pred_ty< is_all_ones > m_scev_AllOnes()
Match an integer with all bits set.
Definition ScalarEvolutionPatternMatch.h:77

llvm::SCEVPatternMatch::m_scev_PtrToAddr
SCEVUnaryExpr_match< SCEVPtrToAddrExpr, Op0_t > m_scev_PtrToAddr(const Op0_t &Op0)
Definition ScalarEvolutionPatternMatch.h:197

llvm::SCEVPatternMatch::m_scev_Mul
match_bind< const SCEVMulExpr > m_scev_Mul(const SCEVMulExpr *&V)
Definition ScalarEvolutionPatternMatch.h:103

llvm::SCEVPatternMatch::m_SCEVConstant
auto m_SCEVConstant()
Definition ScalarEvolutionPatternMatch.h:82

llvm::SCEVPatternMatch::m_scev_PtrToInt
SCEVUnaryExpr_match< SCEVPtrToIntExpr, Op0_t > m_scev_PtrToInt(const Op0_t &Op0)
Definition ScalarEvolutionPatternMatch.h:191

llvm::SCEVPatternMatch::m_scev_Add
match_bind< const SCEVAddExpr > m_scev_Add(const SCEVAddExpr *&V)
Definition ScalarEvolutionPatternMatch.h:99

llvm::SCEVPatternMatch::m_SCEV
auto m_SCEV()
Definition ScalarEvolutionPatternMatch.h:81

llvm::SCEVPatternMatch::m_scev_URem
SCEVURem_match< Op0_t, Op1_t > m_scev_URem(Op0_t LHS, Op1_t RHS, ScalarEvolution &SE)
Match the mathematical pattern A - (A / B) * B, where A and B can be arbitrary expressions.
Definition ScalarEvolutionPatternMatch.h:349

llvm::WinEH::EncodingType::CE
@ CE
Windows NT (Windows on ARM)
Definition MCAsmInfo.h:50

llvm::cl::Hidden
@ Hidden
Definition CommandLine.h:138

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition CommandLine.h:439

llvm::dwarf_linker::DebugSectionKind::DebugLoc
@ DebugLoc
Definition DWARFLinkerBase.h:34

llvm::memprof::Meta::Start
@ Start
Definition MemProf.h:69

llvm::ms_demangle::QualifierMangleMode::Result
@ Result
Definition MicrosoftDemangle.h:132

llvm::objcarc::ARCInstKind::User
@ User
could "use" a pointer
Definition ObjCARCInstKind.h:52

llvm::sandboxir::Instruction
friend class Instruction
Iterator for Instructions in a `BasicBlock`.
Definition BasicBlock.h:73

llvm::sframe::Flags
Flags
Definition SFrame.h:39

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition FunctionInfo.h:25

llvm::visitAll
void visitAll(const SCEV *Root, SV &Visitor)
Use SCEVTraversal to visit all nodes in the given expression tree.
Definition ScalarEvolutionExpressions.h:803

llvm::drop_begin
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:315

llvm::Offset
@ Offset
Definition DWP.cpp:558

llvm::Value
FunctionAddr VTableAddr Value
Definition InstrProf.h:137

llvm::stable_sort
void stable_sort(R &&Range)
Definition STLExtras.h:2115

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1738

llvm::Cost
InstructionCost Cost
Definition FunctionSpecialization.h:103

llvm::enumerate
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2553

llvm::pred_end
auto pred_end(const MachineBasicBlock *BB)
Definition MachineBasicBlock.h:1451

llvm::dyn_cast
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643

llvm::from_range
constexpr from_range_t from_range
Definition STLForwardCompat.h:206

llvm::min
constexpr NextUseDistance min(NextUseDistance A, NextUseDistance B)
Definition AMDGPUNextUseAnalysis.h:218

llvm::append_range
void append_range(Container &C, Range &&R)
Wrapper function to append range R to container C.
Definition STLExtras.h:2207

llvm::pred_size
auto pred_size(const MachineBasicBlock *BB)
Definition MachineBasicBlock.h:1447

llvm::FloatStyle::Exponent
@ Exponent
Definition NativeFormatting.h:18

llvm::simplifyInstruction
LLVM_ABI Value * simplifyInstruction(Instruction *I, const SimplifyQuery &Q)
See if we can compute a simplified version of this instruction.
Definition InstructionSimplify.cpp:7735

llvm::isInstructionTriviallyDead
LLVM_ABI bool isInstructionTriviallyDead(Instruction *I, const TargetLibraryInfo *TLI=nullptr)
Return true if the result produced by the instruction is not used, and the instruction will return.
Definition Local.cpp:403

llvm::reverse
auto reverse(ContainerTy &&C)
Definition STLExtras.h:407

llvm::dbgs
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209

llvm::SCEVCheapExpansionBudget
LLVM_ABI cl::opt< unsigned > SCEVCheapExpansionBudget

llvm::SmallVector
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
Definition SmallVector.h:1151

llvm::isa
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type arguments.
Definition Casting.h:547

llvm::ConstantFoldBinaryOpOperands
LLVM_ABI Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
Definition ConstantFolding.cpp:1452

llvm::normalizeForPostIncUse
LLVM_ABI const SCEV * normalizeForPostIncUse(const SCEV *S, const PostIncLoopSet &Loops, ScalarEvolution &SE, bool CheckInvertible=true)
Normalize S to be post-increment for all loops present in Loops.
Definition ScalarEvolutionNormalization.cpp:97

llvm::TTI
TargetTransformInfo TTI
Definition TargetTransformInfo.h:263

llvm::IRBuilder
IRBuilder(LLVMContext &, FolderTy, InserterTy, MDNode *, ArrayRef< OperandBundleDef >) -> IRBuilder< FolderTy, InserterTy >

llvm::LEB128Sign::Signed
@ Signed
Definition LEB128.h:232

llvm::max
constexpr NextUseDistance max(NextUseDistance A, NextUseDistance B)
Definition AMDGPUNextUseAnalysis.h:222

llvm::RecurKind::Mul
@ Mul
Product of integers.
Definition IVDescriptors.h:41

llvm::RecurKind::Sub
@ Sub
Subtraction of integers.
Definition IVDescriptors.h:39

llvm::RecurKind::Add
@ Add
Sum of integers.
Definition IVDescriptors.h:38

llvm::Op
DWARFExpression::Operation Op
Definition DWARFExpressionPrinter.cpp:25

llvm::pred_iterator
PredIterator< BasicBlock, Value::user_iterator > pred_iterator
Definition CFG.h:93

llvm::BitWidth
constexpr unsigned BitWidth
Definition BitmaskEnum.h:219

llvm::formLCSSAForInstructions
LLVM_ABI bool formLCSSAForInstructions(SmallVectorImpl< Instruction * > &Worklist, const DominatorTree &DT, const LoopInfo &LI, ScalarEvolution *SE, SmallVectorImpl< PHINode * > *PHIsToRemove=nullptr, SmallVectorImpl< PHINode * > *InsertedPHIs=nullptr)
Ensures LCSSA form for every instruction from the Worklist in the scope of innermost containing loop.
Definition LCSSA.cpp:308

llvm::pred_begin
auto pred_begin(const MachineBasicBlock *BB)
Definition MachineBasicBlock.h:1449

llvm::cast
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559

llvm::PostIncLoopSet
SmallPtrSet< const Loop *, 2 > PostIncLoopSet
Definition ScalarEvolutionNormalization.h:49

llvm::predecessors
auto predecessors(const MachineBasicBlock *BB)
Definition MachineBasicBlock.h:1443

llvm::make_pointer_range
iterator_range< pointer_iterator< WrappedIteratorT > > make_pointer_range(RangeT &&Range)
Definition iterator.h:368

llvm::is_contained
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
Definition STLExtras.h:1946

llvm::scUMinExpr
@ scUMinExpr
Definition ScalarEvolutionExpressions.h:52

llvm::scAddRecExpr
@ scAddRecExpr
Definition ScalarEvolutionExpressions.h:49

llvm::scSequentialUMinExpr
@ scSequentialUMinExpr
Definition ScalarEvolutionExpressions.h:54

llvm::scAddExpr
@ scAddExpr
Definition ScalarEvolutionExpressions.h:46

llvm::scVScale
@ scVScale
Definition ScalarEvolutionExpressions.h:42

llvm::scSMaxExpr
@ scSMaxExpr
Definition ScalarEvolutionExpressions.h:51

llvm::scUnknown
@ scUnknown
Definition ScalarEvolutionExpressions.h:57

llvm::scSMinExpr
@ scSMinExpr
Definition ScalarEvolutionExpressions.h:53

llvm::scPtrToAddr
@ scPtrToAddr
Definition ScalarEvolutionExpressions.h:55

llvm::scCouldNotCompute
@ scCouldNotCompute
Definition ScalarEvolutionExpressions.h:58

llvm::scConstant
@ scConstant
Definition ScalarEvolutionExpressions.h:41

llvm::scSignExtend
@ scSignExtend
Definition ScalarEvolutionExpressions.h:45

llvm::scTruncate
@ scTruncate
Definition ScalarEvolutionExpressions.h:43

llvm::scUMaxExpr
@ scUMaxExpr
Definition ScalarEvolutionExpressions.h:50

llvm::scZeroExtend
@ scZeroExtend
Definition ScalarEvolutionExpressions.h:44

llvm::scPtrToInt
@ scPtrToInt
Definition ScalarEvolutionExpressions.h:56

llvm::scUDivExpr
@ scUDivExpr
Definition ScalarEvolutionExpressions.h:48

llvm::scMulExpr
@ scMulExpr
Definition ScalarEvolutionExpressions.h:47

llvm::isImpliedByDomCondition
LLVM_ABI std::optional< bool > isImpliedByDomCondition(const Value *Cond, const Instruction *ContextI, const DataLayout &DL)
Return the boolean condition value in the context of the given instruction if it is known based on dominating conditions.
Definition ValueTracking.cpp:9971

llvm::SCEVUse
SCEVUseT< const SCEV * > SCEVUse
Definition ScalarEvolution.h:187

llvm::SCEVExprContains
bool SCEVExprContains(const SCEV *Root, PredTy Pred)
Return true if any node in Root satisfies the predicate Pred.
Definition ScalarEvolutionExpressions.h:810

std::swap
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:862

raw_ostream.h

InsertionPoint
Definition CFIFixup.cpp:186

WorkItem
Definition WinEHPrepare.cpp:235

llvm::PoisonFlags::NUW
unsigned NUW
Definition ScalarEvolutionExpander.h:46

llvm::PoisonFlags::Disjoint
unsigned Disjoint
Definition ScalarEvolutionExpander.h:49

llvm::PoisonFlags::NNeg
unsigned NNeg
Definition ScalarEvolutionExpander.h:50

llvm::PoisonFlags::apply
LLVM_ABI void apply(Instruction *I)
Definition ScalarEvolutionExpander.cpp:76

llvm::PoisonFlags::PoisonFlags
LLVM_ABI PoisonFlags(const Instruction *I)
Definition ScalarEvolutionExpander.cpp:48

llvm::PoisonFlags::GEPNW
GEPNoWrapFlags GEPNW
Definition ScalarEvolutionExpander.h:52

llvm::PoisonFlags::NSW
unsigned NSW
Definition ScalarEvolutionExpander.h:47

llvm::PoisonFlags::SameSign
unsigned SameSign
Definition ScalarEvolutionExpander.h:51

llvm::PoisonFlags::Exact
unsigned Exact
Definition ScalarEvolutionExpander.h:48

llvm::SCEVOperand
struct for holding enough information to help calculate the cost of the given SCEV when expanded into IR.
Definition ScalarEvolutionExpander.h:34

llvm::SCEVOperand::S
const SCEV * S
The SCEV operand to be costed.
Definition ScalarEvolutionExpander.h:42

llvm::SCEVOperand::ParentOpcode
unsigned ParentOpcode
LLVM instruction opcode that uses the operand.
Definition ScalarEvolutionExpander.h:38

llvm::SCEVOperand::OperandIdx
int OperandIdx
The use index of an expanded instruction.
Definition ScalarEvolutionExpander.h:40

llvm::SCEVUseT
Definition ScalarEvolution.h:121

llvm::SCEVUseT::getNoWrapFlags
SCEVNoWrapFlags getNoWrapFlags(SCEVNoWrapFlags Mask=SCEVNoWrapFlags::NoWrapMask) const
Return the no-wrap flags for this SCEVUse, which is the union of the use-specific flags and the under...
Definition ScalarEvolutionExpressions.h:1055

llvm::SCEVUseVisitor< SCEVExpander, Value * >::visit
Value * visit(SCEVUse S)
Definition ScalarEvolutionExpressions.h:681

llvm::cl::desc
Definition CommandLine.h:405