// Extracted from: doxygen/html/JumpThreading_8cpp_source.html

//===- JumpThreading.cpp - Thread control through conditional blocks ------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements the Jump Threading pass.

//

//===----------------------------------------------------------------------===//


#include "llvm/Transforms/Scalar/JumpThreading.h"

#include "llvm/ADT/DenseMap.h"

#include "llvm/ADT/MapVector.h"

#include "llvm/ADT/STLExtras.h"

#include "llvm/ADT/SmallPtrSet.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/Analysis/BlockFrequencyInfo.h"

#include "llvm/Analysis/BranchProbabilityInfo.h"

#include "llvm/Analysis/CFG.h"

#include "llvm/Analysis/ConstantFolding.h"

#include "llvm/Analysis/GlobalsModRef.h"

#include "llvm/Analysis/GuardUtils.h"

#include "llvm/Analysis/InstructionSimplify.h"

#include "llvm/Analysis/LazyValueInfo.h"

#include "llvm/Analysis/Loads.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/Analysis/MemoryLocation.h"

#include "llvm/Analysis/PostDominators.h"

#include "llvm/Analysis/TargetLibraryInfo.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/IR/BasicBlock.h"

#include "llvm/IR/CFG.h"

#include "llvm/IR/Constant.h"

#include "llvm/IR/ConstantRange.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/IR/DebugInfo.h"

#include "llvm/IR/Dominators.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Instruction.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Intrinsics.h"

#include "llvm/IR/LLVMContext.h"

#include "llvm/IR/MDBuilder.h"

#include "llvm/IR/Metadata.h"

#include "llvm/IR/Module.h"

#include "llvm/IR/PassManager.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/IR/ProfDataUtils.h"

#include "llvm/IR/Type.h"

#include "llvm/IR/Use.h"

#include "llvm/IR/Value.h"

#include "llvm/Support/BlockFrequency.h"

#include "llvm/Support/BranchProbability.h"

#include "llvm/Support/Casting.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/raw_ostream.h"

#include "llvm/Transforms/Utils/BasicBlockUtils.h"

#include "llvm/Transforms/Utils/Cloning.h"

#include "llvm/Transforms/Utils/Local.h"

#include "llvm/Transforms/Utils/SSAUpdater.h"

#include "llvm/Transforms/Utils/ValueMapper.h"

#include <cassert>

#include <cstdint>

#include <iterator>

#include <memory>

#include <utility>


using namespace llvm;

using namespace jumpthreading;


#define DEBUG_TYPE "jump-threading"


// Statistic counters declared for this pass. The first argument is the counter
// name and the second is its description string.
STATISTIC(NumThreads, "Number of jumps threaded");
STATISTIC(NumFolds,   "Number of terminators folded");
STATISTIC(NumDupes,   "Number of branch blocks duplicated to eliminate phi");


// Upper bound on the size of a block that may be duplicated for threading.
// Defaults to 6. The JumpThreadingPass constructor falls back to this value
// when it is passed -1, and runImpl lets an explicit command-line occurrence
// of this option override every other source of the threshold.
static cl::opt<unsigned>
BBDuplicateThreshold("jump-threading-threshold",
          cl::desc("Max block size to duplicate for jump threading"),
          cl::init(6), cl::Hidden);

// Number of predecessors to search for a stronger condition when threading
// over a weaker one (see the option description). Defaults to 3.
static cl::opt<unsigned>
ImplicationSearchThreshold(
  "jump-threading-implication-search-threshold",
  cl::desc("The number of predecessors to search for a stronger "
           "condition to use to thread over a weaker condition"),
  cl::init(3), cl::Hidden);

// Maximum number of PHI nodes a block may start with and still be considered
// for duplication. Defaults to 76. getJumpThreadDuplicationCost reports a
// block with more leading PHIs than this as impossible to duplicate (~0U).
static cl::opt<unsigned> PhiDuplicateThreshold(
    "jump-threading-phi-threshold",
    cl::desc("Max PHIs in BB to duplicate for jump threading"), cl::init(76),
    cl::Hidden);

// Testing aid, off by default. When it is set, runImpl does not call
// findLoopHeaders, so that call does not populate LoopHeaders.
static cl::opt<bool> ThreadAcrossLoopHeaders(
    "jump-threading-across-loop-headers",
    cl::desc("Allow JumpThreading to thread across loop headers, for testing"),
    cl::init(false), cl::Hidden);


JumpThreadingPass::JumpThreadingPass(int T) {
  // -1 is the "no explicit threshold" marker: in that case take the current
  // value of the -jump-threading-threshold option. Any other value is used
  // as the default block-duplication threshold after conversion to unsigned.
  if (T == -1)
    DefaultBBDupThreshold = BBDuplicateThreshold;
  else
    DefaultBBDupThreshold = static_cast<unsigned>(T);
}


// Update branch probability information according to conditional

// branch probability. This is usually made possible for cloned branches

// in inline instances by the context specific profile in the caller.

// For instance,

//

//  [Block PredBB]

//  [Branch PredBr]

//  if (t) {

//     Block A;

//  } else {

//     Block B;

//  }

//

//  [Block BB]

//  cond = PN([true, %A], [..., %B]); // PHI node

//  [Branch CondBr]

//  if (cond) {

//    ...  // P(cond == true) = 1%

//  }

//

//  Here we know that when block A is taken, cond must be true, which means

//      P(cond == true | A) = 1

//

//  Given that P(cond == true) = P(cond == true | A) * P(A) +

//                               P(cond == true | B) * P(B)

//  we get:

//     P(cond == true ) = P(A) + P(cond == true | B) * P(B)

//

//  which gives us:

//     P(A) is less than or equal to P(cond == true), i.e.

//     P(t == true) <= P(cond == true)

//

//  In other words, if we know P(cond == true) is unlikely, we know

//  that P(t == true) is also unlikely.

//

static void updatePredecessorProfileMetadata(PHINode *PN, BasicBlock *BB) {
  // Only a branch terminator with usable branch weights can seed the
  // inference.
  auto *CondBr = dyn_cast<BranchInst>(BB->getTerminator());
  if (!CondBr)
    return;

  uint64_t TrueWeight, FalseWeight;
  if (!extractBranchWeights(*CondBr, TrueWeight, FalseWeight))
    return;

  // All-zero weights carry no probability information, and would make the
  // denominator below zero.
  const uint64_t TotalWeight = TrueWeight + FalseWeight;
  if (TotalWeight == 0)
    return;

  // Starting at IncomingBB, climb the chain of single predecessors until a
  // block ending in a conditional branch is found. Returns that block paired
  // with the successor through which the walk reached it, or a pair of nulls
  // when the chain ends or loops back on itself before one is found.
  auto FindConditionalEdge =
      [](BasicBlock *IncomingBB,
         BasicBlock *PhiBB) -> std::pair<BasicBlock *, BasicBlock *> {
    SmallPtrSet<BasicBlock *, 16> Seen;
    BasicBlock *From = IncomingBB;
    BasicBlock *To = PhiBB;
    for (;;) {
      if (auto *Br = dyn_cast<BranchInst>(From->getTerminator()))
        if (Br->isConditional())
          return {From, To};

      Seen.insert(From);
      BasicBlock *Above = From->getSinglePredecessor();
      // No unique predecessor, or one we have already walked through (an
      // unreachable loop): give up.
      if (!Above || Seen.count(Above))
        return {nullptr, nullptr};

      To = From;
      From = Above;
    }
  };

  for (unsigned Idx = 0, NumIncoming = PN->getNumIncomingValues();
       Idx != NumIncoming; ++Idx) {
    // Only constant i1 incoming values pin down the direction of CondBr.
    auto *CI = dyn_cast<ConstantInt>(PN->getIncomingValue(Idx));
    if (!CI || !CI->getType()->isIntegerTy(1))
      continue;

    // Probability of the CondBr direction selected by this incoming value.
    const uint64_t DirectionWeight = CI->isOne() ? TrueWeight : FalseWeight;
    BranchProbability BP =
        BranchProbability::getBranchProbability(DirectionWeight, TotalWeight);

    auto [EdgeSrc, EdgeDst] =
        FindConditionalEdge(PN->getIncomingBlock(Idx), BB);
    // NOTE(review): a failed lookup abandons the remaining incoming values
    // instead of skipping just this one; this mirrors the existing behavior.
    if (!EdgeSrc)
      return;

    auto *PredBr = dyn_cast<BranchInst>(EdgeSrc->getTerminator());
    if (!PredBr)
      return;

    // FIXME: We currently only set the profile data when it is missing.
    // With PGO, this can be used to refine even existing profile data with
    // context information. This needs to be done after more performance
    // testing.
    uint64_t PredTrueWeight, PredFalseWeight;
    if (extractBranchWeights(*PredBr, PredTrueWeight, PredFalseWeight))
      continue;

    // BP is only an upper bound, so nothing useful follows once it reaches
    // 50%.
    if (BP >= BranchProbability(50, 100))
      continue;

    // The successor slot that leads towards the PHI gets BP; the other slot
    // gets its complement.
    const bool TowardsPhiIsFirst = PredBr->getSuccessor(0) == EdgeDst;
    uint32_t Weights[2];
    Weights[TowardsPhiIsFirst ? 0 : 1] = BP.getNumerator();
    Weights[TowardsPhiIsFirst ? 1 : 0] = BP.getCompl().getNumerator();
    setBranchWeights(*PredBr, Weights, hasBranchWeightOrigin(*PredBr));
  }
}


PreservedAnalyses JumpThreadingPass::run(Function &F,
                                         FunctionAnalysisManager &AM) {
  auto &TTI = AM.getResult<TargetIRAnalysis>(F);
  // Jump threading is not meaningful on targets with divergent control flow,
  // so leave such functions untouched.
  if (TTI.hasBranchDivergence(&F))
    return PreservedAnalyses::all();

  auto &TLI = AM.getResult<TargetLibraryAnalysis>(F);
  auto &LVI = AM.getResult<LazyValueAnalysis>(F);
  auto &AA = AM.getResult<AAManager>(F);
  auto &DT = AM.getResult<DominatorTreeAnalysis>(F);

  // Lazy updater over the dominator tree only (no post-dominator tree). No
  // BFI/BPI is supplied up front.
  auto LazyUpdater = std::make_unique<DomTreeUpdater>(
      &DT, nullptr, DomTreeUpdater::UpdateStrategy::Lazy);
  const bool MadeChange =
      runImpl(F, &AM, &TLI, &TTI, &LVI, &AA, std::move(LazyUpdater),
              std::nullopt, std::nullopt);
  if (!MadeChange)
    return PreservedAnalyses::all();

  // Apply the queued tree updates before verifying and reporting.
  auto *Updater = getDomTreeUpdater();
  Updater->flush();

  // Verification strength depends on EXPENSIVE_CHECKS: Full when defined,
  // Fast otherwise.
#if defined(EXPENSIVE_CHECKS)
  assert(Updater->getDomTree().verify(
             DominatorTree::VerificationLevel::Full) &&
         "DT broken after JumpThreading");
  assert((!Updater->hasPostDomTree() ||
          Updater->getPostDomTree().verify(
              PostDominatorTree::VerificationLevel::Full)) &&
         "PDT broken after JumpThreading");
#else
  assert(Updater->getDomTree().verify(
             DominatorTree::VerificationLevel::Fast) &&
         "DT broken after JumpThreading");
  assert((!Updater->hasPostDomTree() ||
          Updater->getPostDomTree().verify(
              PostDominatorTree::VerificationLevel::Fast)) &&
         "PDT broken after JumpThreading");
#endif

  return getPreservedAnalysis();
}


bool JumpThreadingPass::runImpl(Function &F_, FunctionAnalysisManager *FAM_,
                                TargetLibraryInfo *TLI_,
                                TargetTransformInfo *TTI_, LazyValueInfo *LVI_,
                                AliasAnalysis *AA_,
                                std::unique_ptr<DomTreeUpdater> DTU_,
                                std::optional<BlockFrequencyInfo *> BFI_,
                                std::optional<BranchProbabilityInfo *> BPI_) {
  LLVM_DEBUG(dbgs() << "Jump threading on function '" << F_.getName() << "'\n");

  // Record the function and the analyses in the pass object; ownership of the
  // DomTreeUpdater moves into the pass.
  F = &F_;
  FAM = FAM_;
  TLI = TLI_;
  TTI = TTI_;
  LVI = LVI_;
  AA = AA_;
  DTU = std::move(DTU_);
  BFI = BFI_;
  BPI = BPI_;

  // Guards matter only if the experimental_guard intrinsic is declared in the
  // module and has at least one use.
  auto *GuardDecl = Intrinsic::getDeclarationIfExists(
      F->getParent(), Intrinsic::experimental_guard);
  HasGuards = GuardDecl && !GuardDecl->use_empty();

  // Pick the duplication threshold. An explicit command-line value wins; next,
  // functions optimized strictly for size get a reduced limit of 3; otherwise
  // the default chosen at construction time is kept.
  BBDupThreshold = DefaultBBDupThreshold;
  if (BBDuplicateThreshold.getNumOccurrences())
    BBDupThreshold = BBDuplicateThreshold;
  else if (F->hasFnAttribute(Attribute::MinSize))
    BBDupThreshold = 3;

  // JumpThreading must not process blocks unreachable from entry. It's a
  // waste of compute time and can potentially lead to hangs. Collect them
  // once up front from the dominator tree.
  assert(DTU && "DTU isn't passed into JumpThreading before using it.");
  assert(DTU->hasDomTree() && "JumpThreading relies on DomTree to proceed.");
  DominatorTree &DT = DTU->getDomTree();
  SmallPtrSet<BasicBlock *, 16> NotReachable;
  for (BasicBlock &Block : *F)
    if (!DT.isReachableFromEntry(&Block))
      NotReachable.insert(&Block);

  if (!ThreadAcrossLoopHeaders)
    findLoopHeaders(*F);

  // Sweep the function repeatedly until a full sweep changes nothing.
  bool EverChanged = false;
  while (true) {
    bool Changed = false;

    for (BasicBlock &BB : *F) {
      if (NotReachable.count(&BB))
        continue;

      // Thread all of the branches we can over BB.
      while (processBlock(&BB)) {
        ChangedSinceLastAnalysisUpdate = true;
        Changed = true;
      }

      // Jump threading may have introduced redundant debug values into BB
      // which should be removed.
      if (Changed)
        RemoveRedundantDbgInstrs(&BB);

      // The steps below try to eliminate BB. Skip them for the entry block
      // (finding a replacement entry is non-trivial) and for a block that is
      // already pending deletion.
      if (&BB == &F->getEntryBlock() || DTU->isBBPendingDeletion(&BB))
        continue;

      if (pred_empty(&BB)) {
        // When processBlock makes BB unreachable it doesn't bother to fix up
        // the instructions in it. We must remove BB to prevent invalid IR.
        LLVM_DEBUG(dbgs() << "  JT: Deleting dead block '" << BB.getName()
                          << "' with terminator: " << *BB.getTerminator()
                          << '\n');
        LoopHeaders.erase(&BB);
        LVI->eraseBlock(&BB);
        DeleteDeadBlock(&BB, DTU.get());
        ChangedSinceLastAnalysisUpdate = true;
        Changed = true;
        continue;
      }

      // processBlock doesn't thread BBs with unconditional TIs. However, if BB
      // is "almost empty", we attempt to merge BB with its sole successor.
      auto *BI = dyn_cast<BranchInst>(BB.getTerminator());
      if (!BI || !BI->isUnconditional())
        continue;
      BasicBlock *Succ = BI->getSuccessor(0);

      // The terminator must be the only non-phi instruction in BB.
      if (!BB.getFirstNonPHIOrDbg(true)->isTerminator())
        continue;

      // Don't alter Loop headers and latches to ensure another pass can
      // detect and transform nested loops later.
      if (LoopHeaders.count(&BB) || LoopHeaders.count(Succ))
        continue;

      if (!TryToSimplifyUncondBranchFromEmptyBlock(&BB, DTU.get()))
        continue;

      RemoveRedundantDbgInstrs(Succ);
      // BB is valid for cleanup here because we passed in DTU. F remains
      // BB's parent until a DTU->getDomTree() event.
      LVI->eraseBlock(&BB);
      ChangedSinceLastAnalysisUpdate = true;
      Changed = true;
    }

    if (!Changed)
      break;
    EverChanged = true;
  }

  LoopHeaders.clear();
  return EverChanged;
}


// Substitute ToVal for Cond wherever that is safe, and erase Cond when that
// leaves it unused. Returns true if anything was changed.
//
// A blanket RAUW would be wrong here: guards/assumes may themselves be uses of
// `Cond`, and they may be what let us reason about the value of `Cond` at the
// end of the block. RAUW would rewrite those guards/assumes, as well as uses
// that come before them.
static bool replaceFoldableUses(Instruction *Cond, Value *ToVal,
                                BasicBlock *KnownAtEndOfBB) {
  assert(Cond->getType() == ToVal->getType());
  bool Changed = false;

  // Uses in non-local blocks (i.e. uses strictly dominated by BB) can be
  // replaced unconditionally, since the LVI information holds from the
  // terminator of BB onwards.
  if (Cond->getParent() == KnownAtEndOfBB)
    Changed |= replaceNonLocalUsesWith(Cond, ToVal);

  // Walk the block bottom-up, rewriting uses for as long as every instruction
  // passed is guaranteed to reach the end of the block.
  for (auto It = KnownAtEndOfBB->rbegin(), End = KnownAtEndOfBB->rend();
       It != End; ++It) {
    Instruction &Inst = *It;

    // Replace any debug-info record users of Cond with ToVal.
    for (DbgVariableRecord &DVR : filterDbgVars(Inst.getDbgRecordRange()))
      DVR.replaceVariableLocationOp(Cond, ToVal, true);

    // Stop at Cond itself (no uses can precede it), or at the first
    // instruction that might not transfer execution to its successor: above
    // that point we no longer know that Cond is ToVal.
    if (&Inst == Cond || !isGuaranteedToTransferExecutionToSuccessor(&Inst))
      break;

    if (Inst.replaceUsesOfWith(Cond, ToVal))
      Changed = true;
  }

  // Keep Cond if it still has users or has side effects.
  if (!Cond->use_empty() || Cond->mayHaveSideEffects())
    return Changed;

  Cond->eraseFromParent();
  return true;
}


/// Return the cost of duplicating a piece of this block from first non-phi

/// and before StopAt instruction to thread across it. Stop scanning the block

/// when exceeding the threshold. If duplication is impossible, returns ~0U.

static unsigned getJumpThreadDuplicationCost(const TargetTransformInfo *TTI,

                                             BasicBlock *BB,

                                             Instruction *StopAt,

                                             unsigned Threshold) {

  assert(StopAt->getParent() == BB && "Not an instruction from proper BB?");


  // Do not duplicate the BB if it has a lot of PHI nodes.

  // If a threadable chain is too long then the number of PHI nodes can add up,

  // leading to a substantial increase in compile time when rewriting the SSA.

  unsigned PhiCount = 0;

  Instruction *FirstNonPHI = nullptr;

  for (Instruction &I : *BB) {

    if (!isa<PHINode>(&I)) {

      FirstNonPHI = &I;

      break;

    }

    if (++PhiCount > PhiDuplicateThreshold)

      return ~0U;

  }


  /// Ignore PHI nodes, these will be flattened when duplication happens.

  BasicBlock::const_iterator I(FirstNonPHI);


  // FIXME: THREADING will delete values that are just used to compute the

  // branch, so they shouldn't count against the duplication cost.


  unsigned Bonus = 0;

  if (BB->getTerminator() == StopAt) {

    // Threading through a switch statement is particularly profitable.  If this

    // block ends in a switch, decrease its cost to make it more likely to

    // happen.

    if (isa<SwitchInst>(StopAt))

      Bonus = 6;


    // The same holds for indirect branches, but slightly more so.

    if (isa<IndirectBrInst>(StopAt))

      Bonus = 8;

  }


  // Bump the threshold up so the early exit from the loop doesn't skip the

  // terminator-based Size adjustment at the end.

  Threshold += Bonus;


  // Sum up the cost of each instruction until we get to the terminator.  Don't

  // include the terminator because the copy won't include it.

  unsigned Size = 0;

  for (; &*I != StopAt; ++I) {


    // Stop scanning the block if we've reached the threshold.

    if (Size > Threshold)

      return Size;


    // Bail out if this instruction gives back a token type, it is not possible

    // to duplicate it if it is used outside this BB.

    if (I->getType()->isTokenTy() && I->isUsedOutsideOfBlock(BB))

      return ~0U;


    // Blocks with NoDuplicate are modelled as having infinite cost, so they

    // are never duplicated.

    if (const CallInst *CI = dyn_cast<CallInst>(I))

      if (CI->cannotDuplicate() || CI->isConvergent())

        return ~0U;


    if (TTI->getInstructionCost(&*I, TargetTransformInfo::TCK_SizeAndLatency) ==

        TargetTransformInfo::TCC_Free)

      continue;


    // All other instructions count for at least one unit.

    ++Size;


    // Calls are more expensive.  If they are non-intrinsic calls, we model them

    // as having cost of 4.  If they are a non-vector intrinsic, we model them

    // as having cost of 2 total, and if they are a vector intrinsic, we model

    // them as having cost 1.

    if (const CallInst *CI = dyn_cast<CallInst>(I)) {

      if (!isa<IntrinsicInst>(CI))

        Size += 3;

      else if (!CI->getType()->isVectorTy())

        Size += 1;

    }

  }


  return Size > Bonus ? Size - Bonus : 0;

}


/// findLoopHeaders - Record the loop headers of \p F in LoopHeaders.
///
/// Jump threading must not turn proper loop structures into irreducible
/// loops: that breaks up the loop nesting hierarchy and pessimizes later
/// transformations. To avoid it we first need to know the loop headers, which
/// are approximated here as the targets of backedges in the CFG.
///
/// There definitely are cases where threading across a loop header is
/// desirable. Threading a jump from outside the loop (the preheader) to an
/// exit block of the loop is definitely profitable. Threading backedges from
/// within the loop to exit blocks is almost always profitable, and threading
/// backedges to other blocks within the loop (forming a nested loop) often is.
/// This simple analysis is not rich enough to track all of these properties
/// and keep them up-to-date as the CFG mutates, so none of these
/// transformations are allowed.
void JumpThreadingPass::findLoopHeaders(Function &F) {
  using CFGEdge = std::pair<const BasicBlock *, const BasicBlock *>;

  SmallVector<CFGEdge, 32> BackEdges;
  FindFunctionBackedges(F, BackEdges);

  // The second element of each collected edge is the block the backedge
  // targets, i.e. the approximated loop header.
  for (const CFGEdge &BackEdge : BackEdges) {
    const BasicBlock *Header = BackEdge.second;
    LoopHeaders.insert(Header);
  }
}


/// getKnownConstant - Decide whether \p Val is a constant we can thread a
/// terminator over, and if so return it. An undef is always accepted. Beyond
/// that, \p Preference selects the accepted kind: a BlockAddress (looked up
/// after stripping pointer casts) for WantBlockAddress, a ConstantInt
/// otherwise. Returns null if \p Val is null or not an appropriate constant.
static Constant *getKnownConstant(Value *Val, ConstantPreference Preference) {
  if (!Val)
    return nullptr;

  // Undef is "known" enough.
  if (auto *Undef = dyn_cast<UndefValue>(Val))
    return Undef;

  if (Preference != WantBlockAddress)
    return dyn_cast<ConstantInt>(Val);

  return dyn_cast<BlockAddress>(Val->stripPointerCasts());
}


/// computeValueKnownInPredecessorsImpl - Given a basic block BB and a value V,
/// see if we can infer that the value is a known ConstantInt/BlockAddress or
/// undef in any of our predecessors.  If so, append the known (value, pred BB)
/// pairs to the result vector.
///
/// \param V             The value to resolve.
/// \param BB            The block whose incoming edges are examined.
/// \param Result        Receives one (constant, predecessor) entry per edge on
///                      which a value could be determined.
/// \param Preference    Kind of constant wanted (WantInteger or
///                      WantBlockAddress); see getKnownConstant.
/// \param RecursionSet  Values already visited on this walk; shared by every
///                      recursive call to stop cycles in the use-def chain.
/// \param CxtI          Context instruction forwarded to the LazyValueInfo
///                      queries. Some queries substitute the compare when it
///                      is null, but the final fallback dereferences it
///                      unconditionally.
///
/// This returns true if there were any known values.
bool JumpThreadingPass::computeValueKnownInPredecessorsImpl(
    Value *V, BasicBlock *BB, PredValueInfo &Result,
    ConstantPreference Preference, SmallPtrSet<Value *, 4> &RecursionSet,
    Instruction *CxtI) {
  const DataLayout &DL = BB->getDataLayout();

  // This method walks up use-def chains recursively.  Because of this, we could
  // get into an infinite loop going around loops in the use-def chain.  To
  // prevent this, keep track of the values we've already visited (BB is the
  // same for every recursive call) and terminate the search if we loop back to
  // one of them.
  if (!RecursionSet.insert(V).second)
    return false;

  // If V is a constant, then it is known in all predecessors.
  if (Constant *KC = getKnownConstant(V, Preference)) {
    for (BasicBlock *Pred : predecessors(BB))
      Result.emplace_back(KC, Pred);

    return !Result.empty();
  }

  // If V is a non-instruction value, or an instruction in a different block,
  // then it can't be derived from a PHI.
  Instruction *I = dyn_cast<Instruction>(V);
  if (!I || I->getParent() != BB) {

    // Okay, if this is a live-in value, see if it has a known value on any
    // edge from our predecessors.
    for (BasicBlock *P : predecessors(BB)) {
      using namespace PatternMatch;
      // If the value is known by LazyValueInfo to be a constant in a
      // predecessor, use that information to try to thread this block.
      Constant *PredCst = LVI->getConstantOnEdge(V, P, BB, CxtI);
      // If I is a non-local compare-with-constant instruction, use more-rich
      // 'getPredicateOnEdge' method. This would be able to handle value
      // inequalities better, for example if the compare is "X < 4" and "X < 3"
      // is known true but "X < 4" itself is not available.
      CmpPredicate Pred;
      Value *Val;
      Constant *Cst;
      if (!PredCst && match(V, m_Cmp(Pred, m_Value(Val), m_Constant(Cst))))
        PredCst = LVI->getPredicateOnEdge(Pred, Val, Cst, P, BB, CxtI);
      if (Constant *KC = getKnownConstant(PredCst, Preference))
        Result.emplace_back(KC, P);
    }

    return !Result.empty();
  }

  /// If I is a PHI node, then we know the incoming values for any constants.
  /// Non-constant incoming values get one more chance through LazyValueInfo on
  /// the corresponding edge.
  if (PHINode *PN = dyn_cast<PHINode>(I)) {
    for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) {
      Value *InVal = PN->getIncomingValue(i);
      if (Constant *KC = getKnownConstant(InVal, Preference)) {
        Result.emplace_back(KC, PN->getIncomingBlock(i));
      } else {
        Constant *CI = LVI->getConstantOnEdge(InVal,
                                              PN->getIncomingBlock(i),
                                              BB, CxtI);
        if (Constant *KC = getKnownConstant(CI, Preference))
          Result.emplace_back(KC, PN->getIncomingBlock(i));
      }
    }

    return !Result.empty();
  }

  // Handle Cast instructions: resolve the source operand into a scratch list,
  // then fold the cast over each known value.
  if (CastInst *CI = dyn_cast<CastInst>(I)) {
    Value *Source = CI->getOperand(0);
    PredValueInfoTy Vals;
    computeValueKnownInPredecessorsImpl(Source, BB, Vals, Preference,
                                        RecursionSet, CxtI);
    if (Vals.empty())
      return false;

    // Convert the known values. Entries whose cast does not fold are dropped.
    for (auto &Val : Vals)
      if (Constant *Folded = ConstantFoldCastOperand(CI->getOpcode(), Val.first,
                                                     CI->getType(), DL))
        Result.emplace_back(Folded, Val.second);

    return !Result.empty();
  }

  // Handle freeze: resolve the operand directly into Result, then discard
  // every entry whose constant is not guaranteed to be free of undef/poison.
  if (FreezeInst *FI = dyn_cast<FreezeInst>(I)) {
    Value *Source = FI->getOperand(0);
    computeValueKnownInPredecessorsImpl(Source, BB, Result, Preference,
                                        RecursionSet, CxtI);

    erase_if(Result, [](auto &Pair) {
      return !isGuaranteedNotToBeUndefOrPoison(Pair.first);
    });

    return !Result.empty();
  }

  // Handle some boolean conditions.
  if (I->getType()->getPrimitiveSizeInBits() == 1) {
    using namespace PatternMatch;
    if (Preference != WantInteger)
      return false;
    // X | true -> true
    // X & false -> false
    Value *Op0, *Op1;
    if (match(I, m_LogicalOr(m_Value(Op0), m_Value(Op1))) ||
        match(I, m_LogicalAnd(m_Value(Op0), m_Value(Op1)))) {
      PredValueInfoTy LHSVals, RHSVals;

      computeValueKnownInPredecessorsImpl(Op0, BB, LHSVals, WantInteger,
                                          RecursionSet, CxtI);
      computeValueKnownInPredecessorsImpl(Op1, BB, RHSVals, WantInteger,
                                          RecursionSet, CxtI);

      if (LHSVals.empty() && RHSVals.empty())
        return false;

      // The value that decides the whole expression on its own: true for an
      // or, false for an and.
      ConstantInt *InterestingVal;
      if (match(I, m_LogicalOr()))
        InterestingVal = ConstantInt::getTrue(I->getContext());
      else
        InterestingVal = ConstantInt::getFalse(I->getContext());

      SmallPtrSet<BasicBlock*, 4> LHSKnownBBs;

      // Scan for the sentinel.  If we find an undef, force it to the
      // interesting value: x|undef -> true and x&undef -> false.
      for (const auto &LHSVal : LHSVals)
        if (LHSVal.first == InterestingVal || isa<UndefValue>(LHSVal.first)) {
          Result.emplace_back(InterestingVal, LHSVal.second);
          LHSKnownBBs.insert(LHSVal.second);
        }
      for (const auto &RHSVal : RHSVals)
        if (RHSVal.first == InterestingVal || isa<UndefValue>(RHSVal.first)) {
          // If we already inferred a value for this block on the LHS, don't
          // re-add it.
          if (!LHSKnownBBs.count(RHSVal.second))
            Result.emplace_back(InterestingVal, RHSVal.second);
        }

      return !Result.empty();
    }

    // Handle the NOT form of XOR.
    if (I->getOpcode() == Instruction::Xor &&
        isa<ConstantInt>(I->getOperand(1)) &&
        cast<ConstantInt>(I->getOperand(1))->isOne()) {
      computeValueKnownInPredecessorsImpl(I->getOperand(0), BB, Result,
                                          WantInteger, RecursionSet, CxtI);
      if (Result.empty())
        return false;

      // Invert the known values.
      for (auto &R : Result)
        R.first = ConstantExpr::getNot(R.first);

      return true;
    }

  // Try to simplify some other binary operator values.
  } else if (BinaryOperator *BO = dyn_cast<BinaryOperator>(I)) {
    if (Preference != WantInteger)
      return false;
    // Only a constant-integer right-hand side is handled.
    if (ConstantInt *CI = dyn_cast<ConstantInt>(BO->getOperand(1))) {
      PredValueInfoTy LHSVals;
      computeValueKnownInPredecessorsImpl(BO->getOperand(0), BB, LHSVals,
                                          WantInteger, RecursionSet, CxtI);

      // Try to use constant folding to simplify the binary operator.
      for (const auto &LHSVal : LHSVals) {
        Constant *V = LHSVal.first;
        Constant *Folded =
            ConstantFoldBinaryOpOperands(BO->getOpcode(), V, CI, DL);

        if (Constant *KC = getKnownConstant(Folded, WantInteger))
          Result.emplace_back(KC, LHSVal.second);
      }
    }

    return !Result.empty();
  }

  // Handle compare with phi operand, where the PHI is defined in this block.
  if (CmpInst *Cmp = dyn_cast<CmpInst>(I)) {
    if (Preference != WantInteger)
      return false;
    Type *CmpType = Cmp->getType();
    Value *CmpLHS = Cmp->getOperand(0);
    Value *CmpRHS = Cmp->getOperand(1);
    CmpInst::Predicate Pred = Cmp->getPredicate();

    // Prefer a PHI on the left-hand side; otherwise try the right-hand side.
    PHINode *PN = dyn_cast<PHINode>(CmpLHS);
    if (!PN)
      PN = dyn_cast<PHINode>(CmpRHS);
    // Do not perform phi translation across a loop header phi, because this
    // may result in comparison of values from two different loop iterations.
    // FIXME: This check is broken if LoopHeaders is not populated.
    if (PN && PN->getParent() == BB && !LoopHeaders.contains(BB)) {
      const DataLayout &DL = PN->getDataLayout();
      // We can do this simplification if any comparisons fold to true or false.
      // See if any do.
      for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) {
        BasicBlock *PredBB = PN->getIncomingBlock(i);
        Value *LHS, *RHS;
        if (PN == CmpLHS) {
          LHS = PN->getIncomingValue(i);
          RHS = CmpRHS->DoPHITranslation(BB, PredBB);
        } else {
          LHS = CmpLHS->DoPHITranslation(BB, PredBB);
          RHS = PN->getIncomingValue(i);
        }
        Value *Res = simplifyCmpInst(Pred, LHS, RHS, {DL});
        if (!Res) {
          // Simplification failed; LazyValueInfo can only help when the
          // right-hand side is a constant.
          if (!isa<Constant>(RHS))
            continue;

          // getPredicateOnEdge call will make no sense if LHS is defined in BB.
          auto LHSInst = dyn_cast<Instruction>(LHS);
          if (LHSInst && LHSInst->getParent() == BB)
            continue;

          Res = LVI->getPredicateOnEdge(Pred, LHS, cast<Constant>(RHS), PredBB,
                                        BB, CxtI ? CxtI : Cmp);
        }

        if (Constant *KC = getKnownConstant(Res, WantInteger))
          Result.emplace_back(KC, PredBB);
      }

      return !Result.empty();
    }

    // If comparing a live-in value against a constant, see if we know the
    // live-in value on any predecessors.
    if (isa<Constant>(CmpRHS) && !CmpType->isVectorTy()) {
      Constant *CmpConst = cast<Constant>(CmpRHS);

      if (!isa<Instruction>(CmpLHS) ||
          cast<Instruction>(CmpLHS)->getParent() != BB) {
        for (BasicBlock *P : predecessors(BB)) {
          // If the value is known by LazyValueInfo to be a constant in a
          // predecessor, use that information to try to thread this block.
          Constant *Res = LVI->getPredicateOnEdge(Pred, CmpLHS, CmpConst, P, BB,
                                                  CxtI ? CxtI : Cmp);
          if (Constant *KC = getKnownConstant(Res, WantInteger))
            Result.emplace_back(KC, P);
        }

        return !Result.empty();
      }

      // InstCombine can fold some forms of constant range checks into
      // (icmp (add (x, C1)), C2). See if we have such a thing with
      // x as a live-in.
      {
        using namespace PatternMatch;

        Value *AddLHS;
        ConstantInt *AddConst;
        if (isa<ConstantInt>(CmpConst) &&
            match(CmpLHS, m_Add(m_Value(AddLHS), m_ConstantInt(AddConst)))) {
          if (!isa<Instruction>(AddLHS) ||
              cast<Instruction>(AddLHS)->getParent() != BB) {
            for (BasicBlock *P : predecessors(BB)) {
              // If the value is known by LazyValueInfo to be a ConstantRange in
              // a predecessor, use that information to try to thread this
              // block.
              ConstantRange CR = LVI->getConstantRangeOnEdge(
                  AddLHS, P, BB, CxtI ? CxtI : cast<Instruction>(CmpLHS));
              // Propagate the range through the addition.
              CR = CR.add(AddConst->getValue());

              // Get the range where the compare returns true.
              ConstantRange CmpRange = ConstantRange::makeExactICmpRegion(
                  Pred, cast<ConstantInt>(CmpConst)->getValue());

              // The compare is decided on this edge only if the value's range
              // lies entirely inside the true region or entirely inside its
              // inverse; otherwise nothing is recorded for this predecessor.
              Constant *ResC;
              if (CmpRange.contains(CR))
                ResC = ConstantInt::getTrue(CmpType);
              else if (CmpRange.inverse().contains(CR))
                ResC = ConstantInt::getFalse(CmpType);
              else
                continue;

              Result.emplace_back(ResC, P);
            }

            return !Result.empty();
          }
        }
      }

      // Try to find a constant value for the LHS of a comparison,
      // and evaluate it statically if we can.
      PredValueInfoTy LHSVals;
      computeValueKnownInPredecessorsImpl(I->getOperand(0), BB, LHSVals,
                                          WantInteger, RecursionSet, CxtI);

      for (const auto &LHSVal : LHSVals) {
        Constant *V = LHSVal.first;
        Constant *Folded =
            ConstantFoldCompareInstOperands(Pred, V, CmpConst, DL);
        if (Constant *KC = getKnownConstant(Folded, WantInteger))
          Result.emplace_back(KC, LHSVal.second);
      }

      return !Result.empty();
    }
  }

  if (SelectInst *SI = dyn_cast<SelectInst>(I)) {
    // Handle select instructions where at least one operand is a known constant
    // and we can figure out the condition value for any predecessor block.
    Constant *TrueVal = getKnownConstant(SI->getTrueValue(), Preference);
    Constant *FalseVal = getKnownConstant(SI->getFalseValue(), Preference);
    PredValueInfoTy Conds;
    if ((TrueVal || FalseVal) &&
        computeValueKnownInPredecessorsImpl(SI->getCondition(), BB, Conds,
                                            WantInteger, RecursionSet, CxtI)) {
      for (auto &C : Conds) {
        Constant *Cond = C.first;

        // Figure out what value to use for the condition.
        bool KnownCond;
        if (ConstantInt *CI = dyn_cast<ConstantInt>(Cond)) {
          // A known boolean.
          KnownCond = CI->isOne();
        } else {
          assert(isa<UndefValue>(Cond) && "Unexpected condition value");
          // Either operand will do, so be sure to pick the one that's a known
          // constant.
          // FIXME: Do this more cleverly if both values are known constants?
          KnownCond = (TrueVal != nullptr);
        }

        // See if the select has a known constant value for this predecessor.
        if (Constant *Val = KnownCond ? TrueVal : FalseVal)
          Result.emplace_back(Val, C.second);
      }

      return !Result.empty();
    }
  }

  // If all else fails, see if LVI can figure out a constant value for us.
  // Note that CxtI is dereferenced here, so it must be non-null on this path.
  assert(CxtI->getParent() == BB && "CxtI should be in BB");
  Constant *CI = LVI->getConstant(V, CxtI);
  if (Constant *KC = getKnownConstant(CI, Preference)) {
    for (BasicBlock *Pred : predecessors(BB))
      Result.emplace_back(KC, Pred);
  }

  return !Result.empty();
}


/// getBestDestForJumpOnUndef - Choose a successor for a block whose terminator
/// jumps on an undefined value.
///
/// Any successor is a legal target, so the one that currently has the fewest
/// predecessors is selected; this should lower the in-degree of the remaining
/// successors.  On a tie the earliest successor in terminator order wins.
///
/// \returns the index (into BB's terminator successor list) of the chosen
/// successor.
static unsigned getBestDestForJumpOnUndef(BasicBlock *BB) {
  Instruction *Term = BB->getTerminator();

  // Start with successor 0 as the candidate and try to beat it.
  unsigned BestIdx = 0;
  unsigned FewestPreds = pred_size(Term->getSuccessor(BestIdx));

  for (unsigned Idx = 1, NumSuccs = Term->getNumSuccessors(); Idx != NumSuccs;
       ++Idx) {
    unsigned PredCount = pred_size(Term->getSuccessor(Idx));
    // Strict comparison: an equally good later successor does not replace the
    // current candidate.
    if (PredCount >= FewestPreds)
      continue;
    BestIdx = Idx;
    FewestPreds = PredCount;
  }

  return BestIdx;
}


/// Return true if the address of \p BB is taken and the resulting BlockAddress
/// still has users once dead constant users have been removed.
static bool hasAddressTakenAndUsed(BasicBlock *BB) {
  if (BB->hasAddressTaken()) {
    // The block address may only be referenced by a tree of dead constants.
    // Those shouldn't keep the block alive, so prune them before checking for
    // remaining uses.
    BlockAddress *Addr = BlockAddress::get(BB);
    Addr->removeDeadConstantUsers();
    return !Addr->use_empty();
  }

  return false;
}


/// processBlock - If there are any predecessors whose control can be threaded
/// through to a successor, transform them now.
///
/// The simplifications below are attempted in a fixed order, and the function
/// returns as soon as one of them reports a change.
///
/// \param BB The block whose terminator is examined.
/// \returns true if one of the attempted simplifications reported a change.
/// When the (possibly folded) condition is not an instruction and no edge
/// could be threaded, the result is whether the condition was constant folded
/// during this call.
bool JumpThreadingPass::processBlock(BasicBlock *BB) {
  // If the block is trivially dead, just return and let the caller nuke it.
  // This simplifies other transformations.
  if (DTU->isBBPendingDeletion(BB) ||
      (pred_empty(BB) && BB != &BB->getParent()->getEntryBlock()))
    return false;

  // If this block has a single predecessor, and if that pred has a single
  // successor, merge the blocks.  This encourages recursive jump threading
  // because now the condition in this block can be threaded through
  // predecessors of our predecessor block.
  if (maybeMergeBasicBlockIntoOnlyPred(BB))
    return true;

  if (tryToUnfoldSelectInCurrBB(BB))
    return true;

  // Look if we can propagate guards to predecessors.
  if (HasGuards && processGuards(BB))
    return true;

  // What kind of constant we're looking for.
  ConstantPreference Preference = WantInteger;

  // Look to see if the terminator is a conditional branch, switch or indirect
  // branch, if not we can't thread it.
  Value *Condition;
  Instruction *Terminator = BB->getTerminator();
  if (BranchInst *BI = dyn_cast<BranchInst>(Terminator)) {
    // Can't thread an unconditional jump.
    if (BI->isUnconditional()) return false;
    Condition = BI->getCondition();
  } else if (SwitchInst *SI = dyn_cast<SwitchInst>(Terminator)) {
    Condition = SI->getCondition();
  } else if (IndirectBrInst *IB = dyn_cast<IndirectBrInst>(Terminator)) {
    // Can't thread indirect branch with no successors.
    if (IB->getNumSuccessors() == 0) return false;
    // For an indirect branch the "condition" is the target address (with
    // pointer casts stripped), so we look for block addresses rather than
    // integers.
    Condition = IB->getAddress()->stripPointerCasts();
    Preference = WantBlockAddress;
  } else {
    return false; // Must be an invoke or callbr.
  }

  // Keep track if we constant folded the condition in this invocation.
  bool ConstantFolded = false;

  // Run constant folding to see if we can reduce the condition to a simple
  // constant.
  if (Instruction *I = dyn_cast<Instruction>(Condition)) {
    Value *SimpleVal =
        ConstantFoldInstruction(I, BB->getDataLayout(), TLI);
    if (SimpleVal) {
      // Redirect every user of the instruction to the folded value, and drop
      // the instruction itself if that left it trivially dead.
      I->replaceAllUsesWith(SimpleVal);
      if (isInstructionTriviallyDead(I, TLI))
        I->eraseFromParent();
      Condition = SimpleVal;
      ConstantFolded = true;
    }
  }

  // If the terminator is branching on an undef or freeze undef, we can pick any
  // of the successors to branch to.  Let getBestDestForJumpOnUndef decide.
  auto *FI = dyn_cast<FreezeInst>(Condition);
  if (isa<UndefValue>(Condition) ||
      (FI && isa<UndefValue>(FI->getOperand(0)) && FI->hasOneUse())) {
    unsigned BestSucc = getBestDestForJumpOnUndef(BB);
    std::vector<DominatorTree::UpdateType> Updates;

    // Fold the branch/switch.
    Instruction *BBTerm = BB->getTerminator();
    Updates.reserve(BBTerm->getNumSuccessors());
    // Detach BB from every successor except the chosen one, recording the
    // deleted edges for the dominator tree updater.
    for (unsigned i = 0, e = BBTerm->getNumSuccessors(); i != e; ++i) {
      if (i == BestSucc) continue;
      BasicBlock *Succ = BBTerm->getSuccessor(i);
      Succ->removePredecessor(BB, true);
      Updates.push_back({DominatorTree::Delete, BB, Succ});
    }

    LLVM_DEBUG(dbgs() << "  In block '" << BB->getName()
                      << "' folding undef terminator: " << *BBTerm << '\n');
    // Insert the unconditional branch before the old terminator, then remove
    // the old terminator.
    Instruction *NewBI = BranchInst::Create(BBTerm->getSuccessor(BestSucc), BBTerm->getIterator());
    NewBI->setDebugLoc(BBTerm->getDebugLoc());
    ++NumFolds;
    BBTerm->eraseFromParent();
    DTU->applyUpdatesPermissive(Updates);
    // If the condition was a freeze, it is erased only now, after the
    // terminator that used it is gone. Note that FI may be non-null even when
    // this path was entered through the plain-undef check.
    if (FI)
      FI->eraseFromParent();
    return true;
  }

  // If the terminator of this block is branching on a constant, simplify the
  // terminator to an unconditional branch.  This can occur due to threading in
  // other blocks.
  if (getKnownConstant(Condition, Preference)) {
    LLVM_DEBUG(dbgs() << "  In block '" << BB->getName()
                      << "' folding terminator: " << *BB->getTerminator()
                      << '\n');
    ++NumFolds;
    ConstantFoldTerminator(BB, true, nullptr, DTU.get());
    // Drop any branch probability info recorded for BB, if BPI is available.
    if (auto *BPI = getBPI())
      BPI->eraseBlock(BB);
    return true;
  }

  Instruction *CondInst = dyn_cast<Instruction>(Condition);

  // All the rest of our checks depend on the condition being an instruction.
  if (!CondInst) {
    // FIXME: Unify this with code below.
    if (processThreadableEdges(Condition, BB, Preference, Terminator))
      return true;
    // Nothing was threaded; still report a change if the condition was
    // constant folded above.
    return ConstantFolded;
  }

  // Some of the following optimization can safely work on the unfrozen cond.
  Value *CondWithoutFreeze = CondInst;
  if (auto *FI = dyn_cast<FreezeInst>(CondInst))
    CondWithoutFreeze = FI->getOperand(0);

  if (CmpInst *CondCmp = dyn_cast<CmpInst>(CondWithoutFreeze)) {
    // If we're branching on a conditional, LVI might be able to determine
    // its value at the branch instruction.  We only handle comparisons
    // against a constant at this time.
    if (Constant *CondConst = dyn_cast<Constant>(CondCmp->getOperand(1))) {
      Constant *Res =
          LVI->getPredicateAt(CondCmp->getPredicate(), CondCmp->getOperand(0),
                              CondConst, BB->getTerminator(),
                              /*UseBlockValue=*/false);
      if (Res) {
        // We can safely replace *some* uses of the CondInst if it has
        // exactly one value as returned by LVI. RAUW is incorrect in the
        // presence of guards and assumes, that have the `Cond` as the use. This
        // is because we use the guards/assume to reason about the `Cond` value
        // at the end of block, but RAUW unconditionally replaces all uses
        // including the guards/assumes themselves and the uses before the
        // guard/assume.
        if (replaceFoldableUses(CondCmp, Res, BB))
          return true;
      }

      // We did not manage to simplify this branch, try to see whether
      // CondCmp depends on a known phi-select pattern.
      if (tryToUnfoldSelect(CondCmp, BB))
        return true;
    }
  }

  // For a switch terminator, try the switch overload of tryToUnfoldSelect.
  if (SwitchInst *SI = dyn_cast<SwitchInst>(BB->getTerminator()))
    if (tryToUnfoldSelect(SI, BB))
      return true;

  // Check for some cases that are worth simplifying.  Right now we want to look
  // for loads that are used by a switch or by the condition for the branch.  If
  // we see one, check to see if it's partially redundant.  If so, insert a PHI
  // which can then be used to thread the values.
  Value *SimplifyValue = CondWithoutFreeze;

  // For a compare against a constant, the interesting value is the compared
  // (non-constant) operand.
  if (CmpInst *CondCmp = dyn_cast<CmpInst>(SimplifyValue))
    if (isa<Constant>(CondCmp->getOperand(1)))
      SimplifyValue = CondCmp->getOperand(0);

  // TODO: There are other places where load PRE would be profitable, such as
  // more complex comparisons.
  if (LoadInst *LoadI = dyn_cast<LoadInst>(SimplifyValue))
    if (simplifyPartiallyRedundantLoad(LoadI))
      return true;

  // Before threading, try to propagate profile data backwards:
  if (PHINode *PN = dyn_cast<PHINode>(CondInst))
    if (PN->getParent() == BB && isa<BranchInst>(BB->getTerminator()))
      updatePredecessorProfileMetadata(PN, BB);

  // Handle a variety of cases where we are branching on something derived from
  // a PHI node in the current block.  If we can prove that any predecessors
  // compute a predictable value based on a PHI node, thread those predecessors.
  if (processThreadableEdges(CondInst, BB, Preference, Terminator))
    return true;

  // If this is an otherwise-unfoldable branch on a phi node or freeze(phi) in
  // the current block, see if we can simplify.
  // Note: this returns processBranchOnPHI's result directly, so the XOR and
  // implied-condition checks below are not attempted for such branches.
  PHINode *PN = dyn_cast<PHINode>(CondWithoutFreeze);
  if (PN && PN->getParent() == BB && isa<BranchInst>(BB->getTerminator()))
    return processBranchOnPHI(PN);

  // If this is an otherwise-unfoldable branch on a XOR, see if we can simplify.
  // As above, the result is returned directly and the implied-condition check
  // is skipped.
  if (CondInst->getOpcode() == Instruction::Xor &&
      CondInst->getParent() == BB && isa<BranchInst>(BB->getTerminator()))
    return processBranchOnXOR(cast<BinaryOperator>(CondInst));

  // Search for a stronger dominating condition that can be used to simplify a
  // conditional branch leaving BB.
  if (processImpliedCondition(BB))
    return true;

  return false;
}


/// Try to fold the conditional branch that ends \p BB using the branch
/// condition of a block further up its chain of single predecessors.
///
/// At most ImplicationSearchThreshold predecessor blocks are inspected.
/// \returns true if BB's conditional branch was replaced by an unconditional
/// one.
bool JumpThreadingPass::processImpliedCondition(BasicBlock *BB) {
  auto *BI = dyn_cast<BranchInst>(BB->getTerminator());
  if (!BI || !BI->isConditional())
    return false;

  // Suppose the predecessor's branch was taken towards us and its condition
  // implies Cond.  Then Cond is true, undef, or poison, which makes
  // freeze(Cond) either true or a nondeterministic value.  When freeze(Cond)
  // has a single use, folding it to true cannot affect any other instruction,
  // so in that case we reason about the operand of the freeze instead.
  Value *Cond = BI->getCondition();
  FreezeInst *FICond = nullptr;
  if (auto *Frozen = dyn_cast<FreezeInst>(Cond)) {
    if (Frozen->hasOneUse()) {
      FICond = Frozen;
      Cond = Frozen->getOperand(0);
    }
  }

  auto &DL = BB->getDataLayout();

  // Climb the chain of single predecessors, bounded by the search threshold.
  unsigned Iter = 0;
  for (BasicBlock *CurrentBB = BB, *CurrentPred = BB->getSinglePredecessor();
       CurrentPred && Iter++ < ImplicationSearchThreshold;
       CurrentBB = CurrentPred,
                  CurrentPred = CurrentBB->getSinglePredecessor()) {
    auto *PBI = dyn_cast<BranchInst>(CurrentPred->getTerminator());
    if (!PBI || !PBI->isConditional())
      return false;

    // True when CurrentBB is reached through the predecessor's first
    // successor edge.
    const bool CondIsTrue = PBI->getSuccessor(0) == CurrentBB;
    if (!CondIsTrue && PBI->getSuccessor(1) != CurrentBB)
      return false;

    Value *PredCond = PBI->getCondition();
    std::optional<bool> Implication =
        isImpliedCondition(PredCond, Cond, DL, CondIsTrue);

    // When both branches test a freeze of the very same value, the outcome
    // of BB's branch is CondIsTrue.
    if (!Implication && FICond)
      if (auto *PredFreeze = dyn_cast<FreezeInst>(PredCond))
        if (PredFreeze->getOperand(0) == FICond->getOperand(0))
          Implication = CondIsTrue;

    if (!Implication)
      continue;

    // The branch outcome is known: keep the live successor, drop the other.
    const unsigned KeepIdx = *Implication ? 0 : 1;
    BasicBlock *KeepSucc = BI->getSuccessor(KeepIdx);
    BasicBlock *RemoveSucc = BI->getSuccessor(1 - KeepIdx);
    RemoveSucc->removePredecessor(BB);

    BranchInst *UncondBI = BranchInst::Create(KeepSucc, BI->getIterator());
    UncondBI->setDebugLoc(BI->getDebugLoc());
    ++NumFolds;
    BI->eraseFromParent();
    // The single-use freeze only fed the branch that was just erased.
    if (FICond)
      FICond->eraseFromParent();

    DTU->applyUpdatesPermissive({{DominatorTree::Delete, BB, RemoveSucc}});
    if (auto *BPI = getBPI())
      BPI->eraseBlock(BB);
    return true;
  }

  return false;
}


/// Return true if \p Op is an instruction whose parent block is \p BB.
/// Values that are not instructions are never considered defined in a block.
static bool isOpDefinedInBlock(Value *Op, BasicBlock *BB) {
  auto *Def = dyn_cast<Instruction>(Op);
  return Def && Def->getParent() == BB;
}


/// simplifyPartiallyRedundantLoad - If LoadI is an obviously partially
/// redundant load instruction, eliminate it by replacing it with a PHI node.
/// This is an important optimization that encourages jump threading, and needs
/// to be run interlaced with other jump threading tasks.
///
/// Two outcomes replace the load:
///  - the value is already available earlier in the load's own block, in
///    which case the load's uses are redirected to that value; or
///  - the value is available in at least one predecessor, in which case a
///    load is inserted on the (possibly newly split) unavailable edge and a
///    PHI merging the per-predecessor values replaces the load.
///
/// \param LoadI The load to examine; it is erased when the function succeeds.
/// \returns true if the load was replaced and erased, false if nothing
/// changed.
bool JumpThreadingPass::simplifyPartiallyRedundantLoad(LoadInst *LoadI) {
  // Don't hack volatile and ordered loads.
  if (!LoadI->isUnordered()) return false;

  // If the load is defined in a block with exactly one predecessor, it can't be
  // partially redundant.
  BasicBlock *LoadBB = LoadI->getParent();
  if (LoadBB->getSinglePredecessor())
    return false;

  // If the load is defined in an EH pad, it can't be partially redundant,
  // because the edges between the invoke and the EH pad cannot have other
  // instructions between them.
  if (LoadBB->isEHPad())
    return false;

  Value *LoadedPtr = LoadI->getOperand(0);

  // If the loaded operand is defined in the LoadBB and it's not a phi,
  // it can't be available in predecessors.
  if (isOpDefinedInBlock(LoadedPtr, LoadBB) && !isa<PHINode>(LoadedPtr))
    return false;

  // Scan a few instructions up from the load, to see if it is obviously live at
  // the entry to its block.
  BasicBlock::iterator BBIt(LoadI);
  bool IsLoadCSE;
  BatchAAResults BatchAA(*AA);
  // The dominator tree is updated lazily and may not be valid at this point.
  BatchAA.disableDominatorTree();
  if (Value *AvailableVal = FindAvailableLoadedValue(
          LoadI, LoadBB, BBIt, DefMaxInstsToScan, &BatchAA, &IsLoadCSE)) {
    // If the value of the load is locally available within the block, just use
    // it.  This frequently occurs for reg2mem'd allocas.

    // When the available value is itself a load, merge the metadata of both
    // loads onto it and make LVI forget what it knew about that load.
    if (IsLoadCSE) {
      LoadInst *NLoadI = cast<LoadInst>(AvailableVal);
      combineMetadataForCSE(NLoadI, LoadI, false);
      LVI->forgetValue(NLoadI);
    };

    // If the returned value is the load itself, replace with poison. This can
    // only happen in dead loops.
    if (AvailableVal == LoadI)
      AvailableVal = PoisonValue::get(LoadI->getType());
    // Insert a bit-or-pointer cast before the load if the available value has
    // a different type than the load.
    if (AvailableVal->getType() != LoadI->getType()) {
      AvailableVal = CastInst::CreateBitOrPointerCast(
          AvailableVal, LoadI->getType(), "", LoadI->getIterator());
      cast<Instruction>(AvailableVal)->setDebugLoc(LoadI->getDebugLoc());
    }
    LoadI->replaceAllUsesWith(AvailableVal);
    LoadI->eraseFromParent();
    return true;
  }

  // Otherwise, if we scanned the whole block and got to the top of the block,
  // we know the block is locally transparent to the load.  If not, something
  // might clobber its value.
  if (BBIt != LoadBB->begin())
    return false;

  // If all of the loads and stores that feed the value have the same AA tags,
  // then we can propagate them onto any newly inserted loads.
  AAMDNodes AATags = LoadI->getAAMetadata();

  // Unique predecessors visited so far; a predecessor may appear several times
  // in predecessors(LoadBB) when it has multiple edges into LoadBB.
  SmallPtrSet<BasicBlock*, 8> PredsScanned;

  using AvailablePredsTy = SmallVector<std::pair<BasicBlock *, Value *>, 8>;

  // (predecessor, value available at the end of that predecessor) pairs.
  AvailablePredsTy AvailablePreds;
  // The most recently seen predecessor in which the value is NOT available.
  BasicBlock *OneUnavailablePred = nullptr;
  // Predecessor loads that supply the value; their metadata is merged with
  // LoadI's once the transformation is committed.
  SmallVector<LoadInst*, 8> CSELoads;

  // If we got here, the loaded value is transparent through to the start of the
  // block.  Check to see if it is available in any of the predecessor blocks.
  for (BasicBlock *PredBB : predecessors(LoadBB)) {
    // If we already scanned this predecessor, skip it.
    if (!PredsScanned.insert(PredBB).second)
      continue;

    BBIt = PredBB->end();
    unsigned NumScanedInst = 0;
    Value *PredAvailable = nullptr;
    // NOTE: We don't CSE load that is volatile or anything stronger than
    // unordered, that should have been checked when we entered the function.
    assert(LoadI->isUnordered() &&
           "Attempting to CSE volatile or atomic loads");
    // If this is a load on a phi pointer, phi-translate it and search
    // for available load/store to the pointer in predecessors.
    Type *AccessTy = LoadI->getType();
    const auto &DL = LoadI->getDataLayout();
    MemoryLocation Loc(LoadedPtr->DoPHITranslation(LoadBB, PredBB),
                       LocationSize::precise(DL.getTypeStoreSize(AccessTy)),
                       AATags);
    PredAvailable = findAvailablePtrLoadStore(
        Loc, AccessTy, LoadI->isAtomic(), PredBB, BBIt, DefMaxInstsToScan,
        &BatchAA, &IsLoadCSE, &NumScanedInst);

    // If PredBB has a single predecessor, continue scanning through the
    // single predecessor.
    // The walk continues only while the previous scan reached the top of its
    // block and the overall instruction budget is not exhausted.
    BasicBlock *SinglePredBB = PredBB;
    while (!PredAvailable && SinglePredBB && BBIt == SinglePredBB->begin() &&
           NumScanedInst < DefMaxInstsToScan) {
      SinglePredBB = SinglePredBB->getSinglePredecessor();
      if (SinglePredBB) {
        BBIt = SinglePredBB->end();
        PredAvailable = findAvailablePtrLoadStore(
            Loc, AccessTy, LoadI->isAtomic(), SinglePredBB, BBIt,
            (DefMaxInstsToScan - NumScanedInst), &BatchAA, &IsLoadCSE,
            &NumScanedInst);
      }
    }

    if (!PredAvailable) {
      OneUnavailablePred = PredBB;
      continue;
    }

    if (IsLoadCSE)
      CSELoads.push_back(cast<LoadInst>(PredAvailable));

    // If so, this load is partially redundant.  Remember this info so that we
    // can create a PHI node.
    AvailablePreds.emplace_back(PredBB, PredAvailable);
  }

  // If the loaded value isn't available in any predecessor, it isn't partially
  // redundant.
  if (AvailablePreds.empty()) return false;

  // Okay, the loaded value is available in at least one (and maybe all!)
  // predecessors.  If the value is unavailable in more than one unique
  // predecessor, we want to insert a merge block for those common predecessors.
  // This ensures that we only have to insert one reload, thus not increasing
  // code size.
  BasicBlock *UnavailablePred = nullptr;

  // If the value is unavailable in one of predecessors, we will end up
  // inserting a new instruction into them. It is only valid if all the
  // instructions before LoadI are guaranteed to pass execution to its
  // successor, or if LoadI is safe to speculate.
  // TODO: If this logic becomes more complex, and we will perform PRE insertion
  // farther than to a predecessor, we need to reuse the code from GVN's PRE.
  // It requires domination tree analysis, so for this simple case it is an
  // overkill.
  if (PredsScanned.size() != AvailablePreds.size() &&
      !isSafeToSpeculativelyExecute(LoadI))
    for (auto I = LoadBB->begin(); &*I != LoadI; ++I)
      if (!isGuaranteedToTransferExecutionToSuccessor(&*I))
        return false;

  // If there is exactly one predecessor where the value is unavailable, the
  // already computed 'OneUnavailablePred' block is it.  If it ends in an
  // unconditional branch, we know that it isn't a critical edge.
  if (PredsScanned.size() == AvailablePreds.size()+1 &&
      OneUnavailablePred->getTerminator()->getNumSuccessors() == 1) {
    UnavailablePred = OneUnavailablePred;
  } else if (PredsScanned.size() != AvailablePreds.size()) {
    // Otherwise, we had multiple unavailable predecessors or we had a critical
    // edge from the one.
    SmallVector<BasicBlock*, 8> PredsToSplit;
    SmallPtrSet<BasicBlock*, 8> AvailablePredSet;

    for (const auto &AvailablePred : AvailablePreds)
      AvailablePredSet.insert(AvailablePred.first);

    // Add all the unavailable predecessors to the PredsToSplit list.
    for (BasicBlock *P : predecessors(LoadBB)) {
      // If the predecessor is an indirect goto, we can't split the edge.
      if (isa<IndirectBrInst>(P->getTerminator()))
        return false;

      if (!AvailablePredSet.count(P))
        PredsToSplit.push_back(P);
    }

    // Split them out to their own block.
    UnavailablePred = splitBlockPreds(LoadBB, PredsToSplit, "thread-pre-split");
  }

  // If the value isn't available in all predecessors, then there will be
  // exactly one where it isn't available.  Insert a load on that edge and add
  // it to the AvailablePreds list.
  if (UnavailablePred) {
    assert(UnavailablePred->getTerminator()->getNumSuccessors() == 1 &&
           "Can't handle critical edge here!");
    // The new load copies LoadI's type, alignment, ordering and sync scope,
    // uses the phi-translated pointer for this edge, and is placed right
    // before the predecessor's terminator.
    LoadInst *NewVal = new LoadInst(
        LoadI->getType(), LoadedPtr->DoPHITranslation(LoadBB, UnavailablePred),
        LoadI->getName() + ".pr", false, LoadI->getAlign(),
        LoadI->getOrdering(), LoadI->getSyncScopeID(),
        UnavailablePred->getTerminator()->getIterator());
    NewVal->setDebugLoc(LoadI->getDebugLoc());
    if (AATags)
      NewVal->setAAMetadata(AATags);

    AvailablePreds.emplace_back(UnavailablePred, NewVal);
  }

  // Now we know that each predecessor of this block has a value in
  // AvailablePreds, sort them for efficient access as we're walking the preds.
  array_pod_sort(AvailablePreds.begin(), AvailablePreds.end());

  // Create a PHI node at the start of the block for the PRE'd load value.
  PHINode *PN = PHINode::Create(LoadI->getType(), pred_size(LoadBB), "");
  PN->insertBefore(LoadBB->begin());
  PN->takeName(LoadI);
  PN->setDebugLoc(LoadI->getDebugLoc());

  // Insert new entries into the PHI for each predecessor.  A single block may
  // have multiple entries here.
  for (BasicBlock *P : predecessors(LoadBB)) {
    // Binary search the sorted list for the first entry whose block is P.
    AvailablePredsTy::iterator I =
        llvm::lower_bound(AvailablePreds, std::make_pair(P, (Value *)nullptr));

    assert(I != AvailablePreds.end() && I->first == P &&
           "Didn't find entry for predecessor!");

    // If we have an available predecessor but it requires casting, insert the
    // cast in the predecessor and use the cast. Note that we have to update the
    // AvailablePreds vector as we go so that all of the PHI entries for this
    // predecessor use the same bitcast.
    Value *&PredV = I->second;
    if (PredV->getType() != LoadI->getType())
      PredV = CastInst::CreateBitOrPointerCast(
          PredV, LoadI->getType(), "", P->getTerminator()->getIterator());

    PN->addIncoming(PredV, I->first);
  }

  // Merge LoadI's metadata with each predecessor load that now feeds the PHI,
  // and make LVI forget what it knew about those loads.
  for (LoadInst *PredLoadI : CSELoads) {
    combineMetadataForCSE(PredLoadI, LoadI, true);
    LVI->forgetValue(PredLoadI);
  }

  LoadI->replaceAllUsesWith(PN);
  LoadI->eraseFromParent();

  return true;
}


/// findMostPopularDest - Given a non-empty list of (predecessor, destination)
/// pairs describing threadable edges, return the destination named most
/// often.
///
/// Null destinations stand for 'undef' and are never counted: threading to a
/// known, real destination is preferred, and undef edges are dealt with later
/// if interesting.  Consequently nullptr is returned only when no entry names
/// a real destination.
static BasicBlock *
findMostPopularDest(BasicBlock *BB,
                    const SmallVectorImpl<std::pair<BasicBlock *,
                                          BasicBlock *>> &PredToDestList) {
  assert(!PredToDestList.empty());

  // Seed the tally with nullptr followed by BB's successors in successor-list
  // order.  The MapVector keeps that insertion order, so the scan for the
  // maximum below is deterministic, and the leading nullptr entry (count 0)
  // is what gets returned when nothing real was counted.
  MapVector<BasicBlock *, unsigned> Tally;
  Tally[nullptr] = 0;
  for (BasicBlock *Succ : successors(BB))
    Tally[Succ] = 0;

  // Count one vote per entry that has a real destination.
  for (const auto &Entry : PredToDestList) {
    BasicBlock *Dest = Entry.second;
    if (!Dest)
      continue;
    Tally[Dest]++;
  }

  // The entry with the highest count is the winner.
  return llvm::max_element(Tally, llvm::less_second())->first;
}


// Try to compute a constant for V under the assumption that control flows
// from PredPredBB into BB->getSinglePredecessor() and from there into BB.
// Returns nullptr when no constant can be determined.
Constant *JumpThreadingPass::evaluateOnPredecessorEdge(BasicBlock *BB,
                                                       BasicBlock *PredPredBB,
                                                       Value *V,
                                                       const DataLayout &DL) {
  BasicBlock *PredBB = BB->getSinglePredecessor();
  assert(PredBB && "Expected a single predecessor");

  // A constant evaluates to itself.
  if (auto *AlreadyConst = dyn_cast<Constant>(V))
    return AlreadyConst;

  // Anything that is not an instruction living in BB or PredBB is handed to
  // LVI, queried on the PredPredBB -> PredBB edge.
  auto *Inst = dyn_cast<Instruction>(V);
  const bool IsLocal =
      Inst && (Inst->getParent() == BB || Inst->getParent() == PredBB);
  if (!IsLocal)
    return LVI->getConstantOnEdge(V, PredPredBB, PredBB, nullptr);

  // A PHI in PredBB is resolved through its incoming value for PredPredBB;
  // a PHI located anywhere else is not handled.
  if (auto *Phi = dyn_cast<PHINode>(Inst))
    return Phi->getParent() == PredBB
               ? dyn_cast<Constant>(Phi->getIncomingValueForBlock(PredPredBB))
               : nullptr;

  // The only other supported instruction is a compare that lives in BB.
  auto *Cmp = dyn_cast<CmpInst>(Inst);
  if (!Cmp || Cmp->getParent() != BB)
    return nullptr;

  // Evaluate both operands on the same edge, then fold the comparison if
  // both turned out to be constants.
  Constant *LHS =
      evaluateOnPredecessorEdge(BB, PredPredBB, Cmp->getOperand(0), DL);
  Constant *RHS =
      evaluateOnPredecessorEdge(BB, PredPredBB, Cmp->getOperand(1), DL);
  if (!LHS || !RHS)
    return nullptr;

  return ConstantFoldCompareInstOperands(Cmp->getPredicate(), LHS, RHS, DL);
}


/// Try to thread (or fold) the terminator of \p BB using values of \p Cond
/// that are known in BB's predecessors.
///
/// If every predecessor leads to the same single destination, the terminator
/// is folded into an unconditional branch instead of duplicating BB.
/// Otherwise the predecessors that agree on the most popular destination are
/// collected and handed to tryThreadEdge.
///
/// \param Cond The value BB's terminator dispatches on.
/// \param BB The block to thread through.
/// \param Preference The kind of constant to look for in predecessors.
/// \param CxtI Context instruction forwarded to
/// computeValueKnownInPredecessors.
/// \returns the result of whichever transformation was attempted (true after a
/// fold), or false when no edge could be threaded.
bool JumpThreadingPass::processThreadableEdges(Value *Cond, BasicBlock *BB,
                                               ConstantPreference Preference,
                                               Instruction *CxtI) {
  // If threading this would thread across a loop header, don't even try to
  // thread the edge.
  if (LoopHeaders.count(BB))
    return false;

  PredValueInfoTy PredValues;
  if (!computeValueKnownInPredecessors(Cond, BB, PredValues, Preference,
                                       CxtI)) {
    // We don't have known values in predecessors.  See if we can thread through
    // BB and its sole predecessor.
    return maybethreadThroughTwoBasicBlocks(BB, Cond);
  }

  assert(!PredValues.empty() &&
         "computeValueKnownInPredecessors returned true with no values");

  LLVM_DEBUG(dbgs() << "IN BB: " << *BB;
             for (const auto &PredValue : PredValues) {
               dbgs() << "  BB '" << BB->getName()
                      << "': FOUND condition = " << *PredValue.first
                      << " for pred '" << PredValue.second->getName() << "'.\n";
  });

  // Decide what we want to thread through.  Convert our list of known values to
  // a list of known destinations for each pred.  This also discards duplicate
  // predecessors and keeps track of the undefined inputs (which are represented
  // as a null dest in the PredToDestList).
  SmallPtrSet<BasicBlock*, 16> SeenPreds;
  SmallVector<std::pair<BasicBlock*, BasicBlock*>, 16> PredToDestList;

  // OnlyDest / OnlyVal track whether all predecessors agree on one destination
  // / one value.  The all-ones pointers are sentinels meaning "more than one
  // distinct destination/value was seen"; they are only compared, never
  // dereferenced.
  BasicBlock *OnlyDest = nullptr;
  BasicBlock *MultipleDestSentinel = (BasicBlock*)(intptr_t)~0ULL;
  Constant *OnlyVal = nullptr;
  Constant *MultipleVal = (Constant *)(intptr_t)~0ULL;

  for (const auto &PredValue : PredValues) {
    BasicBlock *Pred = PredValue.second;
    if (!SeenPreds.insert(Pred).second)
      continue;  // Duplicate predecessor entry.

    Constant *Val = PredValue.first;

    // Map the known value to the successor BB's terminator would take for it.
    BasicBlock *DestBB;
    if (isa<UndefValue>(Val))
      DestBB = nullptr;
    else if (BranchInst *BI = dyn_cast<BranchInst>(BB->getTerminator())) {
      assert(isa<ConstantInt>(Val) && "Expecting a constant integer");
      // isZero() converts to 1 for a false condition, selecting successor 1;
      // a non-zero (true) condition selects successor 0.
      DestBB = BI->getSuccessor(cast<ConstantInt>(Val)->isZero());
    } else if (SwitchInst *SI = dyn_cast<SwitchInst>(BB->getTerminator())) {
      assert(isa<ConstantInt>(Val) && "Expecting a constant integer");
      DestBB = SI->findCaseValue(cast<ConstantInt>(Val))->getCaseSuccessor();
    } else {
      assert(isa<IndirectBrInst>(BB->getTerminator())
              && "Unexpected terminator");
      assert(isa<BlockAddress>(Val) && "Expecting a constant blockaddress");
      DestBB = cast<BlockAddress>(Val)->getBasicBlock();
    }

    // If we have exactly one destination, remember it for efficiency below.
    if (PredToDestList.empty()) {
      OnlyDest = DestBB;
      OnlyVal = Val;
    } else {
      if (OnlyDest != DestBB)
        OnlyDest = MultipleDestSentinel;
      // It is possible we have same destination, but different value, e.g.
      // default case in switchinst.
      if (Val != OnlyVal)
        OnlyVal = MultipleVal;
    }

    // If the predecessor ends with an indirect goto, we can't change its
    // destination.
    if (isa<IndirectBrInst>(Pred->getTerminator()))
      continue;

    PredToDestList.emplace_back(Pred, DestBB);
  }

  // If all edges were unthreadable, we fail.
  if (PredToDestList.empty())
    return false;

  // If all the predecessors go to a single known successor, we want to fold,
  // not thread. By doing so, we do not need to duplicate the current block and
  // also miss potential opportunities in case we don't/can't duplicate.
  if (OnlyDest && OnlyDest != MultipleDestSentinel) {
    // Folding is only done when the number of threadable entries equals BB's
    // predecessor count.
    if (BB->hasNPredecessors(PredToDestList.size())) {
      bool SeenFirstBranchToOnlyDest = false;
      std::vector <DominatorTree::UpdateType> Updates;
      Updates.reserve(BB->getTerminator()->getNumSuccessors() - 1);
      for (BasicBlock *SuccBB : successors(BB)) {
        if (SuccBB == OnlyDest && !SeenFirstBranchToOnlyDest) {
          SeenFirstBranchToOnlyDest = true; // Don't modify the first branch.
        } else {
          SuccBB->removePredecessor(BB, true); // This is unreachable successor.
          Updates.push_back({DominatorTree::Delete, BB, SuccBB});
        }
      }

      // Finally update the terminator.
      Instruction *Term = BB->getTerminator();
      Instruction *NewBI = BranchInst::Create(OnlyDest, Term->getIterator());
      NewBI->setDebugLoc(Term->getDebugLoc());
      ++NumFolds;
      Term->eraseFromParent();
      DTU->applyUpdatesPermissive(Updates);
      if (auto *BPI = getBPI())
        BPI->eraseBlock(BB);

      // If the condition is now dead due to the removal of the old terminator,
      // erase it.
      if (auto *CondInst = dyn_cast<Instruction>(Cond)) {
        if (CondInst->use_empty() && !CondInst->mayHaveSideEffects())
          CondInst->eraseFromParent();
        // We can safely replace *some* uses of the CondInst if it has
        // exactly one value as returned by LVI. RAUW is incorrect in the
        // presence of guards and assumes, that have the `Cond` as the use. This
        // is because we use the guards/assume to reason about the `Cond` value
        // at the end of block, but RAUW unconditionally replaces all uses
        // including the guards/assumes themselves and the uses before the
        // guard/assume.
        else if (OnlyVal && OnlyVal != MultipleVal)
          replaceFoldableUses(CondInst, OnlyVal, BB);
      }
      return true;
    }
  }

  // Determine which is the most common successor.  If we have many inputs and
  // this block is a switch, we want to start by threading the batch that goes
  // to the most popular destination first.  If we only know about one
  // threadable destination (the common case) we can avoid this.
  BasicBlock *MostPopularDest = OnlyDest;

  if (MostPopularDest == MultipleDestSentinel) {
    // Remove any loop headers from the Dest list, threadEdge conservatively
    // won't process them, but we might have other destination that are eligible
    // and we still want to process.
    erase_if(PredToDestList,
             [&](const std::pair<BasicBlock *, BasicBlock *> &PredToDest) {
               return LoopHeaders.contains(PredToDest.second);
             });

    if (PredToDestList.empty())
      return false;

    MostPopularDest = findMostPopularDest(BB, PredToDestList);
  }

  // Now that we know what the most popular destination is, factor all
  // predecessors that will jump to it into a single predecessor.
  SmallVector<BasicBlock*, 16> PredsToFactor;
  for (const auto &PredToDest : PredToDestList)
    if (PredToDest.second == MostPopularDest) {
      BasicBlock *Pred = PredToDest.first;

      // This predecessor may be a switch or something else that has multiple
      // edges to the block.  Factor each of these edges by listing them
      // according to # occurrences in PredsToFactor.
      for (BasicBlock *Succ : successors(Pred))
        if (Succ == BB)
          PredsToFactor.push_back(Pred);
    }

  // If the threadable edges are branching on an undefined value, we get to pick
  // the destination that these predecessors should get to.
  if (!MostPopularDest)
    MostPopularDest = BB->getTerminator()->
                            getSuccessor(getBestDestForJumpOnUndef(BB));

  // Ok, try to thread it!
  return tryThreadEdge(BB, PredsToFactor, MostPopularDest);
}


/// processBranchOnPHI - The block holding \p PN ends in a conditional branch
/// on that PHI node (or on a freeze of it) which could not be threaded any
/// other way.  Look at the PHI's incoming edges for a simplification.
///
/// \returns true as soon as duplicateCondBranchOnPHIIntoPred succeeds for one
/// of the predecessors, false if it succeeded for none of them.
bool JumpThreadingPass::processBranchOnPHI(PHINode *PN) {
  BasicBlock *BB = PN->getParent();

  // TODO: We could make use of this to do it once for blocks with common PHI
  // values.
  // Single-slot list that is refilled for every candidate predecessor.
  SmallVector<BasicBlock *, 1> PredBBs;
  PredBBs.resize(1);

  // Whenever a predecessor ends in an unconditional branch, the conditional
  // branch can be *duplicated* into it.  That encourages further jump
  // threading and gets rid of branches on a phi of an icmp (a branch directly
  // on the icmp is much better).
  // The same holds when the branch condition is a frozen phi, because
  // CodeGenPrepare can then canonicalize br(freeze(icmp)) to
  // br(icmp(freeze ...)).
  const unsigned NumIncoming = PN->getNumIncomingValues();
  for (unsigned Idx = 0; Idx != NumIncoming; ++Idx) {
    BasicBlock *Incoming = PN->getIncomingBlock(Idx);

    // Only predecessors terminated by an unconditional branch qualify.
    auto *IncomingBr = dyn_cast<BranchInst>(Incoming->getTerminator());
    if (!IncomingBr)
      continue;
    if (!IncomingBr->isUnconditional())
      continue;

    // Try to duplicate BB into this predecessor.
    PredBBs[0] = Incoming;
    if (duplicateCondBranchOnPHIIntoPred(BB, PredBBs))
      return true;
  }

  return false;
}


/// processBranchOnXOR - The block holding \p BO ends in a conditional branch
/// on that xor which could not be threaded any other way.  Look at what is
/// known about the xor's operands in the predecessors for a simplification.
///
/// \returns true if the xor was simplified in place or the block was
/// duplicated into predecessors; false if nothing was changed here.
bool JumpThreadingPass::processBranchOnXOR(BinaryOperator *BO) {
  BasicBlock *BB = BO->getParent();

  // A xor with a constant on either side is not handled by this
  // optimization.
  if (isa<ConstantInt>(BO->getOperand(0)) ||
      isa<ConstantInt>(BO->getOperand(1)))
    return false;

  // Unless BB starts with a phi, there is nothing special to learn about any
  // particular predecessor.
  if (!isa<PHINode>(BB->front()))
    return false;

  // Edges into a landing pad cannot be split.
  if (BB->isEHPad())
    return false;

  // With a xor feeding the branch of this block, knowing that one xor operand
  // is true/false in some predecessor lets us clone the condition into that
  // predecessor with the operand pinned, which saves logical ops on that path
  // and encourages other paths to simplify.
  //
  // This copies something like this:
  //
  //  BB:
  //    %X = phi i1 [1],  [%X']
  //    %Y = icmp eq i32 %A, %B
  //    %Z = xor i1 %X, %Y
  //    br i1 %Z, ...
  //
  // Into:
  //  BB':
  //    %Y = icmp ne i32 %A, %B
  //    br i1 %Y, ...

  // Try the left operand first and fall back to the right one.
  PredValueInfoTy KnownVals;
  const bool LHSIsKnown = computeValueKnownInPredecessors(
      BO->getOperand(0), BB, KnownVals, WantInteger, BO);
  if (!LHSIsKnown) {
    assert(KnownVals.empty());
    if (!computeValueKnownInPredecessors(BO->getOperand(1), BB, KnownVals,
                                         WantInteger, BO))
      return false;
  }

  assert(!KnownVals.empty() &&
         "computeValueKnownInPredecessors returned true with no values");

  // Operand index of the side we have predecessor knowledge about, and of the
  // opposite side.
  const unsigned KnownIdx = LHSIsKnown ? 0 : 1;
  const unsigned OtherIdx = LHSIsKnown ? 1 : 0;

  // Tally how many predecessors provide true and how many provide false.
  // Each entry is true, false, or undef; undef entries are left out of the
  // tally.
  unsigned TrueCount = 0, FalseCount = 0;
  for (const auto &Entry : KnownVals) {
    if (isa<UndefValue>(Entry.first))
      continue;
    unsigned &Counter =
        cast<ConstantInt>(Entry.first)->isZero() ? FalseCount : TrueCount;
    ++Counter;
  }

  // Pick the value to split on: true, false, or none at all (null) when every
  // entry was undef.
  ConstantInt *SplitVal = nullptr;
  if (TrueCount > FalseCount)
    SplitVal = ConstantInt::getTrue(BB->getContext());
  else if (TrueCount != 0 || FalseCount != 0)
    SplitVal = ConstantInt::getFalse(BB->getContext());

  // Gather every block this can be folded into, so that we factor once and
  // clone once.  Undef entries are compatible with any split value.
  SmallVector<BasicBlock *, 8> BlocksToFoldInto;
  for (const auto &Entry : KnownVals)
    if (Entry.first == SplitVal || isa<UndefValue>(Entry.first))
      BlocksToFoldInto.push_back(Entry.second);

  // When a value was inferred for every predecessor, duplication buys
  // nothing; the xor itself can be simplified instead.
  if (BlocksToFoldInto.size() ==
      cast<PHINode>(BB->front()).getNumIncomingValues()) {
    Value *OtherOp = BO->getOperand(OtherIdx);
    if (!SplitVal) {
      // Every predecessor provides undef, so the xor is undef as well.
      BO->replaceAllUsesWith(UndefValue::get(BO->getType()));
      BO->eraseFromParent();
    } else if (SplitVal->isZero() && BO != OtherOp) {
      // Every predecessor provides 0: the xor equals its other input.
      BO->replaceAllUsesWith(OtherOp);
      BO->eraseFromParent();
    } else {
      // Otherwise (all predecessors provide 1, or the other input is the xor
      // itself) pin the known operand to the constant.
      BO->setOperand(KnownIdx, SplitVal);
    }

    return true;
  }

  // The destination of an indirect goto cannot be changed, so give up if any
  // of the chosen predecessors ends with one.
  for (BasicBlock *Pred : BlocksToFoldInto)
    if (isa<IndirectBrInst>(Pred->getTerminator()))
      return false;

  // Try to duplicate BB into the chosen predecessors.
  return duplicateCondBranchOnPHIIntoPred(BB, BlocksToFoldInto);
}


/// addPHINodeEntriesForMappedBlock - 'NewPred' is being added as a new
/// predecessor of PHIBB.  For every PHI node in PHIBB, add an incoming entry
/// for NewPred whose value is the one the PHI already has for OldPred,
/// translated through \p ValueMap when that value is an instruction with a
/// mapping.
static void addPHINodeEntriesForMappedBlock(BasicBlock *PHIBB,
                                            BasicBlock *OldPred,
                                            BasicBlock *NewPred,
                                            ValueToValueMapTy &ValueMap) {
  // Translate V through ValueMap; anything that is not a mapped instruction
  // is passed through untouched.
  auto Translate = [&ValueMap](Value *V) -> Value * {
    auto *AsInst = dyn_cast<Instruction>(V);
    if (!AsInst)
      return V;
    ValueToValueMapTy::iterator Found = ValueMap.find(AsInst);
    if (Found == ValueMap.end())
      return V;
    return Found->second;
  };

  for (PHINode &Phi : PHIBB->phis()) {
    // Start from the value flowing in from OldPred and remap it if needed.
    Value *FromOldPred = Phi.getIncomingValueForBlock(OldPred);
    Phi.addIncoming(Translate(FromOldPred), NewPred);
  }
}


/// Merge basic block BB into its sole predecessor if possible.
///
/// \returns true if the merge was performed, false if BB was left alone.
bool JumpThreadingPass::maybeMergeBasicBlockIntoOnlyPred(BasicBlock *BB) {
  BasicBlock *SinglePred = BB->getSinglePredecessor();
  if (!SinglePred)
    return false;

  // The predecessor must end in an ordinary terminator with exactly one
  // successor, must not be BB itself, and BB must not have its address taken
  // and used.
  const Instruction *PredTerm = SinglePred->getTerminator();
  if (PredTerm->isSpecialTerminator())
    return false;
  if (PredTerm->getNumSuccessors() != 1)
    return false;
  if (SinglePred == BB)
    return false;
  if (hasAddressTakenAndUsed(BB))
    return false;

  // Loop-header status moves from SinglePred to BB.
  const bool PredWasLoopHeader = LoopHeaders.erase(SinglePred);
  if (PredWasLoopHeader)
    LoopHeaders.insert(BB);

  LVI->eraseBlock(SinglePred);
  MergeBasicBlockIntoOnlyPred(BB, DTU.get());

  // BB has now absorbed SinglePred: the single remaining block `BB` holds
  // SinglePred's code followed by BB's original code.  The LVI information
  // recorded for BB need not hold for all of the merged block, so it may have
  // to be invalidated.  For example, before the merge the LVI info and the
  // code look like this:
  //
  // SinglePred: <LVI info1 for %p val>
  // %y = use of %p
  // call @exit() // need not transfer execution to successor.
  // assume(%p) // from this point on %p is true
  // br label %BB
  // BB: <LVI info2 for %p val, i.e. %p is true>
  // %x = use of %p
  // br label exit
  //
  // Here the LVI info of both blocks is correct for %p (info1 for SinglePred,
  // info2 for BB).  After the merge, with LVI info1 for SinglePred deleted,
  // the code is:
  //
  // BB: <LVI info2 for %p val>
  // %y = use of %p
  // call @exit()
  // assume(%p)
  // %x = use of %p <-- LVI info2 is correct from here onwards.
  // br label exit
  //
  // so LVI info2 is incorrect at the beginning of BB.

  // Drop BB's LVI information unless it is provably true for all of BB.
  if (!isGuaranteedToTransferExecutionToSuccessor(BB))
    LVI->eraseBlock(BB);
  return true;
}


/// Update the SSA form.  NewBB contains instructions that are copied from BB.
/// ValueMapping maps old values in BB to new ones in NewBB.
///
/// Every use of a BB-defined instruction that sits outside BB is rewritten
/// through an SSAUpdater seeded with the original (in BB) and the copy (in
/// NewBB); debug users outside BB are updated the same way.
void JumpThreadingPass::updateSSA(BasicBlock *BB, BasicBlock *NewBB,
                                  ValueToValueMapTy &ValueMapping) {
  // Values defined in BB and used outside of it must now be rewritten to use
  // the original value, the cloned value, or a PHI derived from both.  That
  // can take arbitrary PHI insertion, which SSAUpdater handles for us.
  SSAUpdater SSAUpdate;
  SmallVector<Use *, 16> UsesToRename;
  SmallVector<DbgValueInst *, 4> DbgValues;
  SmallVector<DbgVariableRecord *, 4> DbgVariableRecords;

  for (Instruction &I : *BB) {
    // Record every use of I that lives outside BB.  A PHI operand counts as
    // living in the incoming block of that operand, anything else in the
    // block of the using instruction.
    for (Use &U : I.uses()) {
      auto *UserInst = cast<Instruction>(U.getUser());
      auto *UserPhi = dyn_cast<PHINode>(UserInst);
      BasicBlock *UseBlock =
          UserPhi ? UserPhi->getIncomingBlock(U) : UserInst->getParent();
      if (UseBlock != BB)
        UsesToRename.push_back(&U);
    }

    // Collect the debug users of I and keep only those outside of BB.
    findDbgValues(DbgValues, &I, &DbgVariableRecords);
    llvm::erase_if(DbgValues, [BB](const DbgValueInst *DVI) {
      return DVI->getParent() == BB;
    });
    llvm::erase_if(DbgVariableRecords, [BB](const DbgVariableRecord *DVR) {
      return DVR->getParent() == BB;
    });

    const bool HasOutsideDbgUsers =
        !DbgValues.empty() || !DbgVariableRecords.empty();

    // Nothing outside the block refers to I: move on to the next instruction.
    if (UsesToRename.empty() && !HasOutsideDbgUsers)
      continue;
    LLVM_DEBUG(dbgs() << "JT: Renaming non-local uses of: " << I << "\n");

    // I is used outside of BB.  Seed the updater with the two values we know
    // (the original in BB, the copy in NewBB) and let it rewrite each outside
    // use to the appropriate value or PHI node.
    SSAUpdate.Initialize(I.getType(), I.getName());
    SSAUpdate.AddAvailableValue(BB, &I);
    SSAUpdate.AddAvailableValue(NewBB, ValueMapping[&I]);

    while (!UsesToRename.empty())
      SSAUpdate.RewriteUse(*UsesToRename.pop_back_val());

    if (HasOutsideDbgUsers) {
      SSAUpdate.UpdateDebugValues(&I, DbgValues);
      SSAUpdate.UpdateDebugValues(&I, DbgVariableRecords);
      DbgValues.clear();
      DbgVariableRecords.clear();
    }

    LLVM_DEBUG(dbgs() << "\n");
  }
}


/// Clone instructions in range [BI, BE) to NewBB.  For PHI nodes, we only clone
/// arguments that come from PredBB.  On return, \p ValueMapping maps each
/// cloned instruction of the source basic block to its copy in NewBB (the
/// function itself returns nothing).
///
/// \param ValueMapping  Filled in with source-instruction -> clone entries;
///                      also consulted to remap operands of later clones.
/// \param BI            First instruction to clone.
/// \param BE            One past the last instruction to clone.
/// \param NewBB         Block receiving the clones (appended at its end).
/// \param PredBB        Predecessor whose incoming PHI values are selected.
void JumpThreadingPass::cloneInstructions(ValueToValueMapTy &ValueMapping,
                                          BasicBlock::iterator BI,
                                          BasicBlock::iterator BE,
                                          BasicBlock *NewBB,
                                          BasicBlock *PredBB) {
  // We are going to have to map operands from the source basic block to the new
  // copy of the block 'NewBB'.  If there are PHI nodes in the source basic
  // block, evaluate them to account for entry from PredBB.

  // Retargets llvm.dbg.value to any renamed variables.  Returns false if
  // NewInst is not a DbgValueInst, true otherwise (whether or not any operand
  // actually had a mapping).
  auto RetargetDbgValueIfPossible = [&](Instruction *NewInst) -> bool {
    auto DbgInstruction = dyn_cast<DbgValueInst>(NewInst);
    if (!DbgInstruction)
      return false;

    // Collect the replacements first and apply them afterwards, so that the
    // location operands are not modified while being iterated.
    SmallSet<std::pair<Value *, Value *>, 16> OperandsToRemap;
    for (auto DbgOperand : DbgInstruction->location_ops()) {
      auto DbgOperandInstruction = dyn_cast<Instruction>(DbgOperand);
      if (!DbgOperandInstruction)
        continue;

      auto I = ValueMapping.find(DbgOperandInstruction);
      if (I != ValueMapping.end()) {
        OperandsToRemap.insert(
            std::pair<Value *, Value *>(DbgOperand, I->second));
      }
    }

    for (auto &[OldOp, MappedOp] : OperandsToRemap)
      DbgInstruction->replaceVariableLocationOp(OldOp, MappedOp);
    return true;
  };

  // Duplicate implementation of the above dbg.value code, using
  // DbgVariableRecords instead.
  auto RetargetDbgVariableRecordIfPossible = [&](DbgVariableRecord *DVR) {
    SmallSet<std::pair<Value *, Value *>, 16> OperandsToRemap;
    for (auto *Op : DVR->location_ops()) {
      Instruction *OpInst = dyn_cast<Instruction>(Op);
      if (!OpInst)
        continue;

      auto I = ValueMapping.find(OpInst);
      if (I != ValueMapping.end())
        OperandsToRemap.insert({OpInst, I->second});
    }

    for (auto &[OldOp, MappedOp] : OperandsToRemap)
      DVR->replaceVariableLocationOp(OldOp, MappedOp);
  };

  // Remember the source block now: BI is advanced by the loops below.
  BasicBlock *RangeBB = BI->getParent();

  // Clone the phi nodes of the source basic block into NewBB.  The resulting
  // phi nodes are trivial since NewBB only has one predecessor, but SSAUpdater
  // might need to rewrite the operand of the cloned phi.
  for (; PHINode *PN = dyn_cast<PHINode>(BI); ++BI) {
    PHINode *NewPN = PHINode::Create(PN->getType(), 1, PN->getName(), NewBB);
    NewPN->addIncoming(PN->getIncomingValueForBlock(PredBB), PredBB);
    ValueMapping[PN] = NewPN;
  }

  // Clone noalias scope declarations in the threaded block. When threading a
  // loop exit, we would otherwise end up with two identical scope declarations
  // visible at the same time.
  SmallVector<MDNode *> NoAliasScopes;
  DenseMap<MDNode *, MDNode *> ClonedScopes;
  LLVMContext &Context = PredBB->getContext();
  identifyNoAliasScopesToClone(BI, BE, NoAliasScopes);
  cloneNoAliasScopes(NoAliasScopes, ClonedScopes, "thread", Context);

  // Copies the debug records attached to From onto NewInst and retargets the
  // variable records among them through ValueMapping.
  auto CloneAndRemapDbgInfo = [&](Instruction *NewInst, Instruction *From) {
    auto DVRRange = NewInst->cloneDebugInfoFrom(From);
    for (DbgVariableRecord &DVR : filterDbgVars(DVRRange))
      RetargetDbgVariableRecordIfPossible(&DVR);
  };

  // Clone the non-phi instructions of the source basic block into NewBB,
  // keeping track of the mapping and using it to remap operands in the cloned
  // instructions.
  for (; BI != BE; ++BI) {
    Instruction *New = BI->clone();
    New->setName(BI->getName());
    New->insertInto(NewBB, NewBB->end());
    ValueMapping[&*BI] = New;
    adaptNoAliasScopes(New, ClonedScopes, Context);

    CloneAndRemapDbgInfo(New, &*BI);

    // A dbg.value clone has its location operands retargeted by the helper;
    // the generic operand remapping below is skipped for it.
    if (RetargetDbgValueIfPossible(New))
      continue;

    // Remap operands to patch up intra-block references.
    for (unsigned i = 0, e = New->getNumOperands(); i != e; ++i)
      if (Instruction *Inst = dyn_cast<Instruction>(New->getOperand(i))) {
        ValueToValueMapTy::iterator I = ValueMapping.find(Inst);
        if (I != ValueMapping.end())
          New->setOperand(i, I->second);
      }
  }

  // There may be DbgVariableRecords on the terminator, clone directly from
  // marker to marker as there isn't an instruction there.
  if (BE != RangeBB->end() && BE->hasDbgRecords()) {
    // Dump them at the end.
    DbgMarker *Marker = RangeBB->getMarker(BE);
    DbgMarker *EndMarker = NewBB->createMarker(NewBB->end());
    auto DVRRange = EndMarker->cloneDebugInfoFrom(Marker, std::nullopt);
    for (DbgVariableRecord &DVR : filterDbgVars(DVRRange))
      RetargetDbgVariableRecordIfPossible(&DVR);
  }
}


/// Attempt to thread through two successive basic blocks.
///
/// \param BB    Block ending in the branch we would like to thread across; it
///              must have a single predecessor (called PredBB below).
/// \param Cond  Condition value evaluated on each incoming edge of PredBB.
/// \returns true if the IR was changed (PredBB was duplicated and an edge was
///          threaded through BB), false if any precondition or the cost check
///          failed.
bool JumpThreadingPass::maybethreadThroughTwoBasicBlocks(BasicBlock *BB,
                                                         Value *Cond) {
  // Consider:
  //
  // PredBB:
  //   %var = phi i32* [ null, %bb1 ], [ @a, %bb2 ]
  //   %tobool = icmp eq i32 %cond, 0
  //   br i1 %tobool, label %BB, label ...
  //
  // BB:
  //   %cmp = icmp eq i32* %var, null
  //   br i1 %cmp, label ..., label ...
  //
  // We don't know the value of %var at BB even if we know which incoming edge
  // we take to BB.  However, once we duplicate PredBB for each of its incoming
  // edges (say, PredBB1 and PredBB2), we know the value of %var in each copy of
  // PredBB.  Then we can thread edges PredBB1->BB and PredBB2->BB through BB.

  // Require that BB end with a Branch for simplicity.
  BranchInst *CondBr = dyn_cast<BranchInst>(BB->getTerminator());
  if (!CondBr)
    return false;

  // BB must have exactly one predecessor.
  BasicBlock *PredBB = BB->getSinglePredecessor();
  if (!PredBB)
    return false;

  // Require that PredBB end with a conditional Branch. If PredBB ends with an
  // unconditional branch, we should be merging PredBB and BB instead. For
  // simplicity, we don't deal with a switch.
  BranchInst *PredBBBranch = dyn_cast<BranchInst>(PredBB->getTerminator());
  if (!PredBBBranch || PredBBBranch->isUnconditional())
    return false;

  // If PredBB has exactly one incoming edge, we don't gain anything by copying
  // PredBB.
  if (PredBB->getSinglePredecessor())
    return false;

  // Don't thread through PredBB if it contains a successor edge to itself, in
  // which case we would infinite loop.  Suppose we are threading an edge from
  // PredPredBB through PredBB and BB to SuccBB with PredBB containing a
  // successor edge to itself.  If we allowed jump threading in this case, we
  // could duplicate PredBB and BB as, say, PredBB.thread and BB.thread.  Since
  // PredBB.thread has a successor edge to PredBB, we would immediately come up
  // with another jump threading opportunity from PredBB.thread through PredBB
  // and BB to SuccBB.  This jump threading would repeatedly occur.  That is, we
  // would keep peeling one iteration from PredBB.
  if (llvm::is_contained(successors(PredBB), PredBB))
    return false;

  // Don't thread across a loop header.
  if (LoopHeaders.count(PredBB))
    return false;

  // Avoid complication with duplicating EH pads.
  if (PredBB->isEHPad())
    return false;

  // Find a predecessor that we can thread.  For simplicity, we only consider a
  // successor edge out of BB to which we thread exactly one incoming edge into
  // PredBB.
  unsigned ZeroCount = 0;
  unsigned OneCount = 0;
  BasicBlock *ZeroPred = nullptr;
  BasicBlock *OnePred = nullptr;
  const DataLayout &DL = BB->getDataLayout();
  for (BasicBlock *P : predecessors(PredBB)) {
    // If PredPred ends with IndirectBrInst, we can't handle it.
    if (isa<IndirectBrInst>(P->getTerminator()))
      continue;
    // Only edges on which Cond evaluates to a constant integer are counted;
    // a null or non-ConstantInt result is ignored.
    if (ConstantInt *CI = dyn_cast_or_null<ConstantInt>(
            evaluateOnPredecessorEdge(BB, P, Cond, DL))) {
      if (CI->isZero()) {
        ZeroCount++;
        ZeroPred = P;
      } else if (CI->isOne()) {
        OneCount++;
        OnePred = P;
      }
    }
  }

  // Disregard complicated cases where we have to thread multiple edges.
  // Initialized to null so the variable never holds an indeterminate value.
  BasicBlock *PredPredBB = nullptr;
  if (ZeroCount == 1) {
    PredPredBB = ZeroPred;
  } else if (OneCount == 1) {
    PredPredBB = OnePred;
  } else {
    return false;
  }

  // A condition known to be zero selects successor 1 (the false edge); a
  // condition known to be one selects successor 0.
  BasicBlock *SuccBB = CondBr->getSuccessor(PredPredBB == ZeroPred);

  // If threading to the same block as we come from, we would infinite loop.
  if (SuccBB == BB) {
    LLVM_DEBUG(dbgs() << "  Not threading across BB '" << BB->getName()
                      << "' - would thread to self!\n");
    return false;
  }

  // If threading this would thread across a loop header, don't thread the edge.
  // See the comments above findLoopHeaders for justifications and caveats.
  if (LoopHeaders.count(BB) || LoopHeaders.count(SuccBB)) {
    LLVM_DEBUG({
      bool BBIsHeader = LoopHeaders.count(BB);
      bool SuccIsHeader = LoopHeaders.count(SuccBB);
      dbgs() << "  Not threading across "
             << (BBIsHeader ? "loop header BB '" : "block BB '")
             << BB->getName() << "' to dest "
             << (SuccIsHeader ? "loop header BB '" : "block BB '")
             << SuccBB->getName()
             << "' - it might create an irreducible loop!\n";
    });
    return false;
  }

  // Compute the cost of duplicating BB and PredBB.
  unsigned BBCost = getJumpThreadDuplicationCost(
      TTI, BB, BB->getTerminator(), BBDupThreshold);
  unsigned PredBBCost = getJumpThreadDuplicationCost(
      TTI, PredBB, PredBB->getTerminator(), BBDupThreshold);

  // Give up if costs are too high.  We need to check BBCost and PredBBCost
  // individually before checking their sum because getJumpThreadDuplicationCost
  // return (unsigned)~0 for those basic blocks that cannot be duplicated.
  if (BBCost > BBDupThreshold || PredBBCost > BBDupThreshold ||
      BBCost + PredBBCost > BBDupThreshold) {
    // Note the leading space in " for BB": without it the cost and the text
    // run together in the debug output.
    LLVM_DEBUG(dbgs() << "  Not threading BB '" << BB->getName()
                      << "' - Cost is too high: " << PredBBCost
                      << " for PredBB, " << BBCost << " for BB\n");
    return false;
  }

  // Now we are ready to duplicate PredBB.
  threadThroughTwoBasicBlocks(PredPredBB, PredBB, BB, SuccBB);
  return true;
}


/// Duplicate PredBB into a fresh block reached only from PredPredBB, then
/// thread the edge from that copy across BB to SuccBB.
///
/// \param PredPredBB  Predecessor of PredBB whose edge is redirected to the
///                    copy.
/// \param PredBB      Block to duplicate; must end in a BranchInst (see the
///                    cast below).
/// \param BB          Block to thread across; must end in a BranchInst.
/// \param SuccBB      Destination the threaded edge should reach.
void JumpThreadingPass::threadThroughTwoBasicBlocks(BasicBlock *PredPredBB,
                                                    BasicBlock *PredBB,
                                                    BasicBlock *BB,
                                                    BasicBlock *SuccBB) {
  LLVM_DEBUG(dbgs() << "  Threading through '" << PredBB->getName() << "' and '"
                    << BB->getName() << "'\n");

  // Build BPI/BFI before any changes are made to IR.
  bool HasProfile = doesBlockHaveProfileData(BB);
  auto *BFI = getOrCreateBFI(HasProfile);
  auto *BPI = getOrCreateBPI(BFI != nullptr);

  BranchInst *CondBr = cast<BranchInst>(BB->getTerminator());
  BranchInst *PredBBBranch = cast<BranchInst>(PredBB->getTerminator());

  // Create the block that will hold the copy of PredBB and place it right
  // after PredBB in the function's block order.
  BasicBlock *NewBB =
      BasicBlock::Create(PredBB->getContext(), PredBB->getName() + ".thread",
                         PredBB->getParent(), PredBB);
  NewBB->moveAfter(PredBB);

  // Set the block frequency of NewBB.
  if (BFI) {
    assert(BPI && "It's expected BPI to exist along with BFI");
    auto NewBBFreq = BFI->getBlockFreq(PredPredBB) *
                     BPI->getEdgeProbability(PredPredBB, PredBB);
    BFI->setBlockFreq(NewBB, NewBBFreq);
  }

  // We are going to have to map operands from the original BB block to the new
  // copy of the block 'NewBB'.  If there are PHI nodes in PredBB, evaluate them
  // to account for entry from PredPredBB.
  // The whole of PredBB, terminator included, is cloned here.
  ValueToValueMapTy ValueMapping;
  cloneInstructions(ValueMapping, PredBB->begin(), PredBB->end(), NewBB,
                    PredPredBB);

  // Copy the edge probabilities from PredBB to NewBB.
  if (BPI)
    BPI->copyEdgeProbabilities(PredBB, NewBB);

  // Update the terminator of PredPredBB to jump to NewBB instead of PredBB.
  // This eliminates predecessors from PredPredBB, which requires us to simplify
  // any PHI nodes in PredBB.
  Instruction *PredPredTerm = PredPredBB->getTerminator();
  for (unsigned i = 0, e = PredPredTerm->getNumSuccessors(); i != e; ++i)
    if (PredPredTerm->getSuccessor(i) == PredBB) {
      PredBB->removePredecessor(PredPredBB, true);
      PredPredTerm->setSuccessor(i, NewBB);
    }

  // NewBB is now an additional predecessor of both successors of PredBB's
  // branch; give their PHI nodes an entry for it.
  addPHINodeEntriesForMappedBlock(PredBBBranch->getSuccessor(0), PredBB, NewBB,
                                  ValueMapping);
  addPHINodeEntriesForMappedBlock(PredBBBranch->getSuccessor(1), PredBB, NewBB,
                                  ValueMapping);

  // NOTE(review): NewBB is a clone of PredBB, so its outgoing edges are those
  // of PredBBBranch, yet the first two inserts below name the successors of
  // CondBr (BB's terminator).  Presumably this relies on the permissive
  // update mode -- confirm this is intended.
  DTU->applyUpdatesPermissive(
      {{DominatorTree::Insert, NewBB, CondBr->getSuccessor(0)},
       {DominatorTree::Insert, NewBB, CondBr->getSuccessor(1)},
       {DominatorTree::Insert, PredPredBB, NewBB},
       {DominatorTree::Delete, PredPredBB, PredBB}});

  updateSSA(PredBB, NewBB, ValueMapping);

  // Clean up things like PHI nodes with single operands, dead instructions,
  // etc.
  SimplifyInstructionsInBlock(NewBB, TLI);
  SimplifyInstructionsInBlock(PredBB, TLI);

  // Finally thread the single edge NewBB -> BB across BB to SuccBB.
  SmallVector<BasicBlock *, 1> PredsToFactor;
  PredsToFactor.push_back(NewBB);
  threadEdge(BB, PredsToFactor, SuccBB);
}


/// tryThreadEdge - Thread the edges from \p PredBBs across \p BB to
/// \p SuccBB, but only when doing so is safe and profitable.
///
/// \returns true if threadEdge was invoked, false if the request was
/// rejected (self-threading, loop header involved, or duplication too
/// costly).
bool JumpThreadingPass::tryThreadEdge(
    BasicBlock *BB, const SmallVectorImpl<BasicBlock *> &PredBBs,
    BasicBlock *SuccBB) {
  // Threading to the very block we come from would loop forever.
  if (SuccBB == BB) {
    LLVM_DEBUG(dbgs() << "  Not threading across BB '" << BB->getName()
                      << "' - would thread to self!\n");
    return false;
  }

  // Refuse to thread across a loop header.  See the comments above
  // findLoopHeaders for justifications and caveats.
  const bool BBIsHeader = LoopHeaders.count(BB);
  const bool SuccIsHeader = LoopHeaders.count(SuccBB);
  if (BBIsHeader || SuccIsHeader) {
    LLVM_DEBUG(dbgs() << "  Not threading across "
                      << (BBIsHeader ? "loop header BB '" : "block BB '")
                      << BB->getName() << "' to dest "
                      << (SuccIsHeader ? "loop header BB '" : "block BB '")
                      << SuccBB->getName()
                      << "' - it might create an irreducible loop!\n");
    return false;
  }

  // Refuse when duplicating BB costs more than the threshold allows.
  const unsigned DupCost = getJumpThreadDuplicationCost(
      TTI, BB, BB->getTerminator(), BBDupThreshold);
  if (DupCost > BBDupThreshold) {
    LLVM_DEBUG(dbgs() << "  Not threading BB '" << BB->getName()
                      << "' - Cost is too high: " << DupCost << "\n");
    return false;
  }

  threadEdge(BB, PredBBs, SuccBB);
  return true;
}


/// threadEdge - We have decided that it is safe and profitable to factor the
/// blocks in PredBBs to one predecessor, then thread an edge from it to SuccBB
/// across BB.  Transform the IR to reflect this change.
///
/// \param BB       Block being threaded across; must not be a loop header and
///                 must differ from SuccBB (both asserted).
/// \param PredBBs  Predecessors of BB whose edges are threaded.  More than one
///                 entry is first factored into a single block via
///                 splitBlockPreds.
/// \param SuccBB   Destination the new copy of BB branches to
///                 unconditionally.
void JumpThreadingPass::threadEdge(BasicBlock *BB,
                                   const SmallVectorImpl<BasicBlock *> &PredBBs,
                                   BasicBlock *SuccBB) {
  assert(SuccBB != BB && "Don't create an infinite loop");

  assert(!LoopHeaders.count(BB) && !LoopHeaders.count(SuccBB) &&
         "Don't thread across loop headers");

  // Build BPI/BFI before any changes are made to IR.
  bool HasProfile = doesBlockHaveProfileData(BB);
  auto *BFI = getOrCreateBFI(HasProfile);
  auto *BPI = getOrCreateBPI(BFI != nullptr);

  // Start by factoring the predecessors if needed, so that there is exactly
  // one predecessor block (PredBB) to thread from.
  BasicBlock *PredBB;
  if (PredBBs.size() == 1)
    PredBB = PredBBs[0];
  else {
    LLVM_DEBUG(dbgs() << "  Factoring out " << PredBBs.size()
                      << " common predecessors.\n");
    PredBB = splitBlockPreds(BB, PredBBs, ".thr_comm");
  }

  // And finally, do it!
  LLVM_DEBUG(dbgs() << "  Threading edge from '" << PredBB->getName()
                    << "' to '" << SuccBB->getName()
                    << ", across block:\n    " << *BB << "\n");

  // Tell LVI about the threading before the IR is modified.
  LVI->threadEdge(PredBB, BB, SuccBB);

  // Create the block that will hold the copy of BB and place it right after
  // PredBB in the function's block order.
  BasicBlock *NewBB = BasicBlock::Create(BB->getContext(),
                                         BB->getName()+".thread",
                                         BB->getParent(), BB);
  NewBB->moveAfter(PredBB);

  // Set the block frequency of NewBB.
  if (BFI) {
    assert(BPI && "It's expected BPI to exist along with BFI");
    auto NewBBFreq =
        BFI->getBlockFreq(PredBB) * BPI->getEdgeProbability(PredBB, BB);
    BFI->setBlockFreq(NewBB, NewBBFreq);
  }

  // Copy all the instructions from BB to NewBB except the terminator.
  ValueToValueMapTy ValueMapping;
  cloneInstructions(ValueMapping, BB->begin(), std::prev(BB->end()), NewBB,
                    PredBB);

  // We didn't copy the terminator from BB over to NewBB, because there is now
  // an unconditional jump to SuccBB.  Insert the unconditional jump.
  BranchInst *NewBI = BranchInst::Create(SuccBB, NewBB);
  NewBI->setDebugLoc(BB->getTerminator()->getDebugLoc());

  // Check to see if SuccBB has PHI nodes. If so, we need to add entries to the
  // PHI nodes for NewBB now.
  addPHINodeEntriesForMappedBlock(SuccBB, BB, NewBB, ValueMapping);

  // Update the terminator of PredBB to jump to NewBB instead of BB.  This
  // eliminates predecessors from BB, which requires us to simplify any PHI
  // nodes in BB.
  Instruction *PredTerm = PredBB->getTerminator();
  for (unsigned i = 0, e = PredTerm->getNumSuccessors(); i != e; ++i)
    if (PredTerm->getSuccessor(i) == BB) {
      BB->removePredecessor(PredBB, true);
      PredTerm->setSuccessor(i, NewBB);
    }

  // Enqueue required DT updates.
  DTU->applyUpdatesPermissive({{DominatorTree::Insert, NewBB, SuccBB},
                               {DominatorTree::Insert, PredBB, NewBB},
                               {DominatorTree::Delete, PredBB, BB}});

  // Values defined in BB now have a second definition in NewBB; rewrite the
  // uses outside of BB accordingly.
  updateSSA(BB, NewBB, ValueMapping);

  // At this point, the IR is fully up to date and consistent.  Do a quick scan
  // over the new instructions and zap any that are constants or dead.  This
  // frequently happens because of phi translation.
  SimplifyInstructionsInBlock(NewBB, TLI);

  // Update the edge weight from BB to SuccBB, which should be less than before.
  updateBlockFreqAndEdgeWeight(PredBB, BB, NewBB, SuccBB, BFI, BPI, HasProfile);

  // Threaded an edge!
  ++NumThreads;
}


/// Create a new basic block that becomes the predecessor of BB and the
/// successor of all blocks in Preds.  When profile data is available, the
/// frequency of the new block is updated as well.
///
/// \returns the first block produced by the split (a landing-pad BB yields
/// two new blocks, any other BB yields one).
BasicBlock *JumpThreadingPass::splitBlockPreds(BasicBlock *BB,
                                               ArrayRef<BasicBlock *> Preds,
                                               const char *Suffix) {
  // Before touching the CFG, record the frequency of each Pred -> BB edge;
  // these are later summed into the frequency of the block(s) created by the
  // split.
  DenseMap<BasicBlock *, BlockFrequency> FreqMap;
  auto *BFI = getBFI();
  if (BFI) {
    auto *BPI = getOrCreateBPI(true);
    for (BasicBlock *Pred : Preds) {
      auto EdgeFreq =
          BFI->getBlockFreq(Pred) * BPI->getEdgeProbability(Pred, BB);
      FreqMap.insert({Pred, EdgeFreq});
    }
  }

  // Splitting the predecessors of a LandingPad block creates 2 new
  // predecessors instead of just one.
  SmallVector<BasicBlock *, 2> NewBBs;
  if (!BB->isLandingPad()) {
    NewBBs.push_back(SplitBlockPredecessors(BB, Preds, Suffix));
  } else {
    std::string NewName = std::string(Suffix) + ".split-lp";
    SplitLandingPadPredecessors(BB, Preds, Suffix, NewName.c_str(), NewBBs);
  }

  // Describe the CFG change to the dominator tree updater and, with profile
  // data, give every new block the summed frequency of its incoming edges.
  std::vector<DominatorTree::UpdateType> Updates;
  Updates.reserve((2 * Preds.size()) + NewBBs.size());
  for (BasicBlock *Split : NewBBs) {
    BlockFrequency SplitFreq(0);
    Updates.push_back({DominatorTree::Insert, Split, BB});
    for (BasicBlock *Pred : predecessors(Split)) {
      Updates.push_back({DominatorTree::Delete, Pred, BB});
      Updates.push_back({DominatorTree::Insert, Pred, Split});
      // Accumulate the frequency of the Pred -> Split edge.
      if (BFI)
        SplitFreq += FreqMap.lookup(Pred);
    }
    // Apply the summed frequency to the new block.
    if (BFI)
      BFI->setBlockFreq(Split, SplitFreq);
  }

  DTU->applyUpdatesPermissive(Updates);
  return NewBBs[0];
}


/// Return true if \p BB has a terminator with at least two successors that
/// carries valid branch-weight metadata (as judged by hasValidBranchWeightMD).
bool JumpThreadingPass::doesBlockHaveProfileData(BasicBlock *BB) {
  const Instruction *Term = BB->getTerminator();

  // A missing terminator or fewer than two successors never counts as having
  // profile data.
  const bool HasMultipleSuccessors = Term && Term->getNumSuccessors() >= 2;
  return HasMultipleSuccessors && hasValidBranchWeightMD(*Term);
}


/// Update the block frequency of BB and branch weight and the metadata on the
/// edge BB->SuccBB. This is done by scaling the weight of BB->SuccBB by 1 -
/// Freq(PredBB->BB) / Freq(BB->SuccBB).
///
/// \param PredBB     Predecessor whose edge into BB was threaded away (not
///                   read by this implementation).
/// \param BB         Block whose frequency and outgoing probabilities are
///                   recomputed.
/// \param NewBB      Block whose frequency is subtracted from BB and from the
///                   BB->SuccBB edge.
/// \param SuccBB     Successor of BB whose edge frequency is reduced.
/// \param BFI, BPI   Either both non-null or both null. When null, nothing is
///                   updated and HasProfile is expected to be false.
/// \param HasProfile When true, the recomputed probabilities are also written
///                   back as branch-weight metadata on BB's terminator.
void JumpThreadingPass::updateBlockFreqAndEdgeWeight(BasicBlock *PredBB,
                                                     BasicBlock *BB,
                                                     BasicBlock *NewBB,
                                                     BasicBlock *SuccBB,
                                                     BlockFrequencyInfo *BFI,
                                                     BranchProbabilityInfo *BPI,
                                                     bool HasProfile) {
  // The second disjunct must test BPI: testing BFI twice would let the
  // combination "BFI unset, BPI set" slip through unnoticed.
  assert(((BFI && BPI) || (!BFI && !BPI)) &&
         "Both BFI & BPI should either be set or unset");

  if (!BFI) {
    assert(!HasProfile &&
           "It's expected to have BFI/BPI when profile info exists");
    return;
  }

  // As the edge from PredBB to BB is deleted, we have to update the block
  // frequency of BB.
  auto BBOrigFreq = BFI->getBlockFreq(BB);
  auto NewBBFreq = BFI->getBlockFreq(NewBB);
  // Frequency of the BB->SuccBB edge, computed before BB's frequency changes.
  auto BB2SuccBBFreq = BBOrigFreq * BPI->getEdgeProbability(BB, SuccBB);
  auto BBNewFreq = BBOrigFreq - NewBBFreq;
  BFI->setBlockFreq(BB, BBNewFreq);

  // Collect updated outgoing edges' frequencies from BB and use them to update
  // edge probabilities. Only the edge to SuccBB loses NewBB's frequency; all
  // other edges keep the frequency derived from BB's original frequency.
  SmallVector<uint64_t, 4> BBSuccFreq;
  for (BasicBlock *Succ : successors(BB)) {
    auto SuccFreq = (Succ == SuccBB)
                        ? BB2SuccBBFreq - NewBBFreq
                        : BBOrigFreq * BPI->getEdgeProbability(BB, Succ);
    BBSuccFreq.push_back(SuccFreq.getFrequency());
  }

  uint64_t MaxBBSuccFreq = *llvm::max_element(BBSuccFreq);

  SmallVector<BranchProbability, 4> BBSuccProbs;
  if (MaxBBSuccFreq == 0)
    // Every edge frequency is zero: fall back to a uniform distribution.
    BBSuccProbs.assign(BBSuccFreq.size(),
                       {1, static_cast<unsigned>(BBSuccFreq.size())});
  else {
    // Express each edge relative to the largest one.
    for (uint64_t Freq : BBSuccFreq)
      BBSuccProbs.push_back(
          BranchProbability::getBranchProbability(Freq, MaxBBSuccFreq));
    // Normalize edge probabilities so that they sum up to one.
    BranchProbability::normalizeProbabilities(BBSuccProbs.begin(),
                                              BBSuccProbs.end());
  }

  // Update edge probabilities in BPI.
  BPI->setEdgeProbability(BB, BBSuccProbs);

  // Update the profile metadata as well.
  //
  // Don't do this if the profile of the transformed blocks was statically
  // estimated.  (This could occur despite the function having an entry
  // frequency in completely cold parts of the CFG.)
  //
  // In this case we don't want to suggest to subsequent passes that the
  // calculated weights are fully consistent.  Consider this graph:
  //
  //                 check_1
  //             50% /  |
  //             eq_1   | 50%
  //                 \  |
  //                 check_2
  //             50% /  |
  //             eq_2   | 50%
  //                 \  |
  //                 check_3
  //             50% /  |
  //             eq_3   | 50%
  //                 \  |
  //
  // Assuming the blocks check_* all compare the same value against 1, 2 and 3,
  // the overall probabilities are inconsistent; the total probability that the
  // value is either 1, 2 or 3 is 150%.
  //
  // As a consequence if we thread eq_1 -> check_2 to check_3, check_2->check_3
  // becomes 0%.  This is even worse if the edge whose probability becomes 0% is
  // the loop exit edge.  Then based solely on static estimation we would assume
  // the loop was extremely hot.
  //
  // FIXME: Fix this locally as well so that BPI and BFI are consistent.  We
  // shouldn't make edges extremely likely or unlikely based solely on static
  // estimation.
  if (BBSuccProbs.size() >= 2 && HasProfile) {
    // The numerators of the normalized probabilities serve as the weights.
    SmallVector<uint32_t, 4> Weights;
    for (auto Prob : BBSuccProbs)
      Weights.push_back(Prob.getNumerator());

    auto TI = BB->getTerminator();
    setBranchWeights(*TI, Weights, hasBranchWeightOrigin(*TI));
  }
}


/// duplicateCondBranchOnPHIIntoPred - PredBB contains an unconditional branch
/// to BB which contains an i1 PHI node and a conditional branch on that PHI.
/// If we can duplicate the contents of BB up into PredBB do so now, this
/// improves the odds that the branch will be on an analyzable instruction like
/// a compare.
///
/// \param BB      Block whose non-PHI instructions are cloned into the
///                predecessor.
/// \param PredBBs Non-empty list of predecessors of BB. When it holds more
///                than one block, they are first factored into a single
///                predecessor via splitBlockPreds.
/// \returns false if BB is a recorded loop header or the duplication cost
///          exceeds BBDupThreshold; true after the duplication was performed.
bool JumpThreadingPass::duplicateCondBranchOnPHIIntoPred(
    BasicBlock *BB, const SmallVectorImpl<BasicBlock *> &PredBBs) {
  assert(!PredBBs.empty() && "Can't handle an empty set");

  // If BB is a loop header, then duplicating this block outside the loop would
  // cause us to transform this into an irreducible loop, don't do this.
  // See the comments above findLoopHeaders for justifications and caveats.
  if (LoopHeaders.count(BB)) {
    LLVM_DEBUG(dbgs() << "  Not duplicating loop header '" << BB->getName()
                      << "' into predecessor block '" << PredBBs[0]->getName()
                      << "' - it might create an irreducible loop!\n");
    return false;
  }

  // Bail out when cloning BB (up to its terminator) is too expensive.
  unsigned DuplicationCost = getJumpThreadDuplicationCost(
      TTI, BB, BB->getTerminator(), BBDupThreshold);
  if (DuplicationCost > BBDupThreshold) {
    LLVM_DEBUG(dbgs() << "  Not duplicating BB '" << BB->getName()
                      << "' - Cost is too high: " << DuplicationCost << "\n");
    return false;
  }

  // And finally, do it!  Start by factoring the predecessors if needed.
  // Dominator tree changes are accumulated in Updates and applied in one
  // batch at the very end.
  std::vector<DominatorTree::UpdateType> Updates;
  BasicBlock *PredBB;
  if (PredBBs.size() == 1)
    PredBB = PredBBs[0];
  else {
    LLVM_DEBUG(dbgs() << "  Factoring out " << PredBBs.size()
                      << " common predecessors.\n");
    PredBB = splitBlockPreds(BB, PredBBs, ".thr_comm");
  }
  // The PredBB -> BB edge disappears once BB's contents live in PredBB.
  Updates.push_back({DominatorTree::Delete, PredBB, BB});

  // Okay, we decided to do this!  Clone all the instructions in BB onto the end
  // of PredBB.
  LLVM_DEBUG(dbgs() << "  Duplicating block '" << BB->getName()
                    << "' into end of '" << PredBB->getName()
                    << "' to eliminate branch on phi.  Cost: "
                    << DuplicationCost << " block is:" << *BB << "\n");

  // Unless PredBB ends with an unconditional branch, split the edge so that we
  // can just clone the bits from BB into the end of the new PredBB.
  BranchInst *OldPredBranch = dyn_cast<BranchInst>(PredBB->getTerminator());

  if (!OldPredBranch || !OldPredBranch->isUnconditional()) {
    BasicBlock *OldPredBB = PredBB;
    // From here on PredBB names the block SplitEdge placed on the edge.
    PredBB = SplitEdge(OldPredBB, BB);
    Updates.push_back({DominatorTree::Insert, OldPredBB, PredBB});
    Updates.push_back({DominatorTree::Insert, PredBB, BB});
    Updates.push_back({DominatorTree::Delete, OldPredBB, BB});
    OldPredBranch = cast<BranchInst>(PredBB->getTerminator());
  }

  // We are going to have to map operands from the original BB block into the
  // PredBB block.  Evaluate PHI nodes in BB.
  ValueToValueMapTy ValueMapping;

  // Each PHI in BB maps to the value it receives along the PredBB edge.
  BasicBlock::iterator BI = BB->begin();
  for (; PHINode *PN = dyn_cast<PHINode>(BI); ++BI)
    ValueMapping[PN] = PN->getIncomingValueForBlock(PredBB);
  // Clone the non-phi instructions of BB into PredBB, keeping track of the
  // mapping and using it to remap operands in the cloned instructions.
  for (; BI != BB->end(); ++BI) {
    Instruction *New = BI->clone();
    // Clones are placed in front of PredBB's old branch, which is erased once
    // cloning is finished.
    New->insertInto(PredBB, OldPredBranch->getIterator());

    // Remap operands to patch up intra-block references.
    for (unsigned i = 0, e = New->getNumOperands(); i != e; ++i)
      if (Instruction *Inst = dyn_cast<Instruction>(New->getOperand(i))) {
        ValueToValueMapTy::iterator I = ValueMapping.find(Inst);
        if (I != ValueMapping.end())
          New->setOperand(i, I->second);
      }

    // Remap debug variable operands.
    remapDebugVariable(ValueMapping, New);

    // If this instruction can be simplified after the operands are updated,
    // just use the simplified value instead.  This frequently happens due to
    // phi translation.
    if (Value *IV = simplifyInstruction(
            New,
            {BB->getDataLayout(), TLI, nullptr, nullptr, New})) {
      ValueMapping[&*BI] = IV;
      // The clone is only dropped when it has no side effects; otherwise it
      // stays in PredBB while its users are mapped to the simplified value.
      if (!New->mayHaveSideEffects()) {
        New->eraseFromParent();
        New = nullptr;
        // Clone debug-info on the elided instruction to the destination
        // position.
        OldPredBranch->cloneDebugInfoFrom(&*BI, std::nullopt, true);
      }
    } else {
      ValueMapping[&*BI] = New;
    }
    if (New) {
      // Otherwise, insert the new instruction into the block.
      New->setName(BI->getName());
      // Clone across any debug-info attached to the old instruction.
      New->cloneDebugInfoFrom(&*BI);
      // Update Dominance from simplified New instruction operands.
      // Any basic-block operand of the clone is a new CFG edge out of PredBB.
      for (unsigned i = 0, e = New->getNumOperands(); i != e; ++i)
        if (BasicBlock *SuccBB = dyn_cast<BasicBlock>(New->getOperand(i)))
          Updates.push_back({DominatorTree::Insert, PredBB, SuccBB});
    }
  }

  // Check to see if the targets of the branch had PHI nodes. If so, we need to
  // add entries to the PHI nodes for branch from PredBB now.
  BranchInst *BBBranch = cast<BranchInst>(BB->getTerminator());
  addPHINodeEntriesForMappedBlock(BBBranch->getSuccessor(0), BB, PredBB,
                                  ValueMapping);
  addPHINodeEntriesForMappedBlock(BBBranch->getSuccessor(1), BB, PredBB,
                                  ValueMapping);

  updateSSA(BB, PredBB, ValueMapping);

  // PredBB no longer jumps to BB, remove entries in the PHI node for the edge
  // that we nuked.
  BB->removePredecessor(PredBB, true);

  // Remove the unconditional branch at the end of the PredBB block.
  OldPredBranch->eraseFromParent();
  // If a cached BPI exists, copy BB's edge probabilities over to PredBB.
  if (auto *BPI = getBPI())
    BPI->copyEdgeProbabilities(BB, PredBB);
  DTU->applyUpdatesPermissive(Updates);

  ++NumDupes;
  return true;
}


// Turn a select feeding a PHI into explicit control flow.
//
// Preconditions: Pred branches unconditionally to BB, SI lives in Pred, and
// SIUse is a PHI in BB whose incoming value number Idx is SI (SI has no other
// use). BB may have further predecessors.
//
// A fresh block "select.unfold" is created and Pred's terminator becomes a
// conditional branch on SI's condition. SI itself is erased.
void JumpThreadingPass::unfoldSelectInstr(BasicBlock *Pred, BasicBlock *BB,
                                          SelectInst *SI, PHINode *SIUse,
                                          unsigned Idx) {
  // Resulting CFG:
  //
  // Pred --
  //  |    v
  //  |  NewBB
  //  |    |
  //  |-----
  //  v
  // BB
  BranchInst *OldBr = cast<BranchInst>(Pred->getTerminator());
  BasicBlock *UnfoldBB = BasicBlock::Create(BB->getContext(), "select.unfold",
                                            BB->getParent(), BB);

  // Pred's unconditional branch becomes the terminator of the new block.
  OldBr->removeFromParent();
  OldBr->insertInto(UnfoldBB, UnfoldBB->end());

  // Pred now branches on the select condition: taken edge goes through the
  // new block, the other edge goes straight to BB.
  auto *CondBr = BranchInst::Create(UnfoldBB, BB, SI->getCondition(), Pred);
  CondBr->applyMergedLocation(OldBr->getDebugLoc(), SI->getDebugLoc());
  CondBr->copyMetadata(*SI, {LLVMContext::MD_prof});

  // The direct edge carries the select's false value, the edge through the
  // new block carries its true value.
  SIUse->setIncomingValue(Idx, SI->getFalseValue());
  SIUse->addIncoming(SI->getTrueValue(), UnfoldBB);

  // Transfer the select's branch weights (if any) to BPI as probabilities of
  // the new conditional branch.
  uint64_t TrueWeight = 1;
  uint64_t FalseWeight = 1;
  const bool GotWeights = extractBranchWeights(*SI, TrueWeight, FalseWeight);
  if (GotWeights && (TrueWeight + FalseWeight) != 0) {
    const uint64_t Total = TrueWeight + FalseWeight;
    SmallVector<BranchProbability, 2> Probs;
    Probs.emplace_back(
        BranchProbability::getBranchProbability(TrueWeight, Total));
    Probs.emplace_back(
        BranchProbability::getBranchProbability(FalseWeight, Total));
    if (auto *BPI = getBPI())
      BPI->setEdgeProbability(Pred, Probs);
  }

  // Derive the frequency of the new block from Pred's frequency and the
  // probability of the taken edge; an all-zero weight pair counts as 1:1.
  if (auto *BFI = getBFI()) {
    if ((TrueWeight + FalseWeight) == 0) {
      TrueWeight = 1;
      FalseWeight = 1;
    }
    BranchProbability TakenProb = BranchProbability::getBranchProbability(
        TrueWeight, TrueWeight + FalseWeight);
    BFI->setBlockFreq(UnfoldBB, BFI->getBlockFreq(Pred) * TakenProb);
  }

  // Nothing references the select any more.
  SI->eraseFromParent();
  DTU->applyUpdatesPermissive({{DominatorTree::Insert, UnfoldBB, BB},
                               {DominatorTree::Insert, Pred, UnfoldBB}});

  // Every other PHI in BB needs an entry for the new predecessor; it sees the
  // same value as along the edge from Pred.
  for (Instruction &Inst : *BB) {
    auto *Phi = dyn_cast<PHINode>(&Inst);
    if (!Phi)
      break;
    if (Phi == SIUse)
      continue;
    Phi->addIncoming(Phi->getIncomingValueForBlock(Pred), UnfoldBB);
  }
}


/// Switch flavour of tryToUnfoldSelect: if the switch condition is a PHI in BB
/// and one of its incoming values is a single-use select defined in the
/// corresponding predecessor (which ends in an unconditional branch), unfold
/// that select. Returns true after the first select was unfolded.
bool JumpThreadingPass::tryToUnfoldSelect(SwitchInst *SI, BasicBlock *BB) {
  auto *CondPHI = dyn_cast<PHINode>(SI->getCondition());
  if (!CondPHI)
    return false;
  if (CondPHI->getParent() != BB)
    return false;

  const unsigned NumIncoming = CondPHI->getNumIncomingValues();
  for (unsigned Idx = 0; Idx != NumIncoming; ++Idx) {
    BasicBlock *Pred = CondPHI->getIncomingBlock(Idx);
    auto *PredSI = dyn_cast<SelectInst>(CondPHI->getIncomingValue(Idx));

    // Requiring the select to live in Pred and to have a single use could
    // potentially be relaxed. For now these restrictions keep the code simple
    // and let us share the machinery written for
    // tryToUnfoldSelect(CmpInst *, BasicBlock *).
    const bool IsCandidate =
        PredSI && PredSI->getParent() == Pred && PredSI->hasOneUse();
    if (!IsCandidate)
      continue;

    auto *PredTerm = dyn_cast<BranchInst>(Pred->getTerminator());
    if (PredTerm && PredTerm->isUnconditional()) {
      unfoldSelectInstr(Pred, BB, PredSI, CondPHI, Idx);
      return true;
    }
  }

  return false;
}


/// tryToUnfoldSelect - Handle blocks shaped like
/// bb1:
///   %a = select
///   br bb2
///
/// bb2:
///   %p = phi [%a, %bb1] ...
///   %c = icmp %p
///   br i1 %c
///
/// The select is turned into a branch structure when the comparison can be
/// decided on the bb1->bb2 edge for at least one of the select's value
/// operands and the two operands do not produce the same result. This later
/// enables threading from bb1 over bb2.
bool JumpThreadingPass::tryToUnfoldSelect(CmpInst *CondCmp, BasicBlock *BB) {
  auto *CondBr = dyn_cast<BranchInst>(BB->getTerminator());
  auto *CondLHS = dyn_cast<PHINode>(CondCmp->getOperand(0));
  auto *CondRHS = cast<Constant>(CondCmp->getOperand(1));

  // BB must end in a conditional branch and the compared PHI must be in BB.
  const bool EndsInCondBr = CondBr && CondBr->isConditional();
  if (!EndsInCondBr || !CondLHS || CondLHS->getParent() != BB)
    return false;

  const unsigned NumIncoming = CondLHS->getNumIncomingValues();
  for (unsigned Idx = 0; Idx != NumIncoming; ++Idx) {
    BasicBlock *Pred = CondLHS->getIncomingBlock(Idx);

    // Only a single-use select defined in the matching predecessor qualifies.
    auto *Sel = dyn_cast<SelectInst>(CondLHS->getIncomingValue(Idx));
    if (!Sel || Sel->getParent() != Pred || !Sel->hasOneUse())
      continue;

    // ... and that predecessor has to end in an unconditional branch.
    auto *PredTerm = dyn_cast<BranchInst>(Pred->getTerminator());
    if (!PredTerm || !PredTerm->isUnconditional())
      continue;

    // Ask LVI what the comparison evaluates to on the Pred->BB edge when the
    // PHI input is replaced by the given select operand.
    auto EvalOnEdge = [&](Value *Operand) -> Constant * {
      return LVI->getPredicateOnEdge(CondCmp->getPredicate(), Operand, CondRHS,
                                     Pred, BB, CondCmp);
    };
    Constant *Op1Res = EvalOnEdge(Sel->getOperand(1));
    Constant *Op2Res = EvalOnEdge(Sel->getOperand(2));

    // Unfold when at least one result is known and the results differ.
    const bool AnyKnown = Op1Res || Op2Res;
    if (AnyKnown && Op1Res != Op2Res) {
      unfoldSelectInstr(Pred, BB, Sel, CondLHS, Idx);
      return true;
    }
  }

  return false;
}


/// tryToUnfoldSelectInCurrBB - Look for PHI/Select or PHI/CMP/Select in the
/// same BB in the form
/// bb:
///   %p = phi [false, %bb1], [true, %bb2], [false, %bb3], [true, %bb4], ...
///   %s = select %p, trueval, falseval
///
/// or
///
/// bb:
///   %p = phi [0, %bb1], [1, %bb2], [0, %bb3], [1, %bb4], ...
///   %c = cmp %p, 0
///   %s = select %c, trueval, falseval
///
/// And expand the select into a branch structure. This later enables
/// jump-threading over bb in this pass.
///
/// Using the similar approach of SimplifyCFG::FoldCondBranchOnPHI(), unfold
/// select if the associated PHI has at least one constant.  If the unfolded
/// select is not jump-threaded, it will be folded again in the later
/// optimizations.
///
/// \returns true if a select in BB was unfolded (only the first candidate
///          found is handled per call), false otherwise.
bool JumpThreadingPass::tryToUnfoldSelectInCurrBB(BasicBlock *BB) {
  // This transform would reduce the quality of msan diagnostics.
  // Disable this transform under MemorySanitizer.
  if (BB->getParent()->hasFnAttribute(Attribute::SanitizeMemory))
    return false;

  // If threading this would thread across a loop header, don't thread the edge.
  // See the comments above findLoopHeaders for justifications and caveats.
  if (LoopHeaders.count(BB))
    return false;

  // Walk the PHI nodes at the top of BB.
  for (BasicBlock::iterator BI = BB->begin();
       PHINode *PN = dyn_cast<PHINode>(BI); ++BI) {
    // Look for a Phi having at least one constant incoming value.
    if (llvm::all_of(PN->incoming_values(),
                     [](Value *V) { return !isa<ConstantInt>(V); }))
      continue;

    // A select qualifies when it is in BB, its condition is exactly V, that
    // condition has type i1, and the select does not match the logical
    // and/or patterns.
    auto isUnfoldCandidate = [BB](SelectInst *SI, Value *V) {
      using namespace PatternMatch;

      // Check if SI is in BB and use V as condition.
      if (SI->getParent() != BB)
        return false;
      Value *Cond = SI->getCondition();
      bool IsAndOr = match(SI, m_CombineOr(m_LogicalAnd(), m_LogicalOr()));
      return Cond && Cond == V && Cond->getType()->isIntegerTy(1) && !IsAndOr;
    };

    // Search the users of PN for the first qualifying select.
    SelectInst *SI = nullptr;
    for (Use &U : PN->uses()) {
      if (ICmpInst *Cmp = dyn_cast<ICmpInst>(U.getUser())) {
        // Look for a ICmp in BB that compares PN with a constant and is the
        // condition of a Select.
        // (1 - U.getOperandNo() picks the compare operand that is not PN.)
        if (Cmp->getParent() == BB && Cmp->hasOneUse() &&
            isa<ConstantInt>(Cmp->getOperand(1 - U.getOperandNo())))
          if (SelectInst *SelectI = dyn_cast<SelectInst>(Cmp->user_back()))
            if (isUnfoldCandidate(SelectI, Cmp->use_begin()->get())) {
              SI = SelectI;
              break;
            }
      } else if (SelectInst *SelectI = dyn_cast<SelectInst>(U.getUser())) {
        // Look for a Select in BB that uses PN as condition.
        if (isUnfoldCandidate(SelectI, U.get())) {
          SI = SelectI;
          break;
        }
      }
    }

    if (!SI)
      continue;
    // Expand the select.
    Value *Cond = SI->getCondition();
    // Freeze the condition before branching on it unless it is known not to
    // be undef or poison.
    if (!isGuaranteedNotToBeUndefOrPoison(Cond, nullptr, SI))
      Cond = new FreezeInst(Cond, "cond.fr", SI->getIterator());
    MDNode *BranchWeights = getBranchWeightMDNode(*SI);
    Instruction *Term =
        SplitBlockAndInsertIfThen(Cond, SI, false, BranchWeights);
    // After the split SI sits in the tail block (SplitBB) and Term terminates
    // the newly inserted "then" block (NewBB).
    BasicBlock *SplitBB = SI->getParent();
    BasicBlock *NewBB = Term->getParent();
    // Replace the select by a PHI merging the value from the "then" block
    // with the value arriving directly from BB.
    PHINode *NewPN = PHINode::Create(SI->getType(), 2, "", SI->getIterator());
    NewPN->addIncoming(SI->getTrueValue(), Term->getParent());
    NewPN->addIncoming(SI->getFalseValue(), BB);
    NewPN->setDebugLoc(SI->getDebugLoc());
    SI->replaceAllUsesWith(NewPN);
    SI->eraseFromParent();
    // NewBB and SplitBB are newly created blocks which require insertion.
    std::vector<DominatorTree::UpdateType> Updates;
    Updates.reserve((2 * SplitBB->getTerminator()->getNumSuccessors()) + 3);
    Updates.push_back({DominatorTree::Insert, BB, SplitBB});
    Updates.push_back({DominatorTree::Insert, BB, NewBB});
    Updates.push_back({DominatorTree::Insert, NewBB, SplitBB});
    // BB's successors were moved to SplitBB, update DTU accordingly.
    for (auto *Succ : successors(SplitBB)) {
      Updates.push_back({DominatorTree::Delete, BB, Succ});
      Updates.push_back({DominatorTree::Insert, SplitBB, Succ});
    }
    DTU->applyUpdatesPermissive(Updates);
    return true;
  }
  return false;
}


/// Attempt to move a guard out of BB into one of its predecessors when the
/// other path into BB already implies that the guard's condition holds. Only
/// the simplest diamond shape is handled:
///
/// Start:
///   %cond = ...
///   br i1 %cond, label %T1, label %F1
/// T1:
///   br label %Merge
/// F1:
///   br label %Merge
/// Merge:
///   %condGuard = ...
///   call void(i1, ...) @llvm.experimental.guard( i1 %condGuard )[ "deopt"() ]
///
/// where cond implies either condGuard or !condGuard. The instructions ahead
/// of the guard are then duplicated into both branches and the guard is
/// threaded into one of them.
///
/// Returns true if some guard in BB was threaded.
bool JumpThreadingPass::processGuards(BasicBlock *BB) {
  using namespace PatternMatch;

  // BB must have exactly two predecessors, and they must be distinct blocks.
  auto PredIt = pred_begin(BB);
  auto PredEnd = pred_end(BB);
  if (PredIt == PredEnd)
    return false;
  BasicBlock *FirstPred = *PredIt++;
  if (PredIt == PredEnd)
    return false;
  BasicBlock *SecondPred = *PredIt++;
  if (PredIt != PredEnd || FirstPred == SecondPred)
    return false;

  // Both predecessors must hang off one common single predecessor.
  // TODO: Look up deeper than to immediate predecessor?
  BasicBlock *Parent = FirstPred->getSinglePredecessor();
  if (!Parent)
    return false;
  if (Parent != SecondPred->getSinglePredecessor())
    return false;

  // The common parent has to end in a branch instruction.
  auto *ParentBr = dyn_cast<BranchInst>(Parent->getTerminator());
  if (!ParentBr)
    return false;

  // Stop at the first guard that can be threaded.
  for (Instruction &Inst : *BB)
    if (isGuard(&Inst) &&
        threadGuard(BB, cast<IntrinsicInst>(&Inst), ParentBr))
      return true;

  return false;
}


/// Try to propagate the guard from BB which is the lower block of a diamond
/// to one of its branches, in case if diamond's condition implies guard's
/// condition.
///
/// \param BB    The block containing the guard.
/// \param Guard The guard intrinsic call in BB; its first argument is the
///              guarded condition.
/// \param BI    The conditional branch at the top of the diamond.
/// \returns false if neither branch direction implies the guard condition or
///          if duplicating BB up to and including the guard is too costly;
///          true after the guard has been moved into one of the branches.
bool JumpThreadingPass::threadGuard(BasicBlock *BB, IntrinsicInst *Guard,
                                    BranchInst *BI) {
  assert(BI->getNumSuccessors() == 2 && "Wrong number of successors?");
  assert(BI->isConditional() && "Unconditional branch has 2 successors?");
  Value *GuardCond = Guard->getArgOperand(0);
  Value *BranchCond = BI->getCondition();
  BasicBlock *TrueDest = BI->getSuccessor(0);
  BasicBlock *FalseDest = BI->getSuccessor(1);

  auto &DL = BB->getDataLayout();
  bool TrueDestIsSafe = false;
  bool FalseDestIsSafe = false;

  // True dest is safe if BranchCond => GuardCond.
  auto Impl = isImpliedCondition(BranchCond, GuardCond, DL);
  if (Impl && *Impl)
    TrueDestIsSafe = true;
  else {
    // False dest is safe if !BranchCond => GuardCond.
    Impl = isImpliedCondition(BranchCond, GuardCond, DL, /* LHSIsTrue */ false);
    if (Impl && *Impl)
      FalseDestIsSafe = true;
  }

  if (!TrueDestIsSafe && !FalseDestIsSafe)
    return false;

  // At most one of the two flags is set here, so the two selections below
  // always pick different successors: the "safe" side needs no guard, the
  // other side keeps it.
  BasicBlock *PredUnguardedBlock = TrueDestIsSafe ? TrueDest : FalseDest;
  BasicBlock *PredGuardedBlock = FalseDestIsSafe ? TrueDest : FalseDest;

  ValueToValueMapTy UnguardedMapping, GuardedMapping;
  Instruction *AfterGuard = Guard->getNextNode();
  // The cost covers BB's instructions up to (not including) AfterGuard.
  unsigned Cost =
      getJumpThreadDuplicationCost(TTI, BB, AfterGuard, BBDupThreshold);
  if (Cost > BBDupThreshold)
    return false;
  // Duplicate all instructions before the guard and the guard itself to the
  // branch where implication is not proved.
  BasicBlock *GuardedBlock = DuplicateInstructionsInSplitBetween(
      BB, PredGuardedBlock, AfterGuard, GuardedMapping, *DTU);
  assert(GuardedBlock && "Could not create the guarded block?");
  // Duplicate all instructions before the guard in the unguarded branch.
  // Since we have successfully duplicated the guarded block and this block
  // has fewer instructions, we expect it to succeed.
  BasicBlock *UnguardedBlock = DuplicateInstructionsInSplitBetween(
      BB, PredUnguardedBlock, Guard, UnguardedMapping, *DTU);
  assert(UnguardedBlock && "Could not create the unguarded block?");
  LLVM_DEBUG(dbgs() << "Moved guard " << *Guard << " to block "
                    << GuardedBlock->getName() << "\n");
  // Some instructions before the guard may still have uses. For them, we need
  // to create Phi nodes merging their copies in both guarded and unguarded
  // branches. Those instructions that have no uses can be just removed.
  // Collect every non-PHI instruction of BB up to and including the guard.
  SmallVector<Instruction *, 4> ToRemove;
  for (auto BI = BB->begin(); &*BI != AfterGuard; ++BI)
    if (!isa<PHINode>(&*BI))
      ToRemove.push_back(&*BI);

  BasicBlock::iterator InsertionPoint = BB->getFirstInsertionPt();
  assert(InsertionPoint != BB->end() && "Empty block?");
  // Substitute with Phis & remove.
  // The list is processed back to front, i.e. later instructions are erased
  // before the earlier instructions they may use.
  for (auto *Inst : reverse(ToRemove)) {
    if (!Inst->use_empty()) {
      PHINode *NewPN = PHINode::Create(Inst->getType(), 2);
      NewPN->addIncoming(UnguardedMapping[Inst], UnguardedBlock);
      NewPN->addIncoming(GuardedMapping[Inst], GuardedBlock);
      NewPN->setDebugLoc(Inst->getDebugLoc());
      NewPN->insertBefore(InsertionPoint);
      Inst->replaceAllUsesWith(NewPN);
    }
    Inst->dropDbgRecords();
    Inst->eraseFromParent();
  }
  return true;
}


/// Build the set of analyses this pass reports as preserved: the dominator
/// tree analysis and the lazy value analysis.
PreservedAnalyses JumpThreadingPass::getPreservedAnalysis() const {
  PreservedAnalyses Preserved;
  Preserved.preserve<DominatorTreeAnalysis>();
  Preserved.preserve<LazyValueAnalysis>();

  // TODO: BPI/BFI should be listed here as well; that becomes possible once
  // every code path of the pass keeps them up to date.
  // TODO: It would also be good to verify BPI/BFI consistency.
  return Preserved;
}


template <typename AnalysisT>

typename AnalysisT::Result *JumpThreadingPass::runExternalAnalysis() {

  assert(FAM && "Can't run external analysis without FunctionAnalysisManager");


  // If there were no changes since last call to 'runExternalAnalysis' then all

  // analysis is either up to date or explicitly invalidated. Just go ahead and

  // run the "external" analysis.

  if (!ChangedSinceLastAnalysisUpdate) {

    assert(!DTU->hasPendingUpdates() &&

           "Lost update of 'ChangedSinceLastAnalysisUpdate'?");

    // Run the "external" analysis.

    return &FAM->getResult<AnalysisT>(*F);

  }

  ChangedSinceLastAnalysisUpdate = false;


  auto PA = getPreservedAnalysis();

  // TODO: This shouldn't be needed once 'getPreservedAnalysis' reports BPI/BFI

  // as preserved.

  PA.preserve<BranchProbabilityAnalysis>();

  PA.preserve<BlockFrequencyAnalysis>();

  // Report everything except explicitly preserved as invalid.

  FAM->invalidate(*F, PA);

  // Update DT/PDT.

  DTU->flush();

  // Make sure DT/PDT are valid before running "external" analysis.

  assert(DTU->getDomTree().verify(DominatorTree::VerificationLevel::Fast));

  assert((!DTU->hasPostDomTree() ||

          DTU->getPostDomTree().verify(

              PostDominatorTree::VerificationLevel::Fast)));

  // Run the "external" analysis.

  auto *Result = &FAM->getResult<AnalysisT>(*F);

  // Update analysis JumpThreading depends on and not explicitly preserved.

  TTI = &FAM->getResult<TargetIRAnalysis>(*F);

  TLI = &FAM->getResult<TargetLibraryAnalysis>(*F);

  AA = &FAM->getResult<AAManager>(*F);


  return Result;

}


/// Return the BPI pointer held by the pass. On first use it is initialised
/// from the analysis manager's cached result, without running the analysis.
BranchProbabilityInfo *JumpThreadingPass::getBPI() {
  if (BPI)
    return *BPI;

  assert(FAM && "Can't create BPI without FunctionAnalysisManager");
  BPI = FAM->getCachedResult<BranchProbabilityAnalysis>(*F);
  return *BPI;
}


/// Return the BFI pointer held by the pass. On first use it is initialised
/// from the analysis manager's cached result, without running the analysis.
BlockFrequencyInfo *JumpThreadingPass::getBFI() {
  if (BFI)
    return *BFI;

  assert(FAM && "Can't create BFI without FunctionAnalysisManager");
  BFI = FAM->getCachedResult<BlockFrequencyAnalysis>(*F);
  return *BFI;
}


// A note on the validity of BPI/BFI: JumpThreading tries to keep BPI/BFI up
// to date while it transforms the function, so an already cached instance is
// updated in place. If none is cached, a new instance is computed on demand
// (and is up to date by definition).
//
// Returns the available BPI if there is one. Otherwise the analysis is run
// when Force is set; without Force the stored (null) value is returned.
BranchProbabilityInfo *JumpThreadingPass::getOrCreateBPI(bool Force) {
  if (auto *Existing = getBPI())
    return Existing;

  if (Force)
    BPI = runExternalAnalysis<BranchProbabilityAnalysis>();

  return *BPI;
}


/// Return the available BFI if there is one. Otherwise the analysis is run
/// when Force is set; without Force the stored (null) value is returned.
BlockFrequencyInfo *JumpThreadingPass::getOrCreateBFI(bool Force) {
  if (auto *Existing = getBFI())
    return Existing;

  if (Force)
    BFI = runExternalAnalysis<BlockFrequencyAnalysis>();

  return *BFI;
}

PHI
Rewrite undef for PHI
Definition: AMDGPURewriteUndefForPHI.cpp:100

ToRemove
ReachingDefAnalysis InstSet & ToRemove
Definition: ARMLowOverheadLoops.cpp:531

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

AliasAnalysis.h

CFG.h

GuardUtils.h

getParent
static const Function * getParent(const Value *V)
Definition: BasicAliasAnalysis.cpp:863

BasicBlockUtils.h

BlockFrequencyInfo.h

BlockFrequency.h

From
BlockVerifier::State From
Definition: BlockVerifier.cpp:57

BranchProbabilityInfo.h

BranchProbability.h

Casting.h

Cloning.h

CommandLine.h

ConstantFolding.h

ConstantRange.h

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

DataLayout.h

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:353

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition: Debug.h:106

DenseMap.h
This file defines the DenseMap class.

Dominators.h

Size
uint64_t Size
Definition: ELFObjHandler.cpp:81

GlobalsModRef.h
This is the interface for a simple mod/ref and alias analysis over globals.

BasicBlock.h

CFG.h
This file provides various utilities for inspecting and working with the control flow graph in LLVM I...

Constant.h

Function.h

Instruction.h

IntrinsicInst.h

Module.h
Module.h This file contains the declarations for the Module class.

PassManager.h
This header defines various interfaces for pass management in LLVM.

Type.h

Use.h
This defines the Use class.

Value.h

InstrTypes.h

InstructionSimplify.h

Instructions.h

Intrinsics.h

getBestDestForJumpOnUndef
static unsigned getBestDestForJumpOnUndef(BasicBlock *BB)
GetBestDestForBranchOnUndef - If we determine that the specified block ends in an undefined jump,...
Definition: JumpThreading.cpp:917

PhiDuplicateThreshold
static cl::opt< unsigned > PhiDuplicateThreshold("jump-threading-phi-threshold", cl::desc("Max PHIs in BB to duplicate for jump threading"), cl::init(76), cl::Hidden)

replaceFoldableUses
static bool replaceFoldableUses(Instruction *Cond, Value *ToVal, BasicBlock *KnownAtEndOfBB)
Definition: JumpThreading.cpp:391

BBDuplicateThreshold
static cl::opt< unsigned > BBDuplicateThreshold("jump-threading-threshold", cl::desc("Max block size to duplicate for jump threading"), cl::init(6), cl::Hidden)

ThreadAcrossLoopHeaders
static cl::opt< bool > ThreadAcrossLoopHeaders("jump-threading-across-loop-headers", cl::desc("Allow JumpThreading to thread across loop headers, for testing"), cl::init(false), cl::Hidden)

getJumpThreadDuplicationCost
static unsigned getJumpThreadDuplicationCost(const TargetTransformInfo *TTI, BasicBlock *BB, Instruction *StopAt, unsigned Threshold)
Return the cost of duplicating a piece of this block from first non-phi and before StopAt instruction...
Definition: JumpThreading.cpp:425

addPHINodeEntriesForMappedBlock
static void addPHINodeEntriesForMappedBlock(BasicBlock *PHIBB, BasicBlock *OldPred, BasicBlock *NewPred, ValueToValueMapTy &ValueMap)
addPHINodeEntriesForMappedBlock - We're adding 'NewPred' as a new predecessor to the PHIBB block.
Definition: JumpThreading.cpp:1866

findMostPopularDest
static BasicBlock * findMostPopularDest(BasicBlock *BB, const SmallVectorImpl< std::pair< BasicBlock *, BasicBlock * > > &PredToDestList)
findMostPopularDest - The specified list contains multiple possible threadable destinations.
Definition: JumpThreading.cpp:1465

getKnownConstant
static Constant * getKnownConstant(Value *Val, ConstantPreference Preference)
getKnownConstant - Helper method to determine if we can thread over a terminator with the given value...
Definition: JumpThreading.cpp:537

ImplicationSearchThreshold
static cl::opt< unsigned > ImplicationSearchThreshold("jump-threading-implication-search-threshold", cl::desc("The number of predecessors to search for a stronger " "condition to use to thread over a weaker condition"), cl::init(3), cl::Hidden)

isOpDefinedInBlock
static bool isOpDefinedInBlock(Value *Op, BasicBlock *BB)
Return true if Op is an instruction defined in the given block.
Definition: JumpThreading.cpp:1210

updatePredecessorProfileMetadata
static void updatePredecessorProfileMetadata(PHINode *PN, BasicBlock *BB)
Definition: JumpThreading.cpp:147

hasAddressTakenAndUsed
static bool hasAddressTakenAndUsed(BasicBlock *BB)
Definition: JumpThreading.cpp:935

JumpThreading.h
See the comments on JumpThreadingPass.

LLVMContext.h

LazyValueInfo.h

isZero
static bool isZero(Value *V, const DataLayout &DL, DominatorTree *DT, AssumptionCache *AC)
Definition: Lint.cpp:533

Loads.h

LoopInfo.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

MDBuilder.h

MapVector.h
This file implements a map that provides insertion order iteration.

MemoryLocation.h
This file provides utility analysis objects describing memory locations.

Metadata.h
This file contains the declarations for metadata subclasses.

P
#define P(N)

verify
ppc ctr loops verify
Definition: PPCCTRLoopsVerify.cpp:72

PatternMatch.h

PostDominators.h

ProfDataUtils.h
This file contains the declarations for profiling metadata utility functions.

Cond
const SmallVectorImpl< MachineOperand > & Cond
Definition: RISCVRedundantCopyElimination.cpp:75

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

SSAUpdater.h

STLExtras.h
This file contains some templates that are useful if you are working with the STL at all.

SmallPtrSet.h
This file defines the SmallPtrSet class.

SmallVector.h
This file defines the SmallVector class.

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

STATISTIC
#define STATISTIC(VARNAME, DESC)
Definition: Statistic.h:166

TargetLibraryInfo.h

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

Local.h

ValueMapper.h

ValueTracking.h

RHS
Value * RHS
Definition: X86PartialReduction.cpp:74

LHS
Value * LHS
Definition: X86PartialReduction.cpp:73

IV
static const uint32_t IV[8]
Definition: blake3_impl.h:78

T

llvm::AAManager
A manager for alias analyses.
Definition: AliasAnalysis.h:927

llvm::AAResults
Definition: AliasAnalysis.h:314

llvm::AnalysisManager
A container for analyses that lazily runs them and caches their results.
Definition: PassManager.h:253

llvm::AnalysisManager::invalidate
void invalidate(IRUnitT &IR, const PreservedAnalyses &PA)
Invalidate cached analyses for an IR unit.
Definition: PassManagerImpl.h:172

llvm::AnalysisManager::getCachedResult
PassT::Result * getCachedResult(IRUnitT &IR) const
Get the cached result of an analysis pass for a given IR unit.
Definition: PassManager.h:429

llvm::AnalysisManager::getResult
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Definition: PassManager.h:410

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:61

llvm::BasicBlock::end
iterator end()
Definition: BasicBlock.h:461

llvm::BasicBlock::begin
iterator begin()
Instruction iterator methods.
Definition: BasicBlock.h:448

llvm::BasicBlock::phis
iterator_range< const_phi_iterator > phis() const
Returns a range that iterates over the phis in the basic block.
Definition: BasicBlock.h:517

llvm::BasicBlock::getFirstInsertionPt
const_iterator getFirstInsertionPt() const
Returns an iterator to the first instruction in this block that is suitable for inserting a non-PHI i...
Definition: BasicBlock.cpp:416

llvm::BasicBlock::createMarker
DbgMarker * createMarker(Instruction *I)
Attach a DbgMarker to the given instruction.
Definition: BasicBlock.cpp:52

llvm::BasicBlock::hasAddressTaken
bool hasAddressTaken() const
Returns true if there are any uses of this basic block other than direct branches,...
Definition: BasicBlock.h:658

llvm::BasicBlock::const_iterator
InstListType::const_iterator const_iterator
Definition: BasicBlock.h:178

llvm::BasicBlock::front
const Instruction & front() const
Definition: BasicBlock.h:471

llvm::BasicBlock::Create
static BasicBlock * Create(LLVMContext &Context, const Twine &Name="", Function *Parent=nullptr, BasicBlock *InsertBefore=nullptr)
Creates a new BasicBlock.
Definition: BasicBlock.h:212

llvm::BasicBlock::moveAfter
void moveAfter(BasicBlock *MovePos)
Unlink this basic block from its current function and insert it right after MovePos in the function M...
Definition: BasicBlock.cpp:287

llvm::BasicBlock::hasNPredecessors
bool hasNPredecessors(unsigned N) const
Return true if this block has exactly N predecessors.
Definition: BasicBlock.cpp:481

llvm::BasicBlock::getSinglePredecessor
const BasicBlock * getSinglePredecessor() const
Return the predecessor of this block if it has a single predecessor block.
Definition: BasicBlock.cpp:459

llvm::BasicBlock::getParent
const Function * getParent() const
Return the enclosing method, or null if none.
Definition: BasicBlock.h:219

llvm::BasicBlock::getDataLayout
const DataLayout & getDataLayout() const
Get the data layout of the module this basic block belongs to.
Definition: BasicBlock.cpp:296

llvm::BasicBlock::getMarker
DbgMarker * getMarker(InstListType::iterator It)
Return the DbgMarker for the position given by It, so that DbgRecords can be inserted there.
Definition: BasicBlock.cpp:1078

llvm::BasicBlock::iterator
InstListType::iterator iterator
Instruction iterators...
Definition: BasicBlock.h:177

llvm::BasicBlock::getContext
LLVMContext & getContext() const
Get the context in which this basic block lives.
Definition: BasicBlock.cpp:168

llvm::BasicBlock::isLandingPad
bool isLandingPad() const
Return true if this basic block is a landing pad.
Definition: BasicBlock.cpp:677

llvm::BasicBlock::isEHPad
bool isEHPad() const
Return true if this basic block is an exception handling block.
Definition: BasicBlock.h:675

llvm::BasicBlock::getTerminator
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
Definition: BasicBlock.h:239

llvm::BasicBlock::removePredecessor
void removePredecessor(BasicBlock *Pred, bool KeepOneInputPHIs=false)
Update PHI nodes in this BasicBlock before removal of predecessor Pred.
Definition: BasicBlock.cpp:516

llvm::BatchAAResults
This class is a wrapper over an AAResults, and it is intended to be used only when there are no IR ch...
Definition: AliasAnalysis.h:630

llvm::BatchAAResults::disableDominatorTree
void disableDominatorTree()
Disable the use of the dominator tree during alias analysis queries.
Definition: AliasAnalysis.h:683

llvm::BinaryOperator
Definition: InstrTypes.h:170

llvm::BlockAddress
The address of a basic block.
Definition: Constants.h:893

llvm::BlockAddress::get
static BlockAddress * get(Function *F, BasicBlock *BB)
Return a BlockAddress for the specified function and basic block.
Definition: Constants.cpp:1897

llvm::BlockFrequencyAnalysis
Analysis pass which computes BlockFrequencyInfo.
Definition: BlockFrequencyInfo.h:114

llvm::BlockFrequencyInfo
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Definition: BlockFrequencyInfo.h:37

llvm::BlockFrequency
Definition: BlockFrequency.h:26

llvm::BranchInst
Conditional or Unconditional Branch instruction.
Definition: Instructions.h:3011

llvm::BranchInst::isConditional
bool isConditional() const
Definition: Instructions.h:3085

llvm::BranchInst::getNumSuccessors
unsigned getNumSuccessors() const
Definition: Instructions.h:3097

llvm::BranchInst::Create
static BranchInst * Create(BasicBlock *IfTrue, InsertPosition InsertBefore=nullptr)
Definition: Instructions.h:3067

llvm::BranchInst::getSuccessor
BasicBlock * getSuccessor(unsigned i) const
Definition: Instructions.h:3099

llvm::BranchInst::isUnconditional
bool isUnconditional() const
Definition: Instructions.h:3084

llvm::BranchInst::getCondition
Value * getCondition() const
Definition: Instructions.h:3087

llvm::BranchProbabilityAnalysis
Analysis pass which computes BranchProbabilityInfo.
Definition: BranchProbabilityInfo.h:425

llvm::BranchProbabilityInfo
Analysis providing branch probability information.
Definition: BranchProbabilityInfo.h:112

llvm::BranchProbabilityInfo::setEdgeProbability
void setEdgeProbability(const BasicBlock *Src, const SmallVectorImpl< BranchProbability > &Probs)
Set the raw probabilities for all edges from the given block.
Definition: BranchProbabilityInfo.cpp:1131

llvm::BranchProbabilityInfo::getEdgeProbability
BranchProbability getEdgeProbability(const BasicBlock *Src, unsigned IndexInSuccessors) const
Get an edge's probability, relative to other out-edges of the Src.
Definition: BranchProbabilityInfo.cpp:1094

llvm::BranchProbabilityInfo::copyEdgeProbabilities
void copyEdgeProbabilities(BasicBlock *Src, BasicBlock *Dst)
Copy outgoing edge probabilities from Src to Dst.
Definition: BranchProbabilityInfo.cpp:1158

llvm::BranchProbability
Definition: BranchProbability.h:30

llvm::BranchProbability::getBranchProbability
static BranchProbability getBranchProbability(uint64_t Numerator, uint64_t Denominator)
Definition: BranchProbability.cpp:53

llvm::BranchProbability::getNumerator
uint32_t getNumerator() const
Definition: BranchProbability.h:65

llvm::BranchProbability::getCompl
BranchProbability getCompl() const
Definition: BranchProbability.h:69

llvm::BranchProbability::normalizeProbabilities
static void normalizeProbabilities(ProbabilityIter Begin, ProbabilityIter End)
Definition: BranchProbability.h:205

llvm::CallBase::getArgOperand
Value * getArgOperand(unsigned i) const
Definition: InstrTypes.h:1294

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1474

llvm::CastInst
This is the base class for all instructions that perform data casts.
Definition: InstrTypes.h:444

llvm::CastInst::CreateBitOrPointerCast
static CastInst * CreateBitOrPointerCast(Value *S, Type *Ty, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Create a BitCast, a PtrToInt, or an IntToPtr cast instruction.
Definition: Instructions.cpp:3047

llvm::CmpInst
This class is the base class for the comparison instructions.
Definition: InstrTypes.h:661

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition: InstrTypes.h:673

llvm::CmpInst::getPredicate
Predicate getPredicate() const
Return the predicate for this instruction.
Definition: InstrTypes.h:763

llvm::CmpPredicate
An abstraction over a floating-point predicate, and a pack of an integer predicate with samesign info...
Definition: CmpPredicate.h:22

llvm::ConstantExpr::getNot
static Constant * getNot(Constant *C)
Definition: Constants.cpp:2631

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition: Constants.h:83

llvm::ConstantInt::isOne
bool isOne() const
This is just a convenience method to make client code smaller for a common case.
Definition: Constants.h:214

llvm::ConstantInt::getTrue
static ConstantInt * getTrue(LLVMContext &Context)
Definition: Constants.cpp:866

llvm::ConstantInt::isZero
bool isZero() const
This is just a convenience method to make client code smaller for a common case.
Definition: Constants.h:208

llvm::ConstantInt::getFalse
static ConstantInt * getFalse(LLVMContext &Context)
Definition: Constants.cpp:873

llvm::ConstantInt::getValue
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition: Constants.h:148

llvm::ConstantRange
This class represents a range of values.
Definition: ConstantRange.h:47

llvm::ConstantRange::add
ConstantRange add(const ConstantRange &Other) const
Return a new range representing the possible values resulting from an addition of a value in this ran...
Definition: ConstantRange.cpp:1067

llvm::ConstantRange::makeExactICmpRegion
static ConstantRange makeExactICmpRegion(CmpInst::Predicate Pred, const APInt &Other)
Produce the exact range such that all values in the returned range satisfy the given predicate with a...
Definition: ConstantRange.cpp:158

llvm::ConstantRange::inverse
ConstantRange inverse() const
Return a new range that is the logical not of the current set.
Definition: ConstantRange.cpp:1871

llvm::ConstantRange::contains
bool contains(const APInt &Val) const
Return true if the specified value is in the set.
Definition: ConstantRange.cpp:507

llvm::Constant
This is an important base class in LLVM.
Definition: Constant.h:42

llvm::Constant::removeDeadConstantUsers
void removeDeadConstantUsers() const
If there are any dead constant users dangling off of this constant, remove them.
Definition: Constants.cpp:739

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:32

llvm::DataLayout
A parsed version of the target data layout string and methods for querying it.
Definition: DataLayout.h:63

llvm::DbgMarker
Per-instruction record of debug-info.
Definition: DebugProgramInstruction.h:575

llvm::DbgMarker::cloneDebugInfoFrom
iterator_range< simple_ilist< DbgRecord >::iterator > cloneDebugInfoFrom(DbgMarker *From, std::optional< simple_ilist< DbgRecord >::iterator > FromHere, bool InsertAtHead=false)
Clone all DbgMarkers from From into this marker.
Definition: DebugProgramInstruction.cpp:692

llvm::DbgRecord::getParent
const BasicBlock * getParent() const
Definition: DebugProgramInstruction.cpp:507

llvm::DbgValueInst
This represents the llvm.dbg.value instruction.
Definition: IntrinsicInst.h:468

llvm::DbgVariableRecord
Record of a variable value-assignment, aka a non instruction representation of the dbg....
Definition: DebugProgramInstruction.h:262

llvm::DenseMapBase::lookup
ValueT lookup(const_arg_type_t< KeyT > Val) const
lookup - Return the entry for the specified key, or a default constructed value if no such entry exis...
Definition: DenseMap.h:194

llvm::DenseMapBase::insert
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition: DenseMap.h:211

llvm::DenseMap
Definition: DenseMap.h:727

llvm::DominatorTreeAnalysis
Analysis pass which computes a DominatorTree.
Definition: Dominators.h:279

llvm::DominatorTreeBase< BasicBlock, false >::Delete
static constexpr UpdateKind Delete
Definition: GenericDomTree.h:253

llvm::DominatorTreeBase< BasicBlock, false >::Insert
static constexpr UpdateKind Insert
Definition: GenericDomTree.h:252

llvm::DominatorTreeBase::VerificationLevel::Full
@ Full

llvm::DominatorTreeBase::VerificationLevel::Fast
@ Fast

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition: Dominators.h:162

llvm::DominatorTree::isReachableFromEntry
bool isReachableFromEntry(const Use &U) const
Provide an overload for a Use.
Definition: Dominators.cpp:321

llvm::FreezeInst
This class represents a freeze function that returns random concrete value if an operand is either a ...
Definition: Instructions.h:5083

llvm::Function
Definition: Function.h:63

llvm::Function::getEntryBlock
const BasicBlock & getEntryBlock() const
Definition: Function.h:809

llvm::Function::hasFnAttribute
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
Definition: Function.cpp:731

llvm::GenericDomTreeUpdater::flush
void flush()
Apply all pending updates to available trees and flush all BasicBlocks awaiting deletion.
Definition: GenericDomTreeUpdater.h:202

llvm::GlobalValue::getParent
Module * getParent()
Get the module that this global value is contained inside of...
Definition: GlobalValue.h:656

llvm::ICmpInst
This instruction compares its operands according to the predicate given to the constructor.
Definition: Instructions.h:1158

llvm::IndirectBrInst
Indirect Branch Instruction.
Definition: Instructions.h:3539

llvm::InstructionCost
Definition: InstructionCost.h:29

llvm::Instruction
Definition: Instruction.h:68

llvm::Instruction::removeFromParent
void removeFromParent()
This method unlinks 'this' from the containing basic block, but does not delete it.
Definition: Instruction.cpp:80

llvm::Instruction::cloneDebugInfoFrom
iterator_range< simple_ilist< DbgRecord >::iterator > cloneDebugInfoFrom(const Instruction *From, std::optional< simple_ilist< DbgRecord >::iterator > FromHere=std::nullopt, bool InsertAtHead=false)
Clone any debug-info attached to From onto this instruction.
Definition: Instruction.cpp:235

llvm::Instruction::getNumSuccessors
unsigned getNumSuccessors() const LLVM_READONLY
Return the number of successors that this instruction has.
Definition: Instruction.cpp:1263

llvm::Instruction::insertBefore
void insertBefore(Instruction *InsertPos)
Insert an unlinked instruction into a basic block immediately before the specified instruction.
Definition: Instruction.cpp:99

llvm::Instruction::getDebugLoc
const DebugLoc & getDebugLoc() const
Return the debug location for this node as a DebugLoc.
Definition: Instruction.h:475

llvm::Instruction::setAAMetadata
void setAAMetadata(const AAMDNodes &N)
Sets the AA metadata on this instruction from the AAMDNodes structure.
Definition: Metadata.cpp:1764

llvm::Instruction::isAtomic
bool isAtomic() const LLVM_READONLY
Return true if this instruction has an AtomicOrdering of unordered or higher.
Definition: Instruction.cpp:1019

llvm::Instruction::eraseFromParent
InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
Definition: Instruction.cpp:94

llvm::Instruction::getSuccessor
BasicBlock * getSuccessor(unsigned Idx) const LLVM_READONLY
Return the specified successor. This instruction must be a terminator.
Definition: Instruction.cpp:1275

llvm::Instruction::getAAMetadata
AAMDNodes getAAMetadata() const
Returns the AA metadata for this instruction.
Definition: Metadata.cpp:1750

llvm::Instruction::getOpcode
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
Definition: Instruction.h:274

llvm::Instruction::setDebugLoc
void setDebugLoc(DebugLoc Loc)
Set the debug location information for this instruction.
Definition: Instruction.h:472

llvm::Instruction::setSuccessor
void setSuccessor(unsigned Idx, BasicBlock *BB)
Update the specified successor to point at the provided block.
Definition: Instruction.cpp:1287

llvm::Instruction::getDataLayout
const DataLayout & getDataLayout() const
Get the data layout of the module this instruction belongs to.
Definition: Instruction.cpp:76

llvm::Instruction::isSpecialTerminator
bool isSpecialTerminator() const
Definition: Instruction.h:285

llvm::Instruction::insertInto
InstListType::iterator insertInto(BasicBlock *ParentBB, InstListType::iterator It)
Inserts an unlinked instruction into ParentBB at position It and returns the iterator of the inserted...
Definition: Instruction.cpp:117

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:48

llvm::JumpThreadingPass::simplifyPartiallyRedundantLoad
bool simplifyPartiallyRedundantLoad(LoadInst *LI)
simplifyPartiallyRedundantLoad - If LoadI is an obviously partially redundant load instruction,...
Definition: JumpThreading.cpp:1221

llvm::JumpThreadingPass::processBranchOnXOR
bool processBranchOnXOR(BinaryOperator *BO)
processBranchOnXOR - We have an otherwise unthreadable conditional branch on a xor instruction in the...
Definition: JumpThreading.cpp:1752

llvm::JumpThreadingPass::processGuards
bool processGuards(BasicBlock *BB)
Try to propagate a guard from the current BB into one of its predecessors in case if another branch o...
Definition: JumpThreading.cpp:3012

llvm::JumpThreadingPass::updateSSA
void updateSSA(BasicBlock *BB, BasicBlock *NewBB, ValueToValueMapTy &ValueMapping)
Update the SSA form.
Definition: JumpThreading.cpp:1938

llvm::JumpThreadingPass::computeValueKnownInPredecessors
bool computeValueKnownInPredecessors(Value *V, BasicBlock *BB, jumpthreading::PredValueInfo &Result, jumpthreading::ConstantPreference Preference, Instruction *CxtI=nullptr)
Definition: JumpThreading.h:135

llvm::JumpThreadingPass::findLoopHeaders
void findLoopHeaders(Function &F)
findLoopHeaders - We do not want jump threading to turn proper loop structures into irreducible loops...
Definition: JumpThreading.cpp:524

llvm::JumpThreadingPass::maybeMergeBasicBlockIntoOnlyPred
bool maybeMergeBasicBlockIntoOnlyPred(BasicBlock *BB)
Merge basic block BB into its sole predecessor if possible.
Definition: JumpThreading.cpp:1887

llvm::JumpThreadingPass::JumpThreadingPass
JumpThreadingPass(int T=-1)
Definition: JumpThreading.cpp:108

llvm::JumpThreadingPass::cloneInstructions
void cloneInstructions(ValueToValueMapTy &ValueMapping, BasicBlock::iterator BI, BasicBlock::iterator BE, BasicBlock *NewBB, BasicBlock *PredBB)
Clone instructions in range [BI, BE) to NewBB.
Definition: JumpThreading.cpp:2001

llvm::JumpThreadingPass::run
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
Definition: JumpThreading.cpp:236

llvm::JumpThreadingPass::runImpl
bool runImpl(Function &F, FunctionAnalysisManager *FAM, TargetLibraryInfo *TLI, TargetTransformInfo *TTI, LazyValueInfo *LVI, AAResults *AA, std::unique_ptr< DomTreeUpdater > DTU, std::optional< BlockFrequencyInfo * > BFI, std::optional< BranchProbabilityInfo * > BPI)
Definition: JumpThreading.cpp:280

llvm::JumpThreadingPass::evaluateOnPredecessorEdge
Constant * evaluateOnPredecessorEdge(BasicBlock *BB, BasicBlock *PredPredBB, Value *cond, const DataLayout &DL)
Definition: JumpThreading.cpp:1497

llvm::JumpThreadingPass::processBranchOnPHI
bool processBranchOnPHI(PHINode *PN)
processBranchOnPHI - We have an otherwise unthreadable conditional branch on a PHI node (or freeze PH...
Definition: JumpThreading.cpp:1720

llvm::JumpThreadingPass::maybethreadThroughTwoBasicBlocks
bool maybethreadThroughTwoBasicBlocks(BasicBlock *BB, Value *Cond)
Attempt to thread through two successive basic blocks.
Definition: JumpThreading.cpp:2115

llvm::JumpThreadingPass::computeValueKnownInPredecessorsImpl
bool computeValueKnownInPredecessorsImpl(Value *V, BasicBlock *BB, jumpthreading::PredValueInfo &Result, jumpthreading::ConstantPreference Preference, SmallPtrSet< Value *, 4 > &RecursionSet, Instruction *CxtI=nullptr)
computeValueKnownInPredecessors - Given a basic block BB and a value V, see if we can infer that the ...
Definition: JumpThreading.cpp:557

llvm::JumpThreadingPass::unfoldSelectInstr
void unfoldSelectInstr(BasicBlock *Pred, BasicBlock *BB, SelectInst *SI, PHINode *SIUse, unsigned Idx)
Definition: JumpThreading.cpp:2749

llvm::JumpThreadingPass::getDomTreeUpdater
DomTreeUpdater * getDomTreeUpdater() const
Definition: JumpThreading.h:113

llvm::JumpThreadingPass::processThreadableEdges
bool processThreadableEdges(Value *Cond, BasicBlock *BB, jumpthreading::ConstantPreference Preference, Instruction *CxtI=nullptr)
Definition: JumpThreading.cpp:1539

llvm::JumpThreadingPass::processBlock
bool processBlock(BasicBlock *BB)
processBlock - If there are any predecessors whose control can be threaded through to a successor,...
Definition: JumpThreading.cpp:947

llvm::JumpThreadingPass::processImpliedCondition
bool processImpliedCondition(BasicBlock *BB)
Definition: JumpThreading.cpp:1144

llvm::JumpThreadingPass::duplicateCondBranchOnPHIIntoPred
bool duplicateCondBranchOnPHIIntoPred(BasicBlock *BB, const SmallVectorImpl< BasicBlock * > &PredBBs)
duplicateCondBranchOnPHIIntoPred - PredBB contains an unconditional branch to BB which contains an i1...
Definition: JumpThreading.cpp:2613

llvm::JumpThreadingPass::threadThroughTwoBasicBlocks
void threadThroughTwoBasicBlocks(BasicBlock *PredPredBB, BasicBlock *PredBB, BasicBlock *BB, BasicBlock *SuccBB)
Definition: JumpThreading.cpp:2256

llvm::JumpThreadingPass::tryThreadEdge
bool tryThreadEdge(BasicBlock *BB, const SmallVectorImpl< BasicBlock * > &PredBBs, BasicBlock *SuccBB)
tryThreadEdge - Thread an edge if it's safe and profitable to do so.
Definition: JumpThreading.cpp:2329

llvm::JumpThreadingPass::tryToUnfoldSelect
bool tryToUnfoldSelect(CmpInst *CondCmp, BasicBlock *BB)
tryToUnfoldSelect - Look for blocks of the form bb1: a = select br bb2
Definition: JumpThreading.cpp:2850

llvm::JumpThreadingPass::tryToUnfoldSelectInCurrBB
bool tryToUnfoldSelectInCurrBB(BasicBlock *BB)
tryToUnfoldSelectInCurrBB - Look for PHI/Select or PHI/CMP/Select in the same BB in the form bb: p = ...
Definition: JumpThreading.cpp:2909

llvm::JumpThreadingPass::threadEdge
void threadEdge(BasicBlock *BB, const SmallVectorImpl< BasicBlock * > &PredBBs, BasicBlock *SuccBB)
threadEdge - We have decided that it is safe and profitable to factor the blocks in PredBBs to one pr...
Definition: JumpThreading.cpp:2368

llvm::JumpThreadingPass::threadGuard
bool threadGuard(BasicBlock *BB, IntrinsicInst *Guard, BranchInst *BI)
Try to propagate the guard from BB which is the lower block of a diamond to one of its branches,...
Definition: JumpThreading.cpp:3046

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67

llvm::LazyValueAnalysis
Analysis to compute lazy value information.
Definition: LazyValueInfo.h:139

llvm::LazyValueInfo
This pass computes, caches, and vends lazy value constraint information.
Definition: LazyValueInfo.h:32

llvm::LazyValueInfo::eraseBlock
void eraseBlock(BasicBlock *BB)
Inform the analysis cache that we have erased a block.
Definition: LazyValueInfo.cpp:2003

llvm::LazyValueInfo::threadEdge
void threadEdge(BasicBlock *PredBB, BasicBlock *OldSucc, BasicBlock *NewSucc)
Inform the analysis cache that we have threaded an edge from PredBB to OldSucc to be from PredBB to N...
Definition: LazyValueInfo.cpp:1992

llvm::LazyValueInfo::getPredicateOnEdge
Constant * getPredicateOnEdge(CmpInst::Predicate Pred, Value *V, Constant *C, BasicBlock *FromBB, BasicBlock *ToBB, Instruction *CxtI=nullptr)
Determine whether the specified value comparison with a constant is known to be true or false on the ...
Definition: LazyValueInfo.cpp:1847

llvm::LazyValueInfo::getConstantOnEdge
Constant * getConstantOnEdge(Value *V, BasicBlock *FromBB, BasicBlock *ToBB, Instruction *CxtI=nullptr)
Determine whether the specified value is known to be a constant on the specified edge.
Definition: LazyValueInfo.cpp:1777

llvm::LazyValueInfo::getConstantRangeOnEdge
ConstantRange getConstantRangeOnEdge(Value *V, BasicBlock *FromBB, BasicBlock *ToBB, Instruction *CxtI=nullptr)
Return the ConstantRange constraint that is known to hold for the specified value on the specified edg...
Definition: LazyValueInfo.cpp:1794

llvm::LazyValueInfo::getConstant
Constant * getConstant(Value *V, Instruction *CxtI)
Determine whether the specified value is known to be a constant at the specified instruction.
Definition: LazyValueInfo.cpp:1740

llvm::LazyValueInfo::forgetValue
void forgetValue(Value *V)
Remove information related to this value from the cache.
Definition: LazyValueInfo.cpp:1998

llvm::LazyValueInfo::getPredicateAt
Constant * getPredicateAt(CmpInst::Predicate Pred, Value *V, Constant *C, Instruction *CxtI, bool UseBlockValue)
Determine whether the specified value comparison with a constant is known to be true or false at the ...
Definition: LazyValueInfo.cpp:1858

llvm::LoadInst
An instruction for reading from memory.
Definition: Instructions.h:176

llvm::LoadInst::getOrdering
AtomicOrdering getOrdering() const
Returns the ordering constraint of this load instruction.
Definition: Instructions.h:220

llvm::LoadInst::isUnordered
bool isUnordered() const
Definition: Instructions.h:249

llvm::LoadInst::getSyncScopeID
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this load instruction.
Definition: Instructions.h:230

llvm::LoadInst::getAlign
Align getAlign() const
Return the alignment of the access that is being performed.
Definition: Instructions.h:211

llvm::LocationSize::precise
static LocationSize precise(uint64_t Value)
Definition: MemoryLocation.h:108

llvm::MDNode
Metadata node.
Definition: Metadata.h:1069

llvm::MapVector
This class implements a map that also provides access to all stored values in a deterministic order.
Definition: MapVector.h:36

llvm::MemoryLocation
Representation for a specific memory location.
Definition: MemoryLocation.h:227

llvm::PHINode
Definition: Instructions.h:2595

llvm::PHINode::addIncoming
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
Definition: Instructions.h:2730

llvm::PHINode::setIncomingValue
void setIncomingValue(unsigned i, Value *V)
Definition: Instructions.h:2673

llvm::PHINode::getIncomingValueForBlock
Value * getIncomingValueForBlock(const BasicBlock *BB) const
Definition: Instructions.h:2770

llvm::PHINode::getIncomingBlock
BasicBlock * getIncomingBlock(unsigned i) const
Return incoming basic block number i.
Definition: Instructions.h:2690

llvm::PHINode::getIncomingValue
Value * getIncomingValue(unsigned i) const
Return incoming value number x.
Definition: Instructions.h:2670

llvm::PHINode::getNumIncomingValues
unsigned getNumIncomingValues() const
Return the number of incoming edges.
Definition: Instructions.h:2666

llvm::PHINode::Create
static PHINode * Create(Type *Ty, unsigned NumReservedValues, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Constructors - NumReservedValues is a hint for the number of incoming edges that this phi node will h...
Definition: Instructions.h:2630

llvm::PoisonValue::get
static PoisonValue * get(Type *T)
Static factory methods - Return a 'poison' object of the specified type.
Definition: Constants.cpp:1878

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition: Analysis.h:111

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: Analysis.h:117

llvm::PreservedAnalyses::preserve
void preserve()
Mark an analysis as preserved.
Definition: Analysis.h:131

llvm::SSAUpdater
Helper class for SSA formation on a set of values defined in multiple blocks.
Definition: SSAUpdater.h:40

llvm::SSAUpdater::RewriteUse
void RewriteUse(Use &U)
Rewrite a use of the symbolic value.
Definition: SSAUpdater.cpp:187

llvm::SSAUpdater::Initialize
void Initialize(Type *Ty, StringRef Name)
Reset this object to get ready for a new set of SSA updates with type 'Ty'.
Definition: SSAUpdater.cpp:52

llvm::SSAUpdater::UpdateDebugValues
void UpdateDebugValues(Instruction *I)
Rewrite debug value intrinsics to conform to a new SSA form.
Definition: SSAUpdater.cpp:199

llvm::SSAUpdater::AddAvailableValue
void AddAvailableValue(BasicBlock *BB, Value *V)
Indicate that a rewritten value is available in the specified block with the specified value.
Definition: SSAUpdater.cpp:69

llvm::SelectInst
This class represents the LLVM 'select' instruction.
Definition: Instructions.h:1652

llvm::SmallPtrSetImplBase::size
size_type size() const
Definition: SmallPtrSet.h:94

llvm::SmallPtrSetImpl::count
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
Definition: SmallPtrSet.h:452

llvm::SmallPtrSetImpl::insert
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
Definition: SmallPtrSet.h:384

llvm::SmallPtrSet
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or fewer elements.
Definition: SmallPtrSet.h:519

llvm::SmallSet
SmallSet - This maintains a set of unique values, optimizing for the case when the set is small (less...
Definition: SmallSet.h:132

llvm::SmallSet::insert
std::pair< const_iterator, bool > insert(const T &V)
insert - Insert an element into the set if it isn't already there.
Definition: SmallSet.h:181

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:81

llvm::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:78

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:573

llvm::SmallVectorImpl::pop_back_val
T pop_back_val()
Definition: SmallVector.h:673

llvm::SmallVectorImpl::assign
void assign(size_type NumElts, ValueParamT Elt)
Definition: SmallVector.h:704

llvm::SmallVectorImpl::emplace_back
reference emplace_back(ArgTypes &&... Args)
Definition: SmallVector.h:937

llvm::SmallVectorImpl::clear
void clear()
Definition: SmallVector.h:610

llvm::SmallVectorImpl::resize
void resize(size_type N)
Definition: SmallVector.h:638

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:413

llvm::SmallVectorTemplateCommon::end
iterator end()
Definition: SmallVector.h:269

llvm::SmallVectorTemplateCommon::begin
iterator begin()
Definition: SmallVector.h:267

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196

llvm::SwitchInst
Multiway switch.
Definition: Instructions.h:3149

llvm::TargetIRAnalysis
Analysis pass providing the TargetTransformInfo.
Definition: TargetTransformInfo.h:3128

llvm::TargetLibraryAnalysis
Analysis pass providing the TargetLibraryInfo.
Definition: TargetLibraryInfo.h:614

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition: TargetLibraryInfo.h:280

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition: TargetTransformInfo.h:212

llvm::TargetTransformInfo::hasBranchDivergence
bool hasBranchDivergence(const Function *F=nullptr) const
Return true if branch divergence exists.
Definition: TargetTransformInfo.cpp:289

llvm::TargetTransformInfo::TCK_SizeAndLatency
@ TCK_SizeAndLatency
The weighted sum of size and latency.
Definition: TargetTransformInfo.h:261

llvm::TargetTransformInfo::TCC_Free
@ TCC_Free
Expected to fold away in lowering.
Definition: TargetTransformInfo.h:283

llvm::TargetTransformInfo::getInstructionCost
InstructionCost getInstructionCost(const User *U, ArrayRef< const Value * > Operands, TargetCostKind CostKind) const
Estimate the cost of a given IR user when lowered.
Definition: TargetTransformInfo.cpp:270

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::isVectorTy
bool isVectorTy() const
True if this is an instance of VectorType.
Definition: Type.h:270

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition: Type.h:237

llvm::UndefValue
'undef' values are things that do not have specified contents.
Definition: Constants.h:1412

llvm::UndefValue::get
static UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
Definition: Constants.cpp:1859

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition: Use.h:43

llvm::User
Definition: User.h:44

llvm::User::setOperand
void setOperand(unsigned i, Value *Val)
Definition: User.h:233

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition: User.h:228

llvm::ValueMapIterator
Definition: ValueMap.h:325

llvm::ValueMap< const Value *, WeakTrackingVH >

llvm::ValueMap::find
iterator find(const KeyT &Val)
Definition: ValueMap.h:155

llvm::ValueMap::end
iterator end()
Definition: ValueMap.h:135

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Value::DoPHITranslation
const Value * DoPHITranslation(const BasicBlock *CurBB, const BasicBlock *PredBB) const
Translate PHI node to its predecessor from the given basic block.
Definition: Value.cpp:1067

llvm::Value::hasOneUse
bool hasOneUse() const
Return true if there is exactly one use of this value.
Definition: Value.h:434

llvm::Value::replaceAllUsesWith
void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition: Value.cpp:534

llvm::Value::stripPointerCasts
const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Definition: Value.cpp:694

llvm::Value::use_empty
bool use_empty() const
Definition: Value.h:344

llvm::Value::getName
StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:309

llvm::Value::takeName
void takeName(Value *V)
Transfer the name from V to this value.
Definition: Value.cpp:383

llvm::cl::opt
Definition: CommandLine.h:1423

llvm::ilist_detail::node_parent_access::getParent
const ParentTy * getParent() const
Definition: ilist_node.h:32

llvm::ilist_node_impl::getIterator
self_iterator getIterator()
Definition: ilist_node.h:132

llvm::ilist_node_with_parent::getNextNode
NodeTy * getNextNode()
Get the next node, or nullptr for the list tail.
Definition: ilist_node.h:353

uint32_t

uint64_t

DebugInfo.h

llvm::AMDGPUISD::BFI
@ BFI
Definition: AMDGPUISelLowering.h:496

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::Intrinsic::getDeclarationIfExists
Function * getDeclarationIfExists(Module *M, ID id, ArrayRef< Type * > Tys, FunctionType *FT=nullptr)
This version supports overloaded intrinsics.
Definition: Intrinsics.cpp:746

llvm::PatternMatch::m_Add
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1102

llvm::PatternMatch::m_Constant
class_match< Constant > m_Constant()
Match an arbitrary Constant and ignore it.
Definition: PatternMatch.h:165

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition: PatternMatch.h:49

llvm::PatternMatch::m_ConstantInt
class_match< ConstantInt > m_ConstantInt()
Match an arbitrary ConstantInt and ignore it.
Definition: PatternMatch.h:168

llvm::PatternMatch::m_LogicalOr
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
Definition: PatternMatch.h:3071

llvm::PatternMatch::m_Cmp
class_match< CmpInst > m_Cmp()
Matches any compare instruction and ignores it.
Definition: PatternMatch.h:105

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition: PatternMatch.h:92

llvm::PatternMatch::m_LogicalAnd
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
Definition: PatternMatch.h:3053

llvm::PatternMatch::m_CombineOr
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
Definition: PatternMatch.h:239

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:137

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:443

llvm::jumpthreading::ConstantPreference
ConstantPreference
Definition: JumpThreading.h:60

llvm::jumpthreading::WantBlockAddress
@ WantBlockAddress
Definition: JumpThreading.h:60

llvm::jumpthreading::WantInteger
@ WantInteger
Definition: JumpThreading.h:60

llvm::ms_demangle::QualifierMangleMode::Result
@ Result

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::RemoveRedundantDbgInstrs
bool RemoveRedundantDbgInstrs(BasicBlock *BB)
Try to remove redundant dbg.value instructions from given basic block.
Definition: BasicBlockUtils.cpp:685

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1739

llvm::ConstantFoldTerminator
bool ConstantFoldTerminator(BasicBlock *BB, bool DeleteDeadConditions=false, const TargetLibraryInfo *TLI=nullptr, DomTreeUpdater *DTU=nullptr)
If a terminator instruction is predicated on a constant value, convert it into an unconditional branc...
Definition: Local.cpp:136

llvm::pred_end
auto pred_end(const MachineBasicBlock *BB)
Definition: MachineBasicBlock.h:1385

llvm::replaceNonLocalUsesWith
unsigned replaceNonLocalUsesWith(Instruction *From, Value *To)
Definition: Local.cpp:3566

llvm::successors
auto successors(const MachineBasicBlock *BB)
Definition: MachineBasicBlock.h:1376

llvm::getBranchWeightMDNode
MDNode * getBranchWeightMDNode(const Instruction &I)
Get the branch weights metadata node.
Definition: ProfDataUtils.cpp:146

llvm::findAvailablePtrLoadStore
Value * findAvailablePtrLoadStore(const MemoryLocation &Loc, Type *AccessTy, bool AtLeastAtomic, BasicBlock *ScanBB, BasicBlock::iterator &ScanFrom, unsigned MaxInstsToScan, BatchAAResults *AA, bool *IsLoadCSE, unsigned *NumScanedInst)
Scan backwards to see if we have the value of the given pointer available locally within a small numb...
Definition: Loads.cpp:621

llvm::remapDebugVariable
void remapDebugVariable(ValueToValueMapTy &Mapping, Instruction *Inst)
Remap the operands of the debug records attached to Inst, and the operands of Inst itself if it's a d...
Definition: Local.cpp:3788

llvm::ConstantFoldCompareInstOperands
Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
Definition: ConstantFolding.cpp:1184

llvm::pred_size
auto pred_size(const MachineBasicBlock *BB)
Definition: MachineBasicBlock.h:1381

llvm::SimplifyInstructionsInBlock
bool SimplifyInstructionsInBlock(BasicBlock *BB, const TargetLibraryInfo *TLI=nullptr)
Scan the specified basic block and try to simplify any instructions in it and recursively delete dead...
Definition: Local.cpp:737

llvm::DeleteDeadBlock
void DeleteDeadBlock(BasicBlock *BB, DomTreeUpdater *DTU=nullptr, bool KeepOneInputPHIs=false)
Delete the specified block, which must have no predecessors.
Definition: BasicBlockUtils.cpp:96

llvm::FindAvailableLoadedValue
Value * FindAvailableLoadedValue(LoadInst *Load, BasicBlock *ScanBB, BasicBlock::iterator &ScanFrom, unsigned MaxInstsToScan=DefMaxInstsToScan, BatchAAResults *AA=nullptr, bool *IsLoadCSE=nullptr, unsigned *NumScanedInst=nullptr)
Scan backwards to see if we have the value of the given load available locally within a small number ...
Definition: Loads.cpp:492

llvm::hasBranchWeightOrigin
bool hasBranchWeightOrigin(const Instruction &I)
Check if Branch Weight Metadata has an "expected" field from an llvm.expect* intrinsic.
Definition: ProfDataUtils.cpp:122

llvm::DuplicateInstructionsInSplitBetween
BasicBlock * DuplicateInstructionsInSplitBetween(BasicBlock *BB, BasicBlock *PredBB, Instruction *StopAt, ValueToValueMapTy &ValueMapping, DomTreeUpdater &DTU)
Split edge between BB and PredBB and duplicate all non-Phi instructions from BB between its beginning...
Definition: CloneFunction.cpp:1121

llvm::findDbgValues
void findDbgValues(SmallVectorImpl< DbgValueInst * > &DbgValues, Value *V, SmallVectorImpl< DbgVariableRecord * > *DbgVariableRecords=nullptr)
Finds the llvm.dbg.value intrinsics describing a value.
Definition: DebugInfo.cpp:155

llvm::simplifyInstruction
Value * simplifyInstruction(Instruction *I, const SimplifyQuery &Q)
See if we can compute a simplified version of this instruction.
Definition: InstructionSimplify.cpp:7202

llvm::any_of
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1746

llvm::isInstructionTriviallyDead
bool isInstructionTriviallyDead(Instruction *I, const TargetLibraryInfo *TLI=nullptr)
Return true if the result produced by the instruction is not used, and the instruction will return.
Definition: Local.cpp:406

llvm::isGuard
bool isGuard(const User *U)
Returns true iff U has semantics of a guard expressed in a form of call of llvm.experimental....
Definition: GuardUtils.cpp:18

llvm::TryToSimplifyUncondBranchFromEmptyBlock
bool TryToSimplifyUncondBranchFromEmptyBlock(BasicBlock *BB, DomTreeUpdater *DTU=nullptr)
BB is known to contain an unconditional branch, and contains no instructions other than PHI nodes,...
Definition: Local.cpp:1156

llvm::reverse
auto reverse(ContainerTy &&C)
Definition: STLExtras.h:420

llvm::setBranchWeights
void setBranchWeights(Instruction &I, ArrayRef< uint32_t > Weights, bool IsExpected)
Create a new branch_weights metadata node and add or overwrite a prof metadata reference to instructi...
Definition: ProfDataUtils.cpp:235

llvm::hasValidBranchWeightMD
bool hasValidBranchWeightMD(const Instruction &I)
Checks if an instruction has valid Branch Weight Metadata.
Definition: ProfDataUtils.cpp:118

llvm::dbgs
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163

llvm::isSafeToSpeculativelyExecute
bool isSafeToSpeculativelyExecute(const Instruction *I, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr, bool UseVariableInfo=true)
Return true if the instruction does not have any effects besides calculating the result and does not ...
Definition: ValueTracking.cpp:7012

llvm::ConstantFoldCastOperand
Constant * ConstantFoldCastOperand(unsigned Opcode, Constant *C, Type *DestTy, const DataLayout &DL)
Attempt to constant fold a cast with the specified operand.
Definition: ConstantFolding.cpp:1460

llvm::cloneNoAliasScopes
void cloneNoAliasScopes(ArrayRef< MDNode * > NoAliasDeclScopes, DenseMap< MDNode *, MDNode * > &ClonedScopes, StringRef Ext, LLVMContext &Context)
Duplicate the specified list of noalias decl scopes.
Definition: CloneFunction.cpp:1170

llvm::DefMaxInstsToScan
cl::opt< unsigned > DefMaxInstsToScan
The default maximum number of instructions to scan in the block, used by FindAvailableLoadedValue().

llvm::SplitLandingPadPredecessors
void SplitLandingPadPredecessors(BasicBlock *OrigBB, ArrayRef< BasicBlock * > Preds, const char *Suffix, const char *Suffix2, SmallVectorImpl< BasicBlock * > &NewBBs, DomTreeUpdater *DTU=nullptr, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, bool PreserveLCSSA=false)
This method transforms the landing pad, OrigBB, by introducing two new basic blocks into the function...
Definition: BasicBlockUtils.cpp:1539

llvm::ConstantFoldBinaryOpOperands
Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
Definition: ConstantFolding.cpp:1298

llvm::combineMetadataForCSE
void combineMetadataForCSE(Instruction *K, const Instruction *J, bool DoesKMove)
Combine the metadata of two instructions so that K can replace J.
Definition: Local.cpp:3426

llvm::SplitBlockPredecessors
BasicBlock * SplitBlockPredecessors(BasicBlock *BB, ArrayRef< BasicBlock * > Preds, const char *Suffix, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, bool PreserveLCSSA=false)
This method introduces at least one new basic block into the function and moves some of the predecess...
Definition: BasicBlockUtils.cpp:1419

llvm::MergeBasicBlockIntoOnlyPred
void MergeBasicBlockIntoOnlyPred(BasicBlock *BB, DomTreeUpdater *DTU=nullptr)
BB is a block with one predecessor and its predecessor is known to have one successor (BB!...
Definition: Local.cpp:777

llvm::lower_bound
auto lower_bound(R &&Range, T &&Value)
Provide wrappers to std::lower_bound which take ranges instead of having to pass begin/end explicitly...
Definition: STLExtras.h:1978

llvm::adaptNoAliasScopes
void adaptNoAliasScopes(llvm::Instruction *I, const DenseMap< MDNode *, MDNode * > &ClonedScopes, LLVMContext &Context)
Adapt the metadata for the specified instruction according to the provided mapping.
Definition: CloneFunction.cpp:1195

llvm::max_element
auto max_element(R &&Range)
Provide wrappers to std::max_element which take ranges instead of having to pass begin/end explicitly...
Definition: STLExtras.h:2014

llvm::ConstantFoldInstruction
Constant * ConstantFoldInstruction(Instruction *I, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldInstruction - Try to constant fold the specified instruction.
Definition: ConstantFolding.cpp:1121

llvm::isGuaranteedNotToBeUndefOrPoison
bool isGuaranteedNotToBeUndefOrPoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Return true if this function can prove that V does not have undef bits and is never poison.
Definition: ValueTracking.cpp:7810

llvm::isGuaranteedToTransferExecutionToSuccessor
bool isGuaranteedToTransferExecutionToSuccessor(const Instruction *I)
Return true if this function can prove that the instruction I will always transfer execution to one o...
Definition: ValueTracking.cpp:7889

llvm::extractBranchWeights
bool extractBranchWeights(const MDNode *ProfileData, SmallVectorImpl< uint32_t > &Weights)
Extract branch weights from MD_prof metadata.
Definition: ProfDataUtils.cpp:170

llvm::pred_begin
auto pred_begin(const MachineBasicBlock *BB)
Definition: MachineBasicBlock.h:1383

llvm::erase_if
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
Definition: STLExtras.h:2099

llvm::predecessors
auto predecessors(const MachineBasicBlock *BB)
Definition: MachineBasicBlock.h:1377

llvm::is_contained
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
Definition: STLExtras.h:1903

llvm::pred_empty
bool pred_empty(const BasicBlock *BB)
Definition: CFG.h:118

llvm::SplitBlockAndInsertIfThen
Instruction * SplitBlockAndInsertIfThen(Value *Cond, BasicBlock::iterator SplitBefore, bool Unreachable, MDNode *BranchWeights=nullptr, DomTreeUpdater *DTU=nullptr, LoopInfo *LI=nullptr, BasicBlock *ThenBlock=nullptr)
Split the containing block at the specified instruction - everything before SplitBefore stays in the ...
Definition: BasicBlockUtils.cpp:1609

llvm::simplifyCmpInst
Value * simplifyCmpInst(CmpPredicate Predicate, Value *LHS, Value *RHS, const SimplifyQuery &Q)
Given operands for a CmpInst, fold the result or return null.
Definition: InstructionSimplify.cpp:6102

llvm::array_pod_sort
void array_pod_sort(IteratorTy Start, IteratorTy End)
array_pod_sort - This sorts an array with the specified start and end extent.
Definition: STLExtras.h:1624

llvm::identifyNoAliasScopesToClone
void identifyNoAliasScopesToClone(ArrayRef< BasicBlock * > BBs, SmallVectorImpl< MDNode * > &NoAliasDeclScopes)
Find the 'llvm.experimental.noalias.scope.decl' intrinsics in the specified basic blocks and extract ...
Definition: CloneFunction.cpp:1266

llvm::SplitEdge
BasicBlock * SplitEdge(BasicBlock *From, BasicBlock *To, DominatorTree *DT=nullptr, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, const Twine &BBName="")
Split the edge connecting the specified blocks, and return the newly created basic block between From...
Definition: BasicBlockUtils.cpp:762

llvm::filterDbgVars
static auto filterDbgVars(iterator_range< simple_ilist< DbgRecord >::iterator > R)
Filter the DbgRecord range to DbgVariableRecord types only and downcast.
Definition: DebugProgramInstruction.h:547

llvm::FindFunctionBackedges
void FindFunctionBackedges(const Function &F, SmallVectorImpl< std::pair< const BasicBlock *, const BasicBlock * > > &Result)
Analyze the specified function to find all of the loop backedges in the function and return them.
Definition: CFG.cpp:34

llvm::isImpliedCondition
std::optional< bool > isImpliedCondition(const Value *LHS, const Value *RHS, const DataLayout &DL, bool LHSIsTrue=true, unsigned Depth=0)
Return true if RHS is known to be implied true by LHS.
Definition: ValueTracking.cpp:9489

raw_ostream.h

InsertionPoint
Definition: CFIFixup.cpp:129

llvm::AAMDNodes
A collection of metadata nodes that might be associated with a memory access used by the alias-analys...
Definition: Metadata.h:760

llvm::cl::desc
Definition: CommandLine.h:409

llvm::less_second
Function object to check whether the second component of a container supported by std::get (like std:...
Definition: STLExtras.h:1476