doxygen/InstCombineCalls_8cpp_source.html

//===- InstCombineCalls.cpp -----------------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements the visitCall, visitInvoke, and visitCallBr functions.

//

//===----------------------------------------------------------------------===//


#include "InstCombineInternal.h"

#include "llvm/ADT/APFloat.h"

#include "llvm/ADT/APInt.h"

#include "llvm/ADT/APSInt.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/ADT/STLFunctionalExtras.h"

#include "llvm/ADT/SmallBitVector.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/Analysis/AssumeBundleQueries.h"

#include "llvm/Analysis/AssumptionCache.h"

#include "llvm/Analysis/InstructionSimplify.h"

#include "llvm/Analysis/Loads.h"

#include "llvm/Analysis/MemoryBuiltins.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/Analysis/VectorUtils.h"

#include "llvm/IR/AttributeMask.h"

#include "llvm/IR/Attributes.h"

#include "llvm/IR/BasicBlock.h"

#include "llvm/IR/Constant.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/IR/DebugInfo.h"

#include "llvm/IR/DerivedTypes.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/GlobalVariable.h"

#include "llvm/IR/InlineAsm.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Instruction.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Intrinsics.h"

#include "llvm/IR/IntrinsicsAArch64.h"

#include "llvm/IR/IntrinsicsAMDGPU.h"

#include "llvm/IR/IntrinsicsARM.h"

#include "llvm/IR/IntrinsicsHexagon.h"

#include "llvm/IR/LLVMContext.h"

#include "llvm/IR/Metadata.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/IR/Statepoint.h"

#include "llvm/IR/Type.h"

#include "llvm/IR/User.h"

#include "llvm/IR/Value.h"

#include "llvm/IR/ValueHandle.h"

#include "llvm/Support/AtomicOrdering.h"

#include "llvm/Support/Casting.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/KnownBits.h"

#include "llvm/Support/MathExtras.h"

#include "llvm/Support/raw_ostream.h"

#include "llvm/Transforms/InstCombine/InstCombiner.h"

#include "llvm/Transforms/Utils/AssumeBundleBuilder.h"

#include "llvm/Transforms/Utils/Local.h"

#include "llvm/Transforms/Utils/SimplifyLibCalls.h"

#include <algorithm>

#include <cassert>

#include <cstdint>

#include <optional>

#include <utility>

#include <vector>


#define DEBUG_TYPE "instcombine"

#include "llvm/Transforms/Utils/InstructionWorklist.h"


using namespace llvm;

using namespace PatternMatch;


STATISTIC(NumSimplified, "Number of library calls simplified");


static cl::opt<unsigned> GuardWideningWindow(

    "instcombine-guard-widening-window",

    cl::init(3),

    cl::desc("How wide an instruction window to bypass looking for "

             "another guard"));


/// Return the specified type promoted as it would be to pass though a va_arg

/// area.

static Type *getPromotedType(Type *Ty) {

  if (IntegerType* ITy = dyn_cast<IntegerType>(Ty)) {

    if (ITy->getBitWidth() < 32)

      return Type::getInt32Ty(Ty->getContext());

  }

  return Ty;

}


/// Recognize a memcpy/memmove from a trivially otherwise unused alloca.

/// TODO: This should probably be integrated with visitAllocSites, but that

/// requires a deeper change to allow either unread or unwritten objects.

static bool hasUndefSource(AnyMemTransferInst *MI) {

  auto *Src = MI->getRawSource();

  while (isa<GetElementPtrInst>(Src)) {

    if (!Src->hasOneUse())

      return false;

    Src = cast<Instruction>(Src)->getOperand(0);

  }

  return isa<AllocaInst>(Src) && Src->hasOneUse();

}


Instruction *InstCombinerImpl::SimplifyAnyMemTransfer(AnyMemTransferInst *MI) {

  Align DstAlign = getKnownAlignment(MI->getRawDest(), DL, MI, &AC, &DT);

  MaybeAlign CopyDstAlign = MI->getDestAlign();

  if (!CopyDstAlign || *CopyDstAlign < DstAlign) {

    MI->setDestAlignment(DstAlign);

    return MI;

  }


  Align SrcAlign = getKnownAlignment(MI->getRawSource(), DL, MI, &AC, &DT);

  MaybeAlign CopySrcAlign = MI->getSourceAlign();

  if (!CopySrcAlign || *CopySrcAlign < SrcAlign) {

    MI->setSourceAlignment(SrcAlign);

    return MI;

  }


  // If we have a store to a location which is known constant, we can conclude

  // that the store must be storing the constant value (else the memory

  // wouldn't be constant), and this must be a noop.

  if (!isModSet(AA->getModRefInfoMask(MI->getDest()))) {

    // Set the size of the copy to 0, it will be deleted on the next iteration.

    MI->setLength(Constant::getNullValue(MI->getLength()->getType()));

    return MI;

  }


  // If the source is provably undef, the memcpy/memmove doesn't do anything

  // (unless the transfer is volatile).

  if (hasUndefSource(MI) && !MI->isVolatile()) {

    // Set the size of the copy to 0, it will be deleted on the next iteration.

    MI->setLength(Constant::getNullValue(MI->getLength()->getType()));

    return MI;

  }


  // If MemCpyInst length is 1/2/4/8 bytes then replace memcpy with

  // load/store.

  ConstantInt *MemOpLength = dyn_cast<ConstantInt>(MI->getLength());

  if (!MemOpLength) return nullptr;


  // Source and destination pointer types are always "i8*" for intrinsic.  See

  // if the size is something we can handle with a single primitive load/store.

  // A single load+store correctly handles overlapping memory in the memmove

  // case.

  uint64_t Size = MemOpLength->getLimitedValue();

  assert(Size && "0-sized memory transferring should be removed already.");


  if (Size > 8 || (Size&(Size-1)))

    return nullptr;  // If not 1/2/4/8 bytes, exit.


  // If it is an atomic and alignment is less than the size then we will

  // introduce the unaligned memory access which will be later transformed

  // into libcall in CodeGen. This is not evident performance gain so disable

  // it now.

  if (isa<AtomicMemTransferInst>(MI))

    if (*CopyDstAlign < Size || *CopySrcAlign < Size)

      return nullptr;


  // Use an integer load+store unless we can find something better.

  IntegerType* IntType = IntegerType::get(MI->getContext(), Size<<3);


  // If the memcpy has metadata describing the members, see if we can get the

  // TBAA, scope and noalias tags describing our copy.

  AAMDNodes AACopyMD = MI->getAAMetadata().adjustForAccess(Size);


  Value *Src = MI->getArgOperand(1);

  Value *Dest = MI->getArgOperand(0);

  LoadInst *L = Builder.CreateLoad(IntType, Src);

  // Alignment from the mem intrinsic will be better, so use it.

  L->setAlignment(*CopySrcAlign);

  L->setAAMetadata(AACopyMD);

  MDNode *LoopMemParallelMD =

    MI->getMetadata(LLVMContext::MD_mem_parallel_loop_access);

  if (LoopMemParallelMD)

    L->setMetadata(LLVMContext::MD_mem_parallel_loop_access, LoopMemParallelMD);

  MDNode *AccessGroupMD = MI->getMetadata(LLVMContext::MD_access_group);

  if (AccessGroupMD)

    L->setMetadata(LLVMContext::MD_access_group, AccessGroupMD);


  StoreInst *S = Builder.CreateStore(L, Dest);

  // Alignment from the mem intrinsic will be better, so use it.

  S->setAlignment(*CopyDstAlign);

  S->setAAMetadata(AACopyMD);

  if (LoopMemParallelMD)

    S->setMetadata(LLVMContext::MD_mem_parallel_loop_access, LoopMemParallelMD);

  if (AccessGroupMD)

    S->setMetadata(LLVMContext::MD_access_group, AccessGroupMD);

  S->copyMetadata(*MI, LLVMContext::MD_DIAssignID);


  if (auto *MT = dyn_cast<MemTransferInst>(MI)) {

    // non-atomics can be volatile

    L->setVolatile(MT->isVolatile());

    S->setVolatile(MT->isVolatile());

  }

  if (isa<AtomicMemTransferInst>(MI)) {

    // atomics have to be unordered

    L->setOrdering(AtomicOrdering::Unordered);

    S->setOrdering(AtomicOrdering::Unordered);

  }


  // Set the size of the copy to 0, it will be deleted on the next iteration.

  MI->setLength(Constant::getNullValue(MemOpLength->getType()));

  return MI;

}


Instruction *InstCombinerImpl::SimplifyAnyMemSet(AnyMemSetInst *MI) {

  const Align KnownAlignment =

      getKnownAlignment(MI->getDest(), DL, MI, &AC, &DT);

  MaybeAlign MemSetAlign = MI->getDestAlign();

  if (!MemSetAlign || *MemSetAlign < KnownAlignment) {

    MI->setDestAlignment(KnownAlignment);

    return MI;

  }


  // If we have a store to a location which is known constant, we can conclude

  // that the store must be storing the constant value (else the memory

  // wouldn't be constant), and this must be a noop.

  if (!isModSet(AA->getModRefInfoMask(MI->getDest()))) {

    // Set the size of the copy to 0, it will be deleted on the next iteration.

    MI->setLength(Constant::getNullValue(MI->getLength()->getType()));

    return MI;

  }


  // Remove memset with an undef value.

  // FIXME: This is technically incorrect because it might overwrite a poison

  // value. Change to PoisonValue once #52930 is resolved.

  if (isa<UndefValue>(MI->getValue())) {

    // Set the size of the copy to 0, it will be deleted on the next iteration.

    MI->setLength(Constant::getNullValue(MI->getLength()->getType()));

    return MI;

  }


  // Extract the length and alignment and fill if they are constant.

  ConstantInt *LenC = dyn_cast<ConstantInt>(MI->getLength());

  ConstantInt *FillC = dyn_cast<ConstantInt>(MI->getValue());

  if (!LenC || !FillC || !FillC->getType()->isIntegerTy(8))

    return nullptr;

  const uint64_t Len = LenC->getLimitedValue();

  assert(Len && "0-sized memory setting should be removed already.");

  const Align Alignment = MI->getDestAlign().valueOrOne();


  // If it is an atomic and alignment is less than the size then we will

  // introduce the unaligned memory access which will be later transformed

  // into libcall in CodeGen. This is not evident performance gain so disable

  // it now.

  if (isa<AtomicMemSetInst>(MI))

    if (Alignment < Len)

      return nullptr;


  // memset(s,c,n) -> store s, c (for n=1,2,4,8)

  if (Len <= 8 && isPowerOf2_32((uint32_t)Len)) {

    Value *Dest = MI->getDest();


    // Extract the fill value and store.

    Constant *FillVal = ConstantInt::get(

        MI->getContext(), APInt::getSplat(Len * 8, FillC->getValue()));

    StoreInst *S = Builder.CreateStore(FillVal, Dest, MI->isVolatile());

    S->copyMetadata(*MI, LLVMContext::MD_DIAssignID);

    auto replaceOpForAssignmentMarkers = [FillC, FillVal](auto *DbgAssign) {

      if (llvm::is_contained(DbgAssign->location_ops(), FillC))

        DbgAssign->replaceVariableLocationOp(FillC, FillVal);

    };

    for_each(at::getAssignmentMarkers(S), replaceOpForAssignmentMarkers);

    for_each(at::getDVRAssignmentMarkers(S), replaceOpForAssignmentMarkers);


    S->setAlignment(Alignment);

    if (isa<AtomicMemSetInst>(MI))

      S->setOrdering(AtomicOrdering::Unordered);


    // Set the size of the copy to 0, it will be deleted on the next iteration.

    MI->setLength(Constant::getNullValue(LenC->getType()));

    return MI;

  }


  return nullptr;

}


// TODO, Obvious Missing Transforms:

// * Narrow width by halfs excluding zero/undef lanes

Value *InstCombinerImpl::simplifyMaskedLoad(IntrinsicInst &II) {

  Value *LoadPtr = II.getArgOperand(0);

  const Align Alignment =

      cast<ConstantInt>(II.getArgOperand(1))->getAlignValue();


  // If the mask is all ones or undefs, this is a plain vector load of the 1st

  // argument.

  if (maskIsAllOneOrUndef(II.getArgOperand(2))) {

    LoadInst *L = Builder.CreateAlignedLoad(II.getType(), LoadPtr, Alignment,

                                            "unmaskedload");

    L->copyMetadata(II);

    return L;

  }


  // If we can unconditionally load from this address, replace with a

  // load/select idiom. TODO: use DT for context sensitive query

  if (isDereferenceablePointer(LoadPtr, II.getType(),

                               II.getDataLayout(), &II, &AC)) {

    LoadInst *LI = Builder.CreateAlignedLoad(II.getType(), LoadPtr, Alignment,

                                             "unmaskedload");

    LI->copyMetadata(II);

    return Builder.CreateSelect(II.getArgOperand(2), LI, II.getArgOperand(3));

  }


  return nullptr;

}


// TODO, Obvious Missing Transforms:

// * Single constant active lane -> store

// * Narrow width by halfs excluding zero/undef lanes

Instruction *InstCombinerImpl::simplifyMaskedStore(IntrinsicInst &II) {

  auto *ConstMask = dyn_cast<Constant>(II.getArgOperand(3));

  if (!ConstMask)

    return nullptr;


  // If the mask is all zeros, this instruction does nothing.

  if (ConstMask->isNullValue())

    return eraseInstFromFunction(II);


  // If the mask is all ones, this is a plain vector store of the 1st argument.

  if (ConstMask->isAllOnesValue()) {

    Value *StorePtr = II.getArgOperand(1);

    Align Alignment = cast<ConstantInt>(II.getArgOperand(2))->getAlignValue();

    StoreInst *S =

        new StoreInst(II.getArgOperand(0), StorePtr, false, Alignment);

    S->copyMetadata(II);

    return S;

  }


  if (isa<ScalableVectorType>(ConstMask->getType()))

    return nullptr;


  // Use masked off lanes to simplify operands via SimplifyDemandedVectorElts

  APInt DemandedElts = possiblyDemandedEltsInMask(ConstMask);

  APInt PoisonElts(DemandedElts.getBitWidth(), 0);

  if (Value *V = SimplifyDemandedVectorElts(II.getOperand(0), DemandedElts,

                                            PoisonElts))

    return replaceOperand(II, 0, V);


  return nullptr;

}


// TODO, Obvious Missing Transforms:

// * Single constant active lane load -> load

// * Dereferenceable address & few lanes -> scalarize speculative load/selects

// * Adjacent vector addresses -> masked.load

// * Narrow width by halfs excluding zero/undef lanes

// * Vector incrementing address -> vector masked load

Instruction *InstCombinerImpl::simplifyMaskedGather(IntrinsicInst &II) {

  auto *ConstMask = dyn_cast<Constant>(II.getArgOperand(2));

  if (!ConstMask)

    return nullptr;


  // Vector splat address w/known mask -> scalar load

  // Fold the gather to load the source vector first lane

  // because it is reloading the same value each time

  if (ConstMask->isAllOnesValue())

    if (auto *SplatPtr = getSplatValue(II.getArgOperand(0))) {

      auto *VecTy = cast<VectorType>(II.getType());

      const Align Alignment =

          cast<ConstantInt>(II.getArgOperand(1))->getAlignValue();

      LoadInst *L = Builder.CreateAlignedLoad(VecTy->getElementType(), SplatPtr,

                                              Alignment, "load.scalar");

      Value *Shuf =

          Builder.CreateVectorSplat(VecTy->getElementCount(), L, "broadcast");

      return replaceInstUsesWith(II, cast<Instruction>(Shuf));

    }


  return nullptr;

}


// TODO, Obvious Missing Transforms:

// * Single constant active lane -> store

// * Adjacent vector addresses -> masked.store

// * Narrow store width by halfs excluding zero/undef lanes

// * Vector incrementing address -> vector masked store

Instruction *InstCombinerImpl::simplifyMaskedScatter(IntrinsicInst &II) {

  auto *ConstMask = dyn_cast<Constant>(II.getArgOperand(3));

  if (!ConstMask)

    return nullptr;


  // If the mask is all zeros, a scatter does nothing.

  if (ConstMask->isNullValue())

    return eraseInstFromFunction(II);


  // Vector splat address -> scalar store

  if (auto *SplatPtr = getSplatValue(II.getArgOperand(1))) {

    // scatter(splat(value), splat(ptr), non-zero-mask) -> store value, ptr

    if (auto *SplatValue = getSplatValue(II.getArgOperand(0))) {

      if (maskContainsAllOneOrUndef(ConstMask)) {

        Align Alignment =

            cast<ConstantInt>(II.getArgOperand(2))->getAlignValue();

        StoreInst *S = new StoreInst(SplatValue, SplatPtr, /*IsVolatile=*/false,

                                     Alignment);

        S->copyMetadata(II);

        return S;

      }

    }

    // scatter(vector, splat(ptr), splat(true)) -> store extract(vector,

    // lastlane), ptr

    if (ConstMask->isAllOnesValue()) {

      Align Alignment = cast<ConstantInt>(II.getArgOperand(2))->getAlignValue();

      VectorType *WideLoadTy = cast<VectorType>(II.getArgOperand(1)->getType());

      ElementCount VF = WideLoadTy->getElementCount();

      Value *RunTimeVF = Builder.CreateElementCount(Builder.getInt32Ty(), VF);

      Value *LastLane = Builder.CreateSub(RunTimeVF, Builder.getInt32(1));

      Value *Extract =

          Builder.CreateExtractElement(II.getArgOperand(0), LastLane);

      StoreInst *S =

          new StoreInst(Extract, SplatPtr, /*IsVolatile=*/false, Alignment);

      S->copyMetadata(II);

      return S;

    }

  }

  if (isa<ScalableVectorType>(ConstMask->getType()))

    return nullptr;


  // Use masked off lanes to simplify operands via SimplifyDemandedVectorElts

  APInt DemandedElts = possiblyDemandedEltsInMask(ConstMask);

  APInt PoisonElts(DemandedElts.getBitWidth(), 0);

  if (Value *V = SimplifyDemandedVectorElts(II.getOperand(0), DemandedElts,

                                            PoisonElts))

    return replaceOperand(II, 0, V);

  if (Value *V = SimplifyDemandedVectorElts(II.getOperand(1), DemandedElts,

                                            PoisonElts))

    return replaceOperand(II, 1, V);


  return nullptr;

}


/// This function transforms launder.invariant.group and strip.invariant.group

/// like:

/// launder(launder(%x)) -> launder(%x)       (the result is not the argument)

/// launder(strip(%x)) -> launder(%x)

/// strip(strip(%x)) -> strip(%x)             (the result is not the argument)

/// strip(launder(%x)) -> strip(%x)

/// This is legal because it preserves the most recent information about

/// the presence or absence of invariant.group.

static Instruction *simplifyInvariantGroupIntrinsic(IntrinsicInst &II,

                                                    InstCombinerImpl &IC) {

  auto *Arg = II.getArgOperand(0);

  auto *StrippedArg = Arg->stripPointerCasts();

  auto *StrippedInvariantGroupsArg = StrippedArg;

  while (auto *Intr = dyn_cast<IntrinsicInst>(StrippedInvariantGroupsArg)) {

    if (Intr->getIntrinsicID() != Intrinsic::launder_invariant_group &&

        Intr->getIntrinsicID() != Intrinsic::strip_invariant_group)

      break;

    StrippedInvariantGroupsArg = Intr->getArgOperand(0)->stripPointerCasts();

  }

  if (StrippedArg == StrippedInvariantGroupsArg)

    return nullptr; // No launders/strips to remove.


  Value *Result = nullptr;


  if (II.getIntrinsicID() == Intrinsic::launder_invariant_group)

    Result = IC.Builder.CreateLaunderInvariantGroup(StrippedInvariantGroupsArg);

  else if (II.getIntrinsicID() == Intrinsic::strip_invariant_group)

    Result = IC.Builder.CreateStripInvariantGroup(StrippedInvariantGroupsArg);

  else

    llvm_unreachable(

        "simplifyInvariantGroupIntrinsic only handles launder and strip");

  if (Result->getType()->getPointerAddressSpace() !=

      II.getType()->getPointerAddressSpace())

    Result = IC.Builder.CreateAddrSpaceCast(Result, II.getType());


  return cast<Instruction>(Result);

}


static Instruction *foldCttzCtlz(IntrinsicInst &II, InstCombinerImpl &IC) {

  assert((II.getIntrinsicID() == Intrinsic::cttz ||

          II.getIntrinsicID() == Intrinsic::ctlz) &&

         "Expected cttz or ctlz intrinsic");

  bool IsTZ = II.getIntrinsicID() == Intrinsic::cttz;

  Value *Op0 = II.getArgOperand(0);

  Value *Op1 = II.getArgOperand(1);

  Value *X;

  // ctlz(bitreverse(x)) -> cttz(x)

  // cttz(bitreverse(x)) -> ctlz(x)

  if (match(Op0, m_BitReverse(m_Value(X)))) {

    Intrinsic::ID ID = IsTZ ? Intrinsic::ctlz : Intrinsic::cttz;

    Function *F =

        Intrinsic::getOrInsertDeclaration(II.getModule(), ID, II.getType());

    return CallInst::Create(F, {X, II.getArgOperand(1)});

  }


  if (II.getType()->isIntOrIntVectorTy(1)) {

    // ctlz/cttz i1 Op0 --> not Op0

    if (match(Op1, m_Zero()))

      return BinaryOperator::CreateNot(Op0);

    // If zero is poison, then the input can be assumed to be "true", so the

    // instruction simplifies to "false".

    assert(match(Op1, m_One()) && "Expected ctlz/cttz operand to be 0 or 1");

    return IC.replaceInstUsesWith(II, ConstantInt::getNullValue(II.getType()));

  }


  // If ctlz/cttz is only used as a shift amount, set is_zero_poison to true.

  if (II.hasOneUse() && match(Op1, m_Zero()) &&

      match(II.user_back(), m_Shift(m_Value(), m_Specific(&II)))) {

    II.dropUBImplyingAttrsAndMetadata();

    return IC.replaceOperand(II, 1, IC.Builder.getTrue());

  }


  Constant *C;


  if (IsTZ) {

    // cttz(-x) -> cttz(x)

    if (match(Op0, m_Neg(m_Value(X))))

      return IC.replaceOperand(II, 0, X);


    // cttz(-x & x) -> cttz(x)

    if (match(Op0, m_c_And(m_Neg(m_Value(X)), m_Deferred(X))))

      return IC.replaceOperand(II, 0, X);


    // cttz(sext(x)) -> cttz(zext(x))

    if (match(Op0, m_OneUse(m_SExt(m_Value(X))))) {

      auto *Zext = IC.Builder.CreateZExt(X, II.getType());

      auto *CttzZext =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, Zext, Op1);

      return IC.replaceInstUsesWith(II, CttzZext);

    }


    // Zext doesn't change the number of trailing zeros, so narrow:

    // cttz(zext(x)) -> zext(cttz(x)) if the 'ZeroIsPoison' parameter is 'true'.

    if (match(Op0, m_OneUse(m_ZExt(m_Value(X)))) && match(Op1, m_One())) {

      auto *Cttz = IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, X,

                                                    IC.Builder.getTrue());

      auto *ZextCttz = IC.Builder.CreateZExt(Cttz, II.getType());

      return IC.replaceInstUsesWith(II, ZextCttz);

    }


    // cttz(abs(x)) -> cttz(x)

    // cttz(nabs(x)) -> cttz(x)

    Value *Y;

    SelectPatternFlavor SPF = matchSelectPattern(Op0, X, Y).Flavor;

    if (SPF == SPF_ABS || SPF == SPF_NABS)

      return IC.replaceOperand(II, 0, X);


    if (match(Op0, m_Intrinsic<Intrinsic::abs>(m_Value(X))))

      return IC.replaceOperand(II, 0, X);


    // cttz(shl(%const, %val), 1) --> add(cttz(%const, 1), %val)

    if (match(Op0, m_Shl(m_ImmConstant(C), m_Value(X))) &&

        match(Op1, m_One())) {

      Value *ConstCttz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, C, Op1);

      return BinaryOperator::CreateAdd(ConstCttz, X);

    }


    // cttz(lshr exact (%const, %val), 1) --> sub(cttz(%const, 1), %val)

    if (match(Op0, m_Exact(m_LShr(m_ImmConstant(C), m_Value(X)))) &&

        match(Op1, m_One())) {

      Value *ConstCttz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, C, Op1);

      return BinaryOperator::CreateSub(ConstCttz, X);

    }


    // cttz(add(lshr(UINT_MAX, %val), 1)) --> sub(width, %val)

    if (match(Op0, m_Add(m_LShr(m_AllOnes(), m_Value(X)), m_One()))) {

      Value *Width =

          ConstantInt::get(II.getType(), II.getType()->getScalarSizeInBits());

      return BinaryOperator::CreateSub(Width, X);

    }

  } else {

    // ctlz(lshr(%const, %val), 1) --> add(ctlz(%const, 1), %val)

    if (match(Op0, m_LShr(m_ImmConstant(C), m_Value(X))) &&

        match(Op1, m_One())) {

      Value *ConstCtlz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::ctlz, C, Op1);

      return BinaryOperator::CreateAdd(ConstCtlz, X);

    }


    // ctlz(shl nuw (%const, %val), 1) --> sub(ctlz(%const, 1), %val)

    if (match(Op0, m_NUWShl(m_ImmConstant(C), m_Value(X))) &&

        match(Op1, m_One())) {

      Value *ConstCtlz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::ctlz, C, Op1);

      return BinaryOperator::CreateSub(ConstCtlz, X);

    }

  }


  // cttz(Pow2) -> Log2(Pow2)

  // ctlz(Pow2) -> BitWidth - 1 - Log2(Pow2)

  if (auto *R = IC.tryGetLog2(Op0, match(Op1, m_One()))) {

    if (IsTZ)

      return IC.replaceInstUsesWith(II, R);

    BinaryOperator *BO = BinaryOperator::CreateSub(

        ConstantInt::get(R->getType(), R->getType()->getScalarSizeInBits() - 1),

        R);

    BO->setHasNoSignedWrap();

    BO->setHasNoUnsignedWrap();

    return BO;

  }


  KnownBits Known = IC.computeKnownBits(Op0, 0, &II);


  // Create a mask for bits above (ctlz) or below (cttz) the first known one.

  unsigned PossibleZeros = IsTZ ? Known.countMaxTrailingZeros()

                                : Known.countMaxLeadingZeros();

  unsigned DefiniteZeros = IsTZ ? Known.countMinTrailingZeros()

                                : Known.countMinLeadingZeros();


  // If all bits above (ctlz) or below (cttz) the first known one are known

  // zero, this value is constant.

  // FIXME: This should be in InstSimplify because we're replacing an

  // instruction with a constant.

  if (PossibleZeros == DefiniteZeros) {

    auto *C = ConstantInt::get(Op0->getType(), DefiniteZeros);

    return IC.replaceInstUsesWith(II, C);

  }


  // If the input to cttz/ctlz is known to be non-zero,

  // then change the 'ZeroIsPoison' parameter to 'true'

  // because we know the zero behavior can't affect the result.

  if (!Known.One.isZero() ||

      isKnownNonZero(Op0, IC.getSimplifyQuery().getWithInstruction(&II))) {

    if (!match(II.getArgOperand(1), m_One()))

      return IC.replaceOperand(II, 1, IC.Builder.getTrue());

  }


  // Add range attribute since known bits can't completely reflect what we know.

  unsigned BitWidth = Op0->getType()->getScalarSizeInBits();

  if (BitWidth != 1 && !II.hasRetAttr(Attribute::Range) &&

      !II.getMetadata(LLVMContext::MD_range)) {

    ConstantRange Range(APInt(BitWidth, DefiniteZeros),

                        APInt(BitWidth, PossibleZeros + 1));

    II.addRangeRetAttr(Range);

    return &II;

  }


  return nullptr;

}


static Instruction *foldCtpop(IntrinsicInst &II, InstCombinerImpl &IC) {

  assert(II.getIntrinsicID() == Intrinsic::ctpop &&

         "Expected ctpop intrinsic");

  Type *Ty = II.getType();

  unsigned BitWidth = Ty->getScalarSizeInBits();

  Value *Op0 = II.getArgOperand(0);

  Value *X, *Y;


  // ctpop(bitreverse(x)) -> ctpop(x)

  // ctpop(bswap(x)) -> ctpop(x)

  if (match(Op0, m_BitReverse(m_Value(X))) || match(Op0, m_BSwap(m_Value(X))))

    return IC.replaceOperand(II, 0, X);


  // ctpop(rot(x)) -> ctpop(x)

  if ((match(Op0, m_FShl(m_Value(X), m_Value(Y), m_Value())) ||

       match(Op0, m_FShr(m_Value(X), m_Value(Y), m_Value()))) &&

      X == Y)

    return IC.replaceOperand(II, 0, X);


  // ctpop(x | -x) -> bitwidth - cttz(x, false)

  if (Op0->hasOneUse() &&

      match(Op0, m_c_Or(m_Value(X), m_Neg(m_Deferred(X))))) {

    auto *Cttz = IC.Builder.CreateIntrinsic(Intrinsic::cttz, Ty,

                                            {X, IC.Builder.getFalse()});

    auto *Bw = ConstantInt::get(Ty, APInt(BitWidth, BitWidth));

    return IC.replaceInstUsesWith(II, IC.Builder.CreateSub(Bw, Cttz));

  }


  // ctpop(~x & (x - 1)) -> cttz(x, false)

  if (match(Op0,

            m_c_And(m_Not(m_Value(X)), m_Add(m_Deferred(X), m_AllOnes())))) {

    Function *F =

        Intrinsic::getOrInsertDeclaration(II.getModule(), Intrinsic::cttz, Ty);

    return CallInst::Create(F, {X, IC.Builder.getFalse()});

  }


  // Zext doesn't change the number of set bits, so narrow:

  // ctpop (zext X) --> zext (ctpop X)

  if (match(Op0, m_OneUse(m_ZExt(m_Value(X))))) {

    Value *NarrowPop = IC.Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, X);

    return CastInst::Create(Instruction::ZExt, NarrowPop, Ty);

  }


  KnownBits Known(BitWidth);

  IC.computeKnownBits(Op0, Known, 0, &II);


  // If all bits are zero except for exactly one fixed bit, then the result

  // must be 0 or 1, and we can get that answer by shifting to LSB:

  // ctpop (X & 32) --> (X & 32) >> 5

  // TODO: Investigate removing this as its likely unnecessary given the below

  // `isKnownToBeAPowerOfTwo` check.

  if ((~Known.Zero).isPowerOf2())

    return BinaryOperator::CreateLShr(

        Op0, ConstantInt::get(Ty, (~Known.Zero).exactLogBase2()));


  // More generally we can also handle non-constant power of 2 patterns such as

  // shl/shr(Pow2, X), (X & -X), etc... by transforming:

  // ctpop(Pow2OrZero) --> icmp ne X, 0

  if (IC.isKnownToBeAPowerOfTwo(Op0, /* OrZero */ true))

    return CastInst::Create(Instruction::ZExt,

                            IC.Builder.CreateICmp(ICmpInst::ICMP_NE, Op0,

                                                  Constant::getNullValue(Ty)),

                            Ty);


  // Add range attribute since known bits can't completely reflect what we know.

  if (BitWidth != 1) {

    ConstantRange OldRange =

        II.getRange().value_or(ConstantRange::getFull(BitWidth));


    unsigned Lower = Known.countMinPopulation();

    unsigned Upper = Known.countMaxPopulation() + 1;


    if (Lower == 0 && OldRange.contains(APInt::getZero(BitWidth)) &&

        isKnownNonZero(Op0, IC.getSimplifyQuery().getWithInstruction(&II)))

      Lower = 1;


    ConstantRange Range(APInt(BitWidth, Lower), APInt(BitWidth, Upper));

    Range = Range.intersectWith(OldRange, ConstantRange::Unsigned);


    if (Range != OldRange) {

      II.addRangeRetAttr(Range);

      return &II;

    }

  }


  return nullptr;

}


/// Convert a table lookup to shufflevector if the mask is constant.

/// This could benefit tbl1 if the mask is { 7,6,5,4,3,2,1,0 }, in

/// which case we could lower the shufflevector with rev64 instructions

/// as it's actually a byte reverse.

static Value *simplifyNeonTbl1(const IntrinsicInst &II,

                               InstCombiner::BuilderTy &Builder) {

  // Bail out if the mask is not a constant.

  auto *C = dyn_cast<Constant>(II.getArgOperand(1));

  if (!C)

    return nullptr;


  auto *VecTy = cast<FixedVectorType>(II.getType());

  unsigned NumElts = VecTy->getNumElements();


  // Only perform this transformation for <8 x i8> vector types.

  if (!VecTy->getElementType()->isIntegerTy(8) || NumElts != 8)

    return nullptr;


  int Indexes[8];


  for (unsigned I = 0; I < NumElts; ++I) {

    Constant *COp = C->getAggregateElement(I);


    if (!COp || !isa<ConstantInt>(COp))

      return nullptr;


    Indexes[I] = cast<ConstantInt>(COp)->getLimitedValue();


    // Make sure the mask indices are in range.

    if ((unsigned)Indexes[I] >= NumElts)

      return nullptr;

  }


  auto *V1 = II.getArgOperand(0);

  auto *V2 = Constant::getNullValue(V1->getType());

  return Builder.CreateShuffleVector(V1, V2, ArrayRef(Indexes));

}


// Returns true iff the 2 intrinsics have the same operands, limiting the

// comparison to the first NumOperands.

static bool haveSameOperands(const IntrinsicInst &I, const IntrinsicInst &E,

                             unsigned NumOperands) {

  assert(I.arg_size() >= NumOperands && "Not enough operands");

  assert(E.arg_size() >= NumOperands && "Not enough operands");

  for (unsigned i = 0; i < NumOperands; i++)

    if (I.getArgOperand(i) != E.getArgOperand(i))

      return false;

  return true;

}


// Remove trivially empty start/end intrinsic ranges, i.e. a start

// immediately followed by an end (ignoring debuginfo or other

// start/end intrinsics in between). As this handles only the most trivial

// cases, tracking the nesting level is not needed:

//

//   call @llvm.foo.start(i1 0)

//   call @llvm.foo.start(i1 0) ; This one won't be skipped: it will be removed

//   call @llvm.foo.end(i1 0)

//   call @llvm.foo.end(i1 0) ; &I

static bool

removeTriviallyEmptyRange(IntrinsicInst &EndI, InstCombinerImpl &IC,

                          std::function<bool(const IntrinsicInst &)> IsStart) {

  // We start from the end intrinsic and scan backwards, so that InstCombine

  // has already processed (and potentially removed) all the instructions

  // before the end intrinsic.

  BasicBlock::reverse_iterator BI(EndI), BE(EndI.getParent()->rend());

  for (; BI != BE; ++BI) {

    if (auto *I = dyn_cast<IntrinsicInst>(&*BI)) {

      if (I->isDebugOrPseudoInst() ||

          I->getIntrinsicID() == EndI.getIntrinsicID())

        continue;

      if (IsStart(*I)) {

        if (haveSameOperands(EndI, *I, EndI.arg_size())) {

          IC.eraseInstFromFunction(*I);

          IC.eraseInstFromFunction(EndI);

          return true;

        }

        // Skip start intrinsics that don't pair with this end intrinsic.

        continue;

      }

    }

    break;

  }


  return false;

}


Instruction *InstCombinerImpl::visitVAEndInst(VAEndInst &I) {

  removeTriviallyEmptyRange(I, *this, [](const IntrinsicInst &I) {

    return I.getIntrinsicID() == Intrinsic::vastart ||

           I.getIntrinsicID() == Intrinsic::vacopy;

  });

  return nullptr;

}


static CallInst *canonicalizeConstantArg0ToArg1(CallInst &Call) {

  assert(Call.arg_size() > 1 && "Need at least 2 args to swap");

  Value *Arg0 = Call.getArgOperand(0), *Arg1 = Call.getArgOperand(1);

  if (isa<Constant>(Arg0) && !isa<Constant>(Arg1)) {

    Call.setArgOperand(0, Arg1);

    Call.setArgOperand(1, Arg0);

    return &Call;

  }

  return nullptr;

}


/// Creates a result tuple for an overflow intrinsic \p II with a given

/// \p Result and a constant \p Overflow value.

static Instruction *createOverflowTuple(IntrinsicInst *II, Value *Result,

                                        Constant *Overflow) {

  Constant *V[] = {PoisonValue::get(Result->getType()), Overflow};

  StructType *ST = cast<StructType>(II->getType());

  Constant *Struct = ConstantStruct::get(ST, V);

  return InsertValueInst::Create(Struct, Result, 0);

}


Instruction *

InstCombinerImpl::foldIntrinsicWithOverflowCommon(IntrinsicInst *II) {

  WithOverflowInst *WO = cast<WithOverflowInst>(II);

  Value *OperationResult = nullptr;

  Constant *OverflowResult = nullptr;

  if (OptimizeOverflowCheck(WO->getBinaryOp(), WO->isSigned(), WO->getLHS(),

                            WO->getRHS(), *WO, OperationResult, OverflowResult))

    return createOverflowTuple(WO, OperationResult, OverflowResult);


  // See whether we can optimize the overflow check with assumption information.

  for (User *U : WO->users()) {

    if (!match(U, m_ExtractValue<1>(m_Value())))

      continue;


    for (auto &AssumeVH : AC.assumptionsFor(U)) {

      if (!AssumeVH)

        continue;

      CallInst *I = cast<CallInst>(AssumeVH);

      if (!match(I->getArgOperand(0), m_Not(m_Specific(U))))

        continue;

      if (!isValidAssumeForContext(I, II, /*DT=*/nullptr,

                                   /*AllowEphemerals=*/true))

        continue;

      Value *Result =

          Builder.CreateBinOp(WO->getBinaryOp(), WO->getLHS(), WO->getRHS());

      Result->takeName(WO);

      if (auto *Inst = dyn_cast<Instruction>(Result)) {

        if (WO->isSigned())

          Inst->setHasNoSignedWrap();

        else

          Inst->setHasNoUnsignedWrap();

      }

      return createOverflowTuple(WO, Result,

                                 ConstantInt::getFalse(U->getType()));

    }

  }


  return nullptr;

}


static bool inputDenormalIsIEEE(const Function &F, const Type *Ty) {

  Ty = Ty->getScalarType();

  return F.getDenormalMode(Ty->getFltSemantics()).Input == DenormalMode::IEEE;

}


static bool inputDenormalIsDAZ(const Function &F, const Type *Ty) {

  Ty = Ty->getScalarType();

  return F.getDenormalMode(Ty->getFltSemantics()).inputsAreZero();

}


/// \returns the compare predicate type if the test performed by

/// llvm.is.fpclass(x, \p Mask) is equivalent to fcmp o__ x, 0.0 with the

/// floating-point environment assumed for \p F for type \p Ty

static FCmpInst::Predicate fpclassTestIsFCmp0(FPClassTest Mask,

                                              const Function &F, Type *Ty) {

  switch (static_cast<unsigned>(Mask)) {

  case fcZero:

    if (inputDenormalIsIEEE(F, Ty))

      return FCmpInst::FCMP_OEQ;

    break;

  case fcZero | fcSubnormal:

    if (inputDenormalIsDAZ(F, Ty))

      return FCmpInst::FCMP_OEQ;

    break;

  case fcPositive | fcNegZero:

    if (inputDenormalIsIEEE(F, Ty))

      return FCmpInst::FCMP_OGE;

    break;

  case fcPositive | fcNegZero | fcNegSubnormal:

    if (inputDenormalIsDAZ(F, Ty))

      return FCmpInst::FCMP_OGE;

    break;

  case fcPosSubnormal | fcPosNormal | fcPosInf:

    if (inputDenormalIsIEEE(F, Ty))

      return FCmpInst::FCMP_OGT;

    break;

  case fcNegative | fcPosZero:

    if (inputDenormalIsIEEE(F, Ty))

      return FCmpInst::FCMP_OLE;

    break;

  case fcNegative | fcPosZero | fcPosSubnormal:

    if (inputDenormalIsDAZ(F, Ty))

      return FCmpInst::FCMP_OLE;

    break;

  case fcNegSubnormal | fcNegNormal | fcNegInf:

    if (inputDenormalIsIEEE(F, Ty))

      return FCmpInst::FCMP_OLT;

    break;

  case fcPosNormal | fcPosInf:

    if (inputDenormalIsDAZ(F, Ty))

      return FCmpInst::FCMP_OGT;

    break;

  case fcNegNormal | fcNegInf:

    if (inputDenormalIsDAZ(F, Ty))

      return FCmpInst::FCMP_OLT;

    break;

  case ~fcZero & ~fcNan:

    if (inputDenormalIsIEEE(F, Ty))

      return FCmpInst::FCMP_ONE;

    break;

  case ~(fcZero | fcSubnormal) & ~fcNan:

    if (inputDenormalIsDAZ(F, Ty))

      return FCmpInst::FCMP_ONE;

    break;

  default:

    break;

  }


  return FCmpInst::BAD_FCMP_PREDICATE;

}


Instruction *InstCombinerImpl::foldIntrinsicIsFPClass(IntrinsicInst &II) {

  Value *Src0 = II.getArgOperand(0);

  Value *Src1 = II.getArgOperand(1);

  const ConstantInt *CMask = cast<ConstantInt>(Src1);

  FPClassTest Mask = static_cast<FPClassTest>(CMask->getZExtValue());

  const bool IsUnordered = (Mask & fcNan) == fcNan;

  const bool IsOrdered = (Mask & fcNan) == fcNone;

  const FPClassTest OrderedMask = Mask & ~fcNan;

  const FPClassTest OrderedInvertedMask = ~OrderedMask & ~fcNan;


  const bool IsStrict =

      II.getFunction()->getAttributes().hasFnAttr(Attribute::StrictFP);


  Value *FNegSrc;

  if (match(Src0, m_FNeg(m_Value(FNegSrc)))) {

    // is.fpclass (fneg x), mask -> is.fpclass x, (fneg mask)


    II.setArgOperand(1, ConstantInt::get(Src1->getType(), fneg(Mask)));

    return replaceOperand(II, 0, FNegSrc);

  }


  Value *FAbsSrc;

  if (match(Src0, m_FAbs(m_Value(FAbsSrc)))) {

    II.setArgOperand(1, ConstantInt::get(Src1->getType(), inverse_fabs(Mask)));

    return replaceOperand(II, 0, FAbsSrc);

  }


  if ((OrderedMask == fcInf || OrderedInvertedMask == fcInf) &&

      (IsOrdered || IsUnordered) && !IsStrict) {

    // is.fpclass(x, fcInf) -> fcmp oeq fabs(x), +inf

    // is.fpclass(x, ~fcInf) -> fcmp one fabs(x), +inf

    // is.fpclass(x, fcInf|fcNan) -> fcmp ueq fabs(x), +inf

    // is.fpclass(x, ~(fcInf|fcNan)) -> fcmp une fabs(x), +inf

    Constant *Inf = ConstantFP::getInfinity(Src0->getType());

    FCmpInst::Predicate Pred =

        IsUnordered ? FCmpInst::FCMP_UEQ : FCmpInst::FCMP_OEQ;

    if (OrderedInvertedMask == fcInf)

      Pred = IsUnordered ? FCmpInst::FCMP_UNE : FCmpInst::FCMP_ONE;


    Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Src0);

    Value *CmpInf = Builder.CreateFCmp(Pred, Fabs, Inf);

    CmpInf->takeName(&II);

    return replaceInstUsesWith(II, CmpInf);

  }


  if ((OrderedMask == fcPosInf || OrderedMask == fcNegInf) &&

      (IsOrdered || IsUnordered) && !IsStrict) {

    // is.fpclass(x, fcPosInf) -> fcmp oeq x, +inf

    // is.fpclass(x, fcNegInf) -> fcmp oeq x, -inf

    // is.fpclass(x, fcPosInf|fcNan) -> fcmp ueq x, +inf

    // is.fpclass(x, fcNegInf|fcNan) -> fcmp ueq x, -inf

    Constant *Inf =

        ConstantFP::getInfinity(Src0->getType(), OrderedMask == fcNegInf);

    Value *EqInf = IsUnordered ? Builder.CreateFCmpUEQ(Src0, Inf)

                               : Builder.CreateFCmpOEQ(Src0, Inf);


    EqInf->takeName(&II);

    return replaceInstUsesWith(II, EqInf);

  }


  if ((OrderedInvertedMask == fcPosInf || OrderedInvertedMask == fcNegInf) &&

      (IsOrdered || IsUnordered) && !IsStrict) {

    // is.fpclass(x, ~fcPosInf) -> fcmp one x, +inf

    // is.fpclass(x, ~fcNegInf) -> fcmp one x, -inf

    // is.fpclass(x, ~fcPosInf|fcNan) -> fcmp une x, +inf

    // is.fpclass(x, ~fcNegInf|fcNan) -> fcmp une x, -inf

    Constant *Inf = ConstantFP::getInfinity(Src0->getType(),

                                            OrderedInvertedMask == fcNegInf);

    Value *NeInf = IsUnordered ? Builder.CreateFCmpUNE(Src0, Inf)

                               : Builder.CreateFCmpONE(Src0, Inf);

    NeInf->takeName(&II);

    return replaceInstUsesWith(II, NeInf);

  }


  if (Mask == fcNan && !IsStrict) {

    // Equivalent of isnan. Replace with standard fcmp if we don't care about FP

    // exceptions.

    Value *IsNan =

        Builder.CreateFCmpUNO(Src0, ConstantFP::getZero(Src0->getType()));

    IsNan->takeName(&II);

    return replaceInstUsesWith(II, IsNan);

  }


  if (Mask == (~fcNan & fcAllFlags) && !IsStrict) {

    // Equivalent of !isnan. Replace with standard fcmp.

    Value *FCmp =

        Builder.CreateFCmpORD(Src0, ConstantFP::getZero(Src0->getType()));

    FCmp->takeName(&II);

    return replaceInstUsesWith(II, FCmp);

  }


  FCmpInst::Predicate PredType = FCmpInst::BAD_FCMP_PREDICATE;


  // Try to replace with an fcmp with 0

  //

  // is.fpclass(x, fcZero) -> fcmp oeq x, 0.0

  // is.fpclass(x, fcZero | fcNan) -> fcmp ueq x, 0.0

  // is.fpclass(x, ~fcZero & ~fcNan) -> fcmp one x, 0.0

  // is.fpclass(x, ~fcZero) -> fcmp une x, 0.0

  //

  // is.fpclass(x, fcPosSubnormal | fcPosNormal | fcPosInf) -> fcmp ogt x, 0.0

  // is.fpclass(x, fcPositive | fcNegZero) -> fcmp oge x, 0.0

  //

  // is.fpclass(x, fcNegSubnormal | fcNegNormal | fcNegInf) -> fcmp olt x, 0.0

  // is.fpclass(x, fcNegative | fcPosZero) -> fcmp ole x, 0.0

  //

  if (!IsStrict && (IsOrdered || IsUnordered) &&

      (PredType = fpclassTestIsFCmp0(OrderedMask, *II.getFunction(),

                                     Src0->getType())) !=

          FCmpInst::BAD_FCMP_PREDICATE) {

    Constant *Zero = ConstantFP::getZero(Src0->getType());

    // Equivalent of == 0.

    Value *FCmp = Builder.CreateFCmp(

        IsUnordered ? FCmpInst::getUnorderedPredicate(PredType) : PredType,

        Src0, Zero);


    FCmp->takeName(&II);

    return replaceInstUsesWith(II, FCmp);

  }


  KnownFPClass Known = computeKnownFPClass(Src0, Mask, &II);


  // Clear test bits we know must be false from the source value.

  // fp_class (nnan x), qnan|snan|other -> fp_class (nnan x), other

  // fp_class (ninf x), ninf|pinf|other -> fp_class (ninf x), other

  if ((Mask & Known.KnownFPClasses) != Mask) {

    II.setArgOperand(

        1, ConstantInt::get(Src1->getType(), Mask & Known.KnownFPClasses));

    return &II;

  }


  // If none of the tests which can return false are possible, fold to true.

  // fp_class (nnan x), ~(qnan|snan) -> true

  // fp_class (ninf x), ~(ninf|pinf) -> true

  if (Mask == Known.KnownFPClasses)

    return replaceInstUsesWith(II, ConstantInt::get(II.getType(), true));


  return nullptr;

}


static std::optional<bool> getKnownSign(Value *Op, const SimplifyQuery &SQ) {

  KnownBits Known = computeKnownBits(Op, /*Depth=*/0, SQ);

  if (Known.isNonNegative())

    return false;

  if (Known.isNegative())

    return true;


  Value *X, *Y;

  if (match(Op, m_NSWSub(m_Value(X), m_Value(Y))))

    return isImpliedByDomCondition(ICmpInst::ICMP_SLT, X, Y, SQ.CxtI, SQ.DL);


  return std::nullopt;

}


static std::optional<bool> getKnownSignOrZero(Value *Op,

                                              const SimplifyQuery &SQ) {

  if (std::optional<bool> Sign = getKnownSign(Op, SQ))

    return Sign;


  Value *X, *Y;

  if (match(Op, m_NSWSub(m_Value(X), m_Value(Y))))

    return isImpliedByDomCondition(ICmpInst::ICMP_SLE, X, Y, SQ.CxtI, SQ.DL);


  return std::nullopt;

}


/// Return true if two values \p Op0 and \p Op1 are known to have the same sign.

static bool signBitMustBeTheSame(Value *Op0, Value *Op1,

                                 const SimplifyQuery &SQ) {

  std::optional<bool> Known1 = getKnownSign(Op1, SQ);

  if (!Known1)

    return false;

  std::optional<bool> Known0 = getKnownSign(Op0, SQ);

  if (!Known0)

    return false;

  return *Known0 == *Known1;

}


/// Try to canonicalize min/max(X + C0, C1) as min/max(X, C1 - C0) + C0. This

/// can trigger other combines.

static Instruction *moveAddAfterMinMax(IntrinsicInst *II,

                                       InstCombiner::BuilderTy &Builder) {

  Intrinsic::ID MinMaxID = II->getIntrinsicID();

  assert((MinMaxID == Intrinsic::smax || MinMaxID == Intrinsic::smin ||

          MinMaxID == Intrinsic::umax || MinMaxID == Intrinsic::umin) &&

         "Expected a min or max intrinsic");


  // TODO: Match vectors with undef elements, but undef may not propagate.

  Value *Op0 = II->getArgOperand(0), *Op1 = II->getArgOperand(1);

  Value *X;

  const APInt *C0, *C1;

  if (!match(Op0, m_OneUse(m_Add(m_Value(X), m_APInt(C0)))) ||

      !match(Op1, m_APInt(C1)))

    return nullptr;


  // Check for necessary no-wrap and overflow constraints.

  bool IsSigned = MinMaxID == Intrinsic::smax || MinMaxID == Intrinsic::smin;

  auto *Add = cast<BinaryOperator>(Op0);

  if ((IsSigned && !Add->hasNoSignedWrap()) ||

      (!IsSigned && !Add->hasNoUnsignedWrap()))

    return nullptr;


  // If the constant difference overflows, then instsimplify should reduce the

  // min/max to the add or C1.

  bool Overflow;

  APInt CDiff =

      IsSigned ? C1->ssub_ov(*C0, Overflow) : C1->usub_ov(*C0, Overflow);

  assert(!Overflow && "Expected simplify of min/max");


  // min/max (add X, C0), C1 --> add (min/max X, C1 - C0), C0

  // Note: the "mismatched" no-overflow setting does not propagate.

  Constant *NewMinMaxC = ConstantInt::get(II->getType(), CDiff);

  Value *NewMinMax = Builder.CreateBinaryIntrinsic(MinMaxID, X, NewMinMaxC);

  return IsSigned ? BinaryOperator::CreateNSWAdd(NewMinMax, Add->getOperand(1))

                  : BinaryOperator::CreateNUWAdd(NewMinMax, Add->getOperand(1));

}

/// Match a sadd_sat or ssub_sat which is using min/max to clamp the value.

Instruction *InstCombinerImpl::matchSAddSubSat(IntrinsicInst &MinMax1) {

  Type *Ty = MinMax1.getType();


  // We are looking for a tree of:

  // max(INT_MIN, min(INT_MAX, add(sext(A), sext(B))))

  // Where the min and max could be reversed

  Instruction *MinMax2;

  BinaryOperator *AddSub;

  const APInt *MinValue, *MaxValue;

  if (match(&MinMax1, m_SMin(m_Instruction(MinMax2), m_APInt(MaxValue)))) {

    if (!match(MinMax2, m_SMax(m_BinOp(AddSub), m_APInt(MinValue))))

      return nullptr;

  } else if (match(&MinMax1,

                   m_SMax(m_Instruction(MinMax2), m_APInt(MinValue)))) {

    if (!match(MinMax2, m_SMin(m_BinOp(AddSub), m_APInt(MaxValue))))

      return nullptr;

  } else

    return nullptr;


  // Check that the constants clamp a saturate, and that the new type would be

  // sensible to convert to.

  if (!(*MaxValue + 1).isPowerOf2() || -*MinValue != *MaxValue + 1)

    return nullptr;

  // In what bitwidth can this be treated as saturating arithmetics?

  unsigned NewBitWidth = (*MaxValue + 1).logBase2() + 1;

  // FIXME: This isn't quite right for vectors, but using the scalar type is a

  // good first approximation for what should be done there.

  if (!shouldChangeType(Ty->getScalarType()->getIntegerBitWidth(), NewBitWidth))

    return nullptr;


  // Also make sure that the inner min/max and the add/sub have one use.

  if (!MinMax2->hasOneUse() || !AddSub->hasOneUse())

    return nullptr;


  // Create the new type (which can be a vector type)

  Type *NewTy = Ty->getWithNewBitWidth(NewBitWidth);


  Intrinsic::ID IntrinsicID;

  if (AddSub->getOpcode() == Instruction::Add)

    IntrinsicID = Intrinsic::sadd_sat;

  else if (AddSub->getOpcode() == Instruction::Sub)

    IntrinsicID = Intrinsic::ssub_sat;

  else

    return nullptr;


  // The two operands of the add/sub must be nsw-truncatable to the NewTy. This

  // is usually achieved via a sext from a smaller type.

  if (ComputeMaxSignificantBits(AddSub->getOperand(0), 0, AddSub) >

          NewBitWidth ||

      ComputeMaxSignificantBits(AddSub->getOperand(1), 0, AddSub) > NewBitWidth)

    return nullptr;


  // Finally create and return the sat intrinsic, truncated to the new type

  Value *AT = Builder.CreateTrunc(AddSub->getOperand(0), NewTy);

  Value *BT = Builder.CreateTrunc(AddSub->getOperand(1), NewTy);

  Value *Sat = Builder.CreateIntrinsic(IntrinsicID, NewTy, {AT, BT});

  return CastInst::Create(Instruction::SExt, Sat, Ty);

}


/// If we have a clamp pattern like max (min X, 42), 41 -- where the output

/// can only be one of two possible constant values -- turn that into a select

/// of constants.

static Instruction *foldClampRangeOfTwo(IntrinsicInst *II,

                                        InstCombiner::BuilderTy &Builder) {

  Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

  Value *X;

  const APInt *C0, *C1;

  if (!match(I1, m_APInt(C1)) || !I0->hasOneUse())

    return nullptr;


  CmpInst::Predicate Pred = CmpInst::BAD_ICMP_PREDICATE;

  switch (II->getIntrinsicID()) {

  case Intrinsic::smax:

    if (match(I0, m_SMin(m_Value(X), m_APInt(C0))) && *C0 == *C1 + 1)

      Pred = ICmpInst::ICMP_SGT;

    break;

  case Intrinsic::smin:

    if (match(I0, m_SMax(m_Value(X), m_APInt(C0))) && *C1 == *C0 + 1)

      Pred = ICmpInst::ICMP_SLT;

    break;

  case Intrinsic::umax:

    if (match(I0, m_UMin(m_Value(X), m_APInt(C0))) && *C0 == *C1 + 1)

      Pred = ICmpInst::ICMP_UGT;

    break;

  case Intrinsic::umin:

    if (match(I0, m_UMax(m_Value(X), m_APInt(C0))) && *C1 == *C0 + 1)

      Pred = ICmpInst::ICMP_ULT;

    break;

  default:

    llvm_unreachable("Expected min/max intrinsic");

  }

  if (Pred == CmpInst::BAD_ICMP_PREDICATE)

    return nullptr;


  // max (min X, 42), 41 --> X > 41 ? 42 : 41

  // min (max X, 42), 43 --> X < 43 ? 42 : 43

  Value *Cmp = Builder.CreateICmp(Pred, X, I1);

  return SelectInst::Create(Cmp, ConstantInt::get(II->getType(), *C0), I1);

}


/// If this min/max has a constant operand and an operand that is a matching

/// min/max with a constant operand, constant-fold the 2 constant operands.

static Value *reassociateMinMaxWithConstants(IntrinsicInst *II,

                                             IRBuilderBase &Builder,

                                             const SimplifyQuery &SQ) {

  Intrinsic::ID MinMaxID = II->getIntrinsicID();

  auto *LHS = dyn_cast<MinMaxIntrinsic>(II->getArgOperand(0));

  if (!LHS)

    return nullptr;


  Constant *C0, *C1;

  if (!match(LHS->getArgOperand(1), m_ImmConstant(C0)) ||

      !match(II->getArgOperand(1), m_ImmConstant(C1)))

    return nullptr;


  // max (max X, C0), C1 --> max X, (max C0, C1)

  // min (min X, C0), C1 --> min X, (min C0, C1)

  // umax (smax X, nneg C0), nneg C1 --> smax X, (umax C0, C1)

  // smin (umin X, nneg C0), nneg C1 --> umin X, (smin C0, C1)

  Intrinsic::ID InnerMinMaxID = LHS->getIntrinsicID();

  if (InnerMinMaxID != MinMaxID &&

      !(((MinMaxID == Intrinsic::umax && InnerMinMaxID == Intrinsic::smax) ||

         (MinMaxID == Intrinsic::smin && InnerMinMaxID == Intrinsic::umin)) &&

        isKnownNonNegative(C0, SQ) && isKnownNonNegative(C1, SQ)))

    return nullptr;


  ICmpInst::Predicate Pred = MinMaxIntrinsic::getPredicate(MinMaxID);

  Value *CondC = Builder.CreateICmp(Pred, C0, C1);

  Value *NewC = Builder.CreateSelect(CondC, C0, C1);

  return Builder.CreateIntrinsic(InnerMinMaxID, II->getType(),

                                 {LHS->getArgOperand(0), NewC});

}


/// If this min/max has a matching min/max operand with a constant, try to push

/// the constant operand into this instruction. This can enable more folds.

static Instruction *

reassociateMinMaxWithConstantInOperand(IntrinsicInst *II,

                                       InstCombiner::BuilderTy &Builder) {

  // Match and capture a min/max operand candidate.

  Value *X, *Y;

  Constant *C;

  Instruction *Inner;

  if (!match(II, m_c_MaxOrMin(m_OneUse(m_CombineAnd(

                                  m_Instruction(Inner),

                                  m_MaxOrMin(m_Value(X), m_ImmConstant(C)))),

                              m_Value(Y))))

    return nullptr;


  // The inner op must match. Check for constants to avoid infinite loops.

  Intrinsic::ID MinMaxID = II->getIntrinsicID();

  auto *InnerMM = dyn_cast<IntrinsicInst>(Inner);

  if (!InnerMM || InnerMM->getIntrinsicID() != MinMaxID ||

      match(X, m_ImmConstant()) || match(Y, m_ImmConstant()))

    return nullptr;


  // max (max X, C), Y --> max (max X, Y), C

  Function *MinMax = Intrinsic::getOrInsertDeclaration(II->getModule(),

                                                       MinMaxID, II->getType());

  Value *NewInner = Builder.CreateBinaryIntrinsic(MinMaxID, X, Y);

  NewInner->takeName(Inner);

  return CallInst::Create(MinMax, {NewInner, C});

}


/// Reduce a sequence of min/max intrinsics with a common operand.

static Instruction *factorizeMinMaxTree(IntrinsicInst *II) {

  // Match 3 of the same min/max ops. Example: umin(umin(), umin()).

  auto *LHS = dyn_cast<IntrinsicInst>(II->getArgOperand(0));

  auto *RHS = dyn_cast<IntrinsicInst>(II->getArgOperand(1));

  Intrinsic::ID MinMaxID = II->getIntrinsicID();

  if (!LHS || !RHS || LHS->getIntrinsicID() != MinMaxID ||

      RHS->getIntrinsicID() != MinMaxID ||

      (!LHS->hasOneUse() && !RHS->hasOneUse()))

    return nullptr;


  Value *A = LHS->getArgOperand(0);

  Value *B = LHS->getArgOperand(1);

  Value *C = RHS->getArgOperand(0);

  Value *D = RHS->getArgOperand(1);


  // Look for a common operand.

  Value *MinMaxOp = nullptr;

  Value *ThirdOp = nullptr;

  if (LHS->hasOneUse()) {

    // If the LHS is only used in this chain and the RHS is used outside of it,

    // reuse the RHS min/max because that will eliminate the LHS.

    if (D == A || C == A) {

      // min(min(a, b), min(c, a)) --> min(min(c, a), b)

      // min(min(a, b), min(a, d)) --> min(min(a, d), b)

      MinMaxOp = RHS;

      ThirdOp = B;

    } else if (D == B || C == B) {

      // min(min(a, b), min(c, b)) --> min(min(c, b), a)

      // min(min(a, b), min(b, d)) --> min(min(b, d), a)

      MinMaxOp = RHS;

      ThirdOp = A;

    }

  } else {

    assert(RHS->hasOneUse() && "Expected one-use operand");

    // Reuse the LHS. This will eliminate the RHS.

    if (D == A || D == B) {

      // min(min(a, b), min(c, a)) --> min(min(a, b), c)

      // min(min(a, b), min(c, b)) --> min(min(a, b), c)

      MinMaxOp = LHS;

      ThirdOp = C;

    } else if (C == A || C == B) {

      // min(min(a, b), min(b, d)) --> min(min(a, b), d)

      // min(min(a, b), min(c, b)) --> min(min(a, b), d)

      MinMaxOp = LHS;

      ThirdOp = D;

    }

  }


  if (!MinMaxOp || !ThirdOp)

    return nullptr;


  Module *Mod = II->getModule();

  Function *MinMax =

      Intrinsic::getOrInsertDeclaration(Mod, MinMaxID, II->getType());

  return CallInst::Create(MinMax, { MinMaxOp, ThirdOp });

}


/// If all arguments of the intrinsic are unary shuffles with the same mask,

/// try to shuffle after the intrinsic.

static Instruction *

foldShuffledIntrinsicOperands(IntrinsicInst *II,

                              InstCombiner::BuilderTy &Builder) {

  // TODO: This should be extended to handle other intrinsics like fshl, ctpop,

  //       etc. Use llvm::isTriviallyVectorizable() and related to determine

  //       which intrinsics are safe to shuffle?

  switch (II->getIntrinsicID()) {

  case Intrinsic::smax:

  case Intrinsic::smin:

  case Intrinsic::umax:

  case Intrinsic::umin:

  case Intrinsic::fma:

  case Intrinsic::fshl:

  case Intrinsic::fshr:

    break;

  default:

    return nullptr;

  }


  Value *X;

  ArrayRef<int> Mask;

  if (!match(II->getArgOperand(0),

             m_Shuffle(m_Value(X), m_Undef(), m_Mask(Mask))))

    return nullptr;


  // At least 1 operand must have 1 use because we are creating 2 instructions.

  if (none_of(II->args(), [](Value *V) { return V->hasOneUse(); }))

    return nullptr;


  // See if all arguments are shuffled with the same mask.

  SmallVector<Value *, 4> NewArgs(II->arg_size());

  NewArgs[0] = X;

  Type *SrcTy = X->getType();

  for (unsigned i = 1, e = II->arg_size(); i != e; ++i) {

    if (!match(II->getArgOperand(i),

               m_Shuffle(m_Value(X), m_Undef(), m_SpecificMask(Mask))) ||

        X->getType() != SrcTy)

      return nullptr;

    NewArgs[i] = X;

  }


  // intrinsic (shuf X, M), (shuf Y, M), ... --> shuf (intrinsic X, Y, ...), M

  Instruction *FPI = isa<FPMathOperator>(II) ? II : nullptr;

  Value *NewIntrinsic =

      Builder.CreateIntrinsic(II->getIntrinsicID(), SrcTy, NewArgs, FPI);

  return new ShuffleVectorInst(NewIntrinsic, Mask);

}


/// Fold the following cases and accepts bswap and bitreverse intrinsics:

///   bswap(logic_op(bswap(x), y)) --> logic_op(x, bswap(y))

///   bswap(logic_op(bswap(x), bswap(y))) --> logic_op(x, y) (ignores multiuse)

template <Intrinsic::ID IntrID>

static Instruction *foldBitOrderCrossLogicOp(Value *V,

                                             InstCombiner::BuilderTy &Builder) {

  static_assert(IntrID == Intrinsic::bswap || IntrID == Intrinsic::bitreverse,

                "This helper only supports BSWAP and BITREVERSE intrinsics");


  Value *X, *Y;

  // Find bitwise logic op. Check that it is a BinaryOperator explicitly so we

  // don't match ConstantExpr that aren't meaningful for this transform.

  if (match(V, m_OneUse(m_BitwiseLogic(m_Value(X), m_Value(Y)))) &&

      isa<BinaryOperator>(V)) {

    Value *OldReorderX, *OldReorderY;

    BinaryOperator::BinaryOps Op = cast<BinaryOperator>(V)->getOpcode();


    // If both X and Y are bswap/bitreverse, the transform reduces the number

    // of instructions even if there's multiuse.

    // If only one operand is bswap/bitreverse, we need to ensure the operand

    // have only one use.

    if (match(X, m_Intrinsic<IntrID>(m_Value(OldReorderX))) &&

        match(Y, m_Intrinsic<IntrID>(m_Value(OldReorderY)))) {

      return BinaryOperator::Create(Op, OldReorderX, OldReorderY);

    }


    if (match(X, m_OneUse(m_Intrinsic<IntrID>(m_Value(OldReorderX))))) {

      Value *NewReorder = Builder.CreateUnaryIntrinsic(IntrID, Y);

      return BinaryOperator::Create(Op, OldReorderX, NewReorder);

    }


    if (match(Y, m_OneUse(m_Intrinsic<IntrID>(m_Value(OldReorderY))))) {

      Value *NewReorder = Builder.CreateUnaryIntrinsic(IntrID, X);

      return BinaryOperator::Create(Op, NewReorder, OldReorderY);

    }

  }

  return nullptr;

}


static Value *simplifyReductionOperand(Value *Arg, bool CanReorderLanes) {

  if (!CanReorderLanes)

    return nullptr;


  Value *V;

  if (match(Arg, m_VecReverse(m_Value(V))))

    return V;


  ArrayRef<int> Mask;

  if (!isa<FixedVectorType>(Arg->getType()) ||

      !match(Arg, m_Shuffle(m_Value(V), m_Undef(), m_Mask(Mask))) ||

      !cast<ShuffleVectorInst>(Arg)->isSingleSource())

    return nullptr;


  int Sz = Mask.size();

  SmallBitVector UsedIndices(Sz);

  for (int Idx : Mask) {

    if (Idx == PoisonMaskElem || UsedIndices.test(Idx))

      return nullptr;

    UsedIndices.set(Idx);

  }


  // Can remove shuffle iff just shuffled elements, no repeats, undefs, or

  // other changes.

  return UsedIndices.all() ? V : nullptr;

}


/// Fold an unsigned minimum of trailing or leading zero bits counts:

///   umin(cttz(CtOp, ZeroUndef), ConstOp) --> cttz(CtOp | (1 << ConstOp))

///   umin(ctlz(CtOp, ZeroUndef), ConstOp) --> ctlz(CtOp | (SignedMin

///                                              >> ConstOp))

template <Intrinsic::ID IntrID>

static Value *

foldMinimumOverTrailingOrLeadingZeroCount(Value *I0, Value *I1,

                                          const DataLayout &DL,

                                          InstCombiner::BuilderTy &Builder) {

  static_assert(IntrID == Intrinsic::cttz || IntrID == Intrinsic::ctlz,

                "This helper only supports cttz and ctlz intrinsics");


  Value *CtOp;

  Value *ZeroUndef;

  if (!match(I0,

             m_OneUse(m_Intrinsic<IntrID>(m_Value(CtOp), m_Value(ZeroUndef)))))

    return nullptr;


  unsigned BitWidth = I1->getType()->getScalarSizeInBits();

  auto LessBitWidth = [BitWidth](auto &C) { return C.ult(BitWidth); };

  if (!match(I1, m_CheckedInt(LessBitWidth)))

    // We have a constant >= BitWidth (which can be handled by CVP)

    // or a non-splat vector with elements < and >= BitWidth

    return nullptr;


  Type *Ty = I1->getType();

  Constant *NewConst = ConstantFoldBinaryOpOperands(

      IntrID == Intrinsic::cttz ? Instruction::Shl : Instruction::LShr,

      IntrID == Intrinsic::cttz

          ? ConstantInt::get(Ty, 1)

          : ConstantInt::get(Ty, APInt::getSignedMinValue(BitWidth)),

      cast<Constant>(I1), DL);

  return Builder.CreateBinaryIntrinsic(

      IntrID, Builder.CreateOr(CtOp, NewConst),

      ConstantInt::getTrue(ZeroUndef->getType()));

}


/// Return whether "X LOp (Y ROp Z)" is always equal to

/// "(X LOp Y) ROp (X LOp Z)".

static bool leftDistributesOverRight(Instruction::BinaryOps LOp, bool HasNUW,

                                     bool HasNSW, Intrinsic::ID ROp) {

  switch (ROp) {

  case Intrinsic::umax:

  case Intrinsic::umin:

    return HasNUW && LOp == Instruction::Add;

  case Intrinsic::smax:

  case Intrinsic::smin:

    return HasNSW && LOp == Instruction::Add;

  default:

    return false;

  }

}


// Attempts to factorise a common term

// in an instruction that has the form "(A op' B) op (C op' D)

// where op is an intrinsic and op' is a binop

static Value *

foldIntrinsicUsingDistributiveLaws(IntrinsicInst *II,

                                   InstCombiner::BuilderTy &Builder) {

  Value *LHS = II->getOperand(0), *RHS = II->getOperand(1);

  Intrinsic::ID TopLevelOpcode = II->getIntrinsicID();


  OverflowingBinaryOperator *Op0 = dyn_cast<OverflowingBinaryOperator>(LHS);

  OverflowingBinaryOperator *Op1 = dyn_cast<OverflowingBinaryOperator>(RHS);


  if (!Op0 || !Op1)

    return nullptr;


  if (Op0->getOpcode() != Op1->getOpcode())

    return nullptr;


  if (!Op0->hasOneUse() || !Op1->hasOneUse())

    return nullptr;


  Instruction::BinaryOps InnerOpcode =

      static_cast<Instruction::BinaryOps>(Op0->getOpcode());

  bool HasNUW = Op0->hasNoUnsignedWrap() && Op1->hasNoUnsignedWrap();

  bool HasNSW = Op0->hasNoSignedWrap() && Op1->hasNoSignedWrap();


  if (!leftDistributesOverRight(InnerOpcode, HasNUW, HasNSW, TopLevelOpcode))

    return nullptr;


  assert(II->isCommutative() && Op0->isCommutative() &&

         "Only inner and outer commutative op codes are supported.");


  Value *A = Op0->getOperand(0);

  Value *B = Op0->getOperand(1);

  Value *C = Op1->getOperand(0);

  Value *D = Op1->getOperand(1);


  // Attempts to swap variables such that A always equals C

  if (A != C && A != D)

    std::swap(A, B);

  if (A == C || A == D) {

    if (A != C)

      std::swap(C, D);

    Value *NewIntrinsic = Builder.CreateBinaryIntrinsic(TopLevelOpcode, B, D);

    BinaryOperator *NewBinop =

        cast<BinaryOperator>(Builder.CreateBinOp(InnerOpcode, NewIntrinsic, A));

    NewBinop->setHasNoSignedWrap(HasNSW);

    NewBinop->setHasNoUnsignedWrap(HasNUW);

    return NewBinop;

  }


  return nullptr;

}


/// CallInst simplification. This mostly only handles folding of intrinsic

/// instructions. For normal calls, it allows visitCallBase to do the heavy

/// lifting.

Instruction *InstCombinerImpl::visitCallInst(CallInst &CI) {

  // Don't try to simplify calls without uses. It will not do anything useful,

  // but will result in the following folds being skipped.

  if (!CI.use_empty()) {

    SmallVector<Value *, 8> Args(CI.args());

    if (Value *V = simplifyCall(&CI, CI.getCalledOperand(), Args,

                                SQ.getWithInstruction(&CI)))

      return replaceInstUsesWith(CI, V);

  }


  if (Value *FreedOp = getFreedOperand(&CI, &TLI))

    return visitFree(CI, FreedOp);


  // If the caller function (i.e. us, the function that contains this CallInst)

  // is nounwind, mark the call as nounwind, even if the callee isn't.

  if (CI.getFunction()->doesNotThrow() && !CI.doesNotThrow()) {

    CI.setDoesNotThrow();

    return &CI;

  }


  IntrinsicInst *II = dyn_cast<IntrinsicInst>(&CI);

  if (!II) return visitCallBase(CI);


  // For atomic unordered mem intrinsics if len is not a positive or

  // not a multiple of element size then behavior is undefined.

  if (auto *AMI = dyn_cast<AtomicMemIntrinsic>(II))

    if (ConstantInt *NumBytes = dyn_cast<ConstantInt>(AMI->getLength()))

      if (NumBytes->isNegative() ||

          (NumBytes->getZExtValue() % AMI->getElementSizeInBytes() != 0)) {

        CreateNonTerminatorUnreachable(AMI);

        assert(AMI->getType()->isVoidTy() &&

               "non void atomic unordered mem intrinsic");

        return eraseInstFromFunction(*AMI);

      }


  // Intrinsics cannot occur in an invoke or a callbr, so handle them here

  // instead of in visitCallBase.

  if (auto *MI = dyn_cast<AnyMemIntrinsic>(II)) {

    bool Changed = false;


    // memmove/cpy/set of zero bytes is a noop.

    if (Constant *NumBytes = dyn_cast<Constant>(MI->getLength())) {

      if (NumBytes->isNullValue())

        return eraseInstFromFunction(CI);

    }


    // No other transformations apply to volatile transfers.

    if (auto *M = dyn_cast<MemIntrinsic>(MI))

      if (M->isVolatile())

        return nullptr;


    // If we have a memmove and the source operation is a constant global,

    // then the source and dest pointers can't alias, so we can change this

    // into a call to memcpy.

    if (auto *MMI = dyn_cast<AnyMemMoveInst>(MI)) {

      if (GlobalVariable *GVSrc = dyn_cast<GlobalVariable>(MMI->getSource()))

        if (GVSrc->isConstant()) {

          Module *M = CI.getModule();

          Intrinsic::ID MemCpyID =

              isa<AtomicMemMoveInst>(MMI)

                  ? Intrinsic::memcpy_element_unordered_atomic

                  : Intrinsic::memcpy;

          Type *Tys[3] = { CI.getArgOperand(0)->getType(),

                           CI.getArgOperand(1)->getType(),

                           CI.getArgOperand(2)->getType() };

          CI.setCalledFunction(

              Intrinsic::getOrInsertDeclaration(M, MemCpyID, Tys));

          Changed = true;

        }

    }


    if (AnyMemTransferInst *MTI = dyn_cast<AnyMemTransferInst>(MI)) {

      // memmove(x,x,size) -> noop.

      if (MTI->getSource() == MTI->getDest())

        return eraseInstFromFunction(CI);

    }


    auto IsPointerUndefined = [MI](Value *Ptr) {

      return isa<ConstantPointerNull>(Ptr) &&

             !NullPointerIsDefined(

                 MI->getFunction(),

                 cast<PointerType>(Ptr->getType())->getAddressSpace());

    };

    bool SrcIsUndefined = false;

    // If we can determine a pointer alignment that is bigger than currently

    // set, update the alignment.

    if (auto *MTI = dyn_cast<AnyMemTransferInst>(MI)) {

      if (Instruction *I = SimplifyAnyMemTransfer(MTI))

        return I;

      SrcIsUndefined = IsPointerUndefined(MTI->getRawSource());

    } else if (auto *MSI = dyn_cast<AnyMemSetInst>(MI)) {

      if (Instruction *I = SimplifyAnyMemSet(MSI))

        return I;

    }


    // If src/dest is null, this memory intrinsic must be a noop.

    if (SrcIsUndefined || IsPointerUndefined(MI->getRawDest())) {

      Builder.CreateAssumption(Builder.CreateIsNull(MI->getLength()));

      return eraseInstFromFunction(CI);

    }


    if (Changed) return II;

  }


  // For fixed width vector result intrinsics, use the generic demanded vector

  // support.

  if (auto *IIFVTy = dyn_cast<FixedVectorType>(II->getType())) {

    auto VWidth = IIFVTy->getNumElements();

    APInt PoisonElts(VWidth, 0);

    APInt AllOnesEltMask(APInt::getAllOnes(VWidth));

    if (Value *V = SimplifyDemandedVectorElts(II, AllOnesEltMask, PoisonElts)) {

      if (V != II)

        return replaceInstUsesWith(*II, V);

      return II;

    }

  }


  if (II->isCommutative()) {

    if (auto Pair = matchSymmetricPair(II->getOperand(0), II->getOperand(1))) {

      replaceOperand(*II, 0, Pair->first);

      replaceOperand(*II, 1, Pair->second);

      return II;

    }


    if (CallInst *NewCall = canonicalizeConstantArg0ToArg1(CI))

      return NewCall;

  }


  // Unused constrained FP intrinsic calls may have declared side effect, which

  // prevents it from being removed. In some cases however the side effect is

  // actually absent. To detect this case, call SimplifyConstrainedFPCall. If it

  // returns a replacement, the call may be removed.

  if (CI.use_empty() && isa<ConstrainedFPIntrinsic>(CI)) {

    if (simplifyConstrainedFPCall(&CI, SQ.getWithInstruction(&CI)))

      return eraseInstFromFunction(CI);

  }


  Intrinsic::ID IID = II->getIntrinsicID();

  switch (IID) {

  case Intrinsic::objectsize: {

    SmallVector<Instruction *> InsertedInstructions;

    if (Value *V = lowerObjectSizeCall(II, DL, &TLI, AA, /*MustSucceed=*/false,

                                       &InsertedInstructions)) {

      for (Instruction *Inserted : InsertedInstructions)

        Worklist.add(Inserted);

      return replaceInstUsesWith(CI, V);

    }

    return nullptr;

  }

  case Intrinsic::abs: {

    Value *IIOperand = II->getArgOperand(0);

    bool IntMinIsPoison = cast<Constant>(II->getArgOperand(1))->isOneValue();


    // abs(-x) -> abs(x)

    // TODO: Copy nsw if it was present on the neg?

    Value *X;

    if (match(IIOperand, m_Neg(m_Value(X))))

      return replaceOperand(*II, 0, X);

    if (match(IIOperand, m_c_Select(m_Neg(m_Value(X)), m_Deferred(X))))

      return replaceOperand(*II, 0, X);


    Value *Y;

    // abs(a * abs(b)) -> abs(a * b)

    if (match(IIOperand,

              m_OneUse(m_c_Mul(m_Value(X),

                               m_Intrinsic<Intrinsic::abs>(m_Value(Y)))))) {

      bool NSW =

          cast<Instruction>(IIOperand)->hasNoSignedWrap() && IntMinIsPoison;

      auto *XY = NSW ? Builder.CreateNSWMul(X, Y) : Builder.CreateMul(X, Y);

      return replaceOperand(*II, 0, XY);

    }


    if (std::optional<bool> Known =

            getKnownSignOrZero(IIOperand, SQ.getWithInstruction(II))) {

      // abs(x) -> x if x >= 0 (include abs(x-y) --> x - y where x >= y)

      // abs(x) -> x if x > 0 (include abs(x-y) --> x - y where x > y)

      if (!*Known)

        return replaceInstUsesWith(*II, IIOperand);


      // abs(x) -> -x if x < 0

      // abs(x) -> -x if x < = 0 (include abs(x-y) --> y - x where x <= y)

      if (IntMinIsPoison)

        return BinaryOperator::CreateNSWNeg(IIOperand);

      return BinaryOperator::CreateNeg(IIOperand);

    }


    // abs (sext X) --> zext (abs X*)

    // Clear the IsIntMin (nsw) bit on the abs to allow narrowing.

    if (match(IIOperand, m_OneUse(m_SExt(m_Value(X))))) {

      Value *NarrowAbs =

          Builder.CreateBinaryIntrinsic(Intrinsic::abs, X, Builder.getFalse());

      return CastInst::Create(Instruction::ZExt, NarrowAbs, II->getType());

    }


    // Match a complicated way to check if a number is odd/even:

    // abs (srem X, 2) --> and X, 1

    const APInt *C;

    if (match(IIOperand, m_SRem(m_Value(X), m_APInt(C))) && *C == 2)

      return BinaryOperator::CreateAnd(X, ConstantInt::get(II->getType(), 1));


    break;

  }

  case Intrinsic::umin: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    // umin(x, 1) == zext(x != 0)

    if (match(I1, m_One())) {

      assert(II->getType()->getScalarSizeInBits() != 1 &&

             "Expected simplify of umin with max constant");

      Value *Zero = Constant::getNullValue(I0->getType());

      Value *Cmp = Builder.CreateICmpNE(I0, Zero);

      return CastInst::Create(Instruction::ZExt, Cmp, II->getType());

    }

    // umin(cttz(x), const) --> cttz(x | (1 << const))

    if (Value *FoldedCttz =

            foldMinimumOverTrailingOrLeadingZeroCount<Intrinsic::cttz>(

                I0, I1, DL, Builder))

      return replaceInstUsesWith(*II, FoldedCttz);

    // umin(ctlz(x), const) --> ctlz(x | (SignedMin >> const))

    if (Value *FoldedCtlz =

            foldMinimumOverTrailingOrLeadingZeroCount<Intrinsic::ctlz>(

                I0, I1, DL, Builder))

      return replaceInstUsesWith(*II, FoldedCtlz);

    [[fallthrough]];

  }

  case Intrinsic::umax: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(I0, m_ZExt(m_Value(X))) && match(I1, m_ZExt(m_Value(Y))) &&

        (I0->hasOneUse() || I1->hasOneUse()) && X->getType() == Y->getType()) {

      Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, Y);

      return CastInst::Create(Instruction::ZExt, NarrowMaxMin, II->getType());

    }

    Constant *C;

    if (match(I0, m_ZExt(m_Value(X))) && match(I1, m_Constant(C)) &&

        I0->hasOneUse()) {

      if (Constant *NarrowC = getLosslessUnsignedTrunc(C, X->getType())) {

        Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, NarrowC);

        return CastInst::Create(Instruction::ZExt, NarrowMaxMin, II->getType());

      }

    }

    // If C is not 0:

    //   umax(nuw_shl(x, C), x + 1) -> x == 0 ? 1 : nuw_shl(x, C)

    // If C is not 0 or 1:

    //   umax(nuw_mul(x, C), x + 1) -> x == 0 ? 1 : nuw_mul(x, C)

    auto foldMaxMulShift = [&](Value *A, Value *B) -> Instruction * {

      const APInt *C;

      Value *X;

      if (!match(A, m_NUWShl(m_Value(X), m_APInt(C))) &&

          !(match(A, m_NUWMul(m_Value(X), m_APInt(C))) && !C->isOne()))

        return nullptr;

      if (C->isZero())

        return nullptr;

      if (!match(B, m_OneUse(m_Add(m_Specific(X), m_One()))))

        return nullptr;


      Value *Cmp = Builder.CreateICmpEQ(X, ConstantInt::get(X->getType(), 0));

      Value *NewSelect =

          Builder.CreateSelect(Cmp, ConstantInt::get(X->getType(), 1), A);

      return replaceInstUsesWith(*II, NewSelect);

    };


    if (IID == Intrinsic::umax) {

      if (Instruction *I = foldMaxMulShift(I0, I1))

        return I;

      if (Instruction *I = foldMaxMulShift(I1, I0))

        return I;

    }

    // If both operands of unsigned min/max are sign-extended, it is still ok

    // to narrow the operation.

    [[fallthrough]];

  }

  case Intrinsic::smax:

  case Intrinsic::smin: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(I0, m_SExt(m_Value(X))) && match(I1, m_SExt(m_Value(Y))) &&

        (I0->hasOneUse() || I1->hasOneUse()) && X->getType() == Y->getType()) {

      Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, Y);

      return CastInst::Create(Instruction::SExt, NarrowMaxMin, II->getType());

    }


    Constant *C;

    if (match(I0, m_SExt(m_Value(X))) && match(I1, m_Constant(C)) &&

        I0->hasOneUse()) {

      if (Constant *NarrowC = getLosslessSignedTrunc(C, X->getType())) {

        Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, NarrowC);

        return CastInst::Create(Instruction::SExt, NarrowMaxMin, II->getType());

      }

    }


    // umin(i1 X, i1 Y) -> and i1 X, Y

    // smax(i1 X, i1 Y) -> and i1 X, Y

    if ((IID == Intrinsic::umin || IID == Intrinsic::smax) &&

        II->getType()->isIntOrIntVectorTy(1)) {

      return BinaryOperator::CreateAnd(I0, I1);

    }


    // umax(i1 X, i1 Y) -> or i1 X, Y

    // smin(i1 X, i1 Y) -> or i1 X, Y

    if ((IID == Intrinsic::umax || IID == Intrinsic::smin) &&

        II->getType()->isIntOrIntVectorTy(1)) {

      return BinaryOperator::CreateOr(I0, I1);

    }


    if (IID == Intrinsic::smax || IID == Intrinsic::smin) {

      // smax (neg nsw X), (neg nsw Y) --> neg nsw (smin X, Y)

      // smin (neg nsw X), (neg nsw Y) --> neg nsw (smax X, Y)

      // TODO: Canonicalize neg after min/max if I1 is constant.

      if (match(I0, m_NSWNeg(m_Value(X))) && match(I1, m_NSWNeg(m_Value(Y))) &&

          (I0->hasOneUse() || I1->hasOneUse())) {

        Intrinsic::ID InvID = getInverseMinMaxIntrinsic(IID);

        Value *InvMaxMin = Builder.CreateBinaryIntrinsic(InvID, X, Y);

        return BinaryOperator::CreateNSWNeg(InvMaxMin);

      }

    }


    // (umax X, (xor X, Pow2))

    //      -> (or X, Pow2)

    // (umin X, (xor X, Pow2))

    //      -> (and X, ~Pow2)

    // (smax X, (xor X, Pos_Pow2))

    //      -> (or X, Pos_Pow2)

    // (smin X, (xor X, Pos_Pow2))

    //      -> (and X, ~Pos_Pow2)

    // (smax X, (xor X, Neg_Pow2))

    //      -> (and X, ~Neg_Pow2)

    // (smin X, (xor X, Neg_Pow2))

    //      -> (or X, Neg_Pow2)

    if ((match(I0, m_c_Xor(m_Specific(I1), m_Value(X))) ||

         match(I1, m_c_Xor(m_Specific(I0), m_Value(X)))) &&

        isKnownToBeAPowerOfTwo(X, /* OrZero */ true)) {

      bool UseOr = IID == Intrinsic::smax || IID == Intrinsic::umax;

      bool UseAndN = IID == Intrinsic::smin || IID == Intrinsic::umin;


      if (IID == Intrinsic::smax || IID == Intrinsic::smin) {

        auto KnownSign = getKnownSign(X, SQ.getWithInstruction(II));

        if (KnownSign == std::nullopt) {

          UseOr = false;

          UseAndN = false;

        } else if (*KnownSign /* true is Signed. */) {

          UseOr ^= true;

          UseAndN ^= true;

          Type *Ty = I0->getType();

          // Negative power of 2 must be IntMin. It's possible to be able to

          // prove negative / power of 2 without actually having known bits, so

          // just get the value by hand.

          X = Constant::getIntegerValue(

              Ty, APInt::getSignedMinValue(Ty->getScalarSizeInBits()));

        }

      }

      if (UseOr)

        return BinaryOperator::CreateOr(I0, X);

      else if (UseAndN)

        return BinaryOperator::CreateAnd(I0, Builder.CreateNot(X));

    }


    // If we can eliminate ~A and Y is free to invert:

    // max ~A, Y --> ~(min A, ~Y)

    //

    // Examples:

    // max ~A, ~Y --> ~(min A, Y)

    // max ~A, C --> ~(min A, ~C)

    // max ~A, (max ~Y, ~Z) --> ~min( A, (min Y, Z))

    auto moveNotAfterMinMax = [&](Value *X, Value *Y) -> Instruction * {

      Value *A;

      if (match(X, m_OneUse(m_Not(m_Value(A)))) &&

          !isFreeToInvert(A, A->hasOneUse())) {

        if (Value *NotY = getFreelyInverted(Y, Y->hasOneUse(), &Builder)) {

          Intrinsic::ID InvID = getInverseMinMaxIntrinsic(IID);

          Value *InvMaxMin = Builder.CreateBinaryIntrinsic(InvID, A, NotY);

          return BinaryOperator::CreateNot(InvMaxMin);

        }

      }

      return nullptr;

    };


    if (Instruction *I = moveNotAfterMinMax(I0, I1))

      return I;

    if (Instruction *I = moveNotAfterMinMax(I1, I0))

      return I;


    if (Instruction *I = moveAddAfterMinMax(II, Builder))

      return I;


    // minmax (X & NegPow2C, Y & NegPow2C) --> minmax(X, Y) & NegPow2C

    const APInt *RHSC;

    if (match(I0, m_OneUse(m_And(m_Value(X), m_NegatedPower2(RHSC)))) &&

        match(I1, m_OneUse(m_And(m_Value(Y), m_SpecificInt(*RHSC)))))

      return BinaryOperator::CreateAnd(Builder.CreateBinaryIntrinsic(IID, X, Y),

                                       ConstantInt::get(II->getType(), *RHSC));


    // smax(X, -X) --> abs(X)

    // smin(X, -X) --> -abs(X)

    // umax(X, -X) --> -abs(X)

    // umin(X, -X) --> abs(X)

    if (isKnownNegation(I0, I1)) {

      // We can choose either operand as the input to abs(), but if we can

      // eliminate the only use of a value, that's better for subsequent

      // transforms/analysis.

      if (I0->hasOneUse() && !I1->hasOneUse())

        std::swap(I0, I1);


      // This is some variant of abs(). See if we can propagate 'nsw' to the abs

      // operation and potentially its negation.

      bool IntMinIsPoison = isKnownNegation(I0, I1, /* NeedNSW */ true);

      Value *Abs = Builder.CreateBinaryIntrinsic(

          Intrinsic::abs, I0,

          ConstantInt::getBool(II->getContext(), IntMinIsPoison));


      // We don't have a "nabs" intrinsic, so negate if needed based on the

      // max/min operation.

      if (IID == Intrinsic::smin || IID == Intrinsic::umax)

        Abs = Builder.CreateNeg(Abs, "nabs", IntMinIsPoison);

      return replaceInstUsesWith(CI, Abs);

    }


    if (Instruction *Sel = foldClampRangeOfTwo(II, Builder))

      return Sel;


    if (Instruction *SAdd = matchSAddSubSat(*II))

      return SAdd;


    if (Value *NewMinMax = reassociateMinMaxWithConstants(II, Builder, SQ))

      return replaceInstUsesWith(*II, NewMinMax);


    if (Instruction *R = reassociateMinMaxWithConstantInOperand(II, Builder))

      return R;


    if (Instruction *NewMinMax = factorizeMinMaxTree(II))

       return NewMinMax;


    // Try to fold minmax with constant RHS based on range information

    if (match(I1, m_APIntAllowPoison(RHSC))) {

      ICmpInst::Predicate Pred =

          ICmpInst::getNonStrictPredicate(MinMaxIntrinsic::getPredicate(IID));

      bool IsSigned = MinMaxIntrinsic::isSigned(IID);

      ConstantRange LHS_CR = computeConstantRangeIncludingKnownBits(

          I0, IsSigned, SQ.getWithInstruction(II));

      if (!LHS_CR.isFullSet()) {

        if (LHS_CR.icmp(Pred, *RHSC))

          return replaceInstUsesWith(*II, I0);

        if (LHS_CR.icmp(ICmpInst::getSwappedPredicate(Pred), *RHSC))

          return replaceInstUsesWith(*II,

                                     ConstantInt::get(II->getType(), *RHSC));

      }

    }


    if (Value *V = foldIntrinsicUsingDistributiveLaws(II, Builder))

      return replaceInstUsesWith(*II, V);


    break;

  }

  case Intrinsic::scmp: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    Value *LHS, *RHS;

    if (match(I0, m_NSWSub(m_Value(LHS), m_Value(RHS))) && match(I1, m_Zero()))

      return replaceInstUsesWith(

          CI,

          Builder.CreateIntrinsic(II->getType(), Intrinsic::scmp, {LHS, RHS}));

    break;

  }

  case Intrinsic::bitreverse: {

    Value *IIOperand = II->getArgOperand(0);

    // bitrev (zext i1 X to ?) --> X ? SignBitC : 0

    Value *X;

    if (match(IIOperand, m_ZExt(m_Value(X))) &&

        X->getType()->isIntOrIntVectorTy(1)) {

      Type *Ty = II->getType();

      APInt SignBit = APInt::getSignMask(Ty->getScalarSizeInBits());

      return SelectInst::Create(X, ConstantInt::get(Ty, SignBit),

                                ConstantInt::getNullValue(Ty));

    }


    if (Instruction *crossLogicOpFold =

        foldBitOrderCrossLogicOp<Intrinsic::bitreverse>(IIOperand, Builder))

      return crossLogicOpFold;


    break;

  }

  case Intrinsic::bswap: {

    Value *IIOperand = II->getArgOperand(0);


    // Try to canonicalize bswap-of-logical-shift-by-8-bit-multiple as

    // inverse-shift-of-bswap:

    // bswap (shl X, Y) --> lshr (bswap X), Y

    // bswap (lshr X, Y) --> shl (bswap X), Y

    Value *X, *Y;

    if (match(IIOperand, m_OneUse(m_LogicalShift(m_Value(X), m_Value(Y))))) {

      unsigned BitWidth = IIOperand->getType()->getScalarSizeInBits();

      if (MaskedValueIsZero(Y, APInt::getLowBitsSet(BitWidth, 3))) {

        Value *NewSwap = Builder.CreateUnaryIntrinsic(Intrinsic::bswap, X);

        BinaryOperator::BinaryOps InverseShift =

            cast<BinaryOperator>(IIOperand)->getOpcode() == Instruction::Shl

                ? Instruction::LShr

                : Instruction::Shl;

        return BinaryOperator::Create(InverseShift, NewSwap, Y);

      }

    }


    KnownBits Known = computeKnownBits(IIOperand, 0, II);

    uint64_t LZ = alignDown(Known.countMinLeadingZeros(), 8);

    uint64_t TZ = alignDown(Known.countMinTrailingZeros(), 8);

    unsigned BW = Known.getBitWidth();


    // bswap(x) -> shift(x) if x has exactly one "active byte"

    if (BW - LZ - TZ == 8) {

      assert(LZ != TZ && "active byte cannot be in the middle");

      if (LZ > TZ)  // -> shl(x) if the "active byte" is in the low part of x

        return BinaryOperator::CreateNUWShl(

            IIOperand, ConstantInt::get(IIOperand->getType(), LZ - TZ));

      // -> lshr(x) if the "active byte" is in the high part of x

      return BinaryOperator::CreateExactLShr(

            IIOperand, ConstantInt::get(IIOperand->getType(), TZ - LZ));

    }


    // bswap(trunc(bswap(x))) -> trunc(lshr(x, c))

    if (match(IIOperand, m_Trunc(m_BSwap(m_Value(X))))) {

      unsigned C = X->getType()->getScalarSizeInBits() - BW;

      Value *CV = ConstantInt::get(X->getType(), C);

      Value *V = Builder.CreateLShr(X, CV);

      return new TruncInst(V, IIOperand->getType());

    }


    if (Instruction *crossLogicOpFold =

            foldBitOrderCrossLogicOp<Intrinsic::bswap>(IIOperand, Builder)) {

      return crossLogicOpFold;

    }


    // Try to fold into bitreverse if bswap is the root of the expression tree.

    if (Instruction *BitOp = matchBSwapOrBitReverse(*II, /*MatchBSwaps*/ false,

                                                    /*MatchBitReversals*/ true))

      return BitOp;

    break;

  }

  case Intrinsic::masked_load:

    if (Value *SimplifiedMaskedOp = simplifyMaskedLoad(*II))

      return replaceInstUsesWith(CI, SimplifiedMaskedOp);

    break;

  case Intrinsic::masked_store:

    return simplifyMaskedStore(*II);

  case Intrinsic::masked_gather:

    return simplifyMaskedGather(*II);

  case Intrinsic::masked_scatter:

    return simplifyMaskedScatter(*II);

  case Intrinsic::launder_invariant_group:

  case Intrinsic::strip_invariant_group:

    if (auto *SkippedBarrier = simplifyInvariantGroupIntrinsic(*II, *this))

      return replaceInstUsesWith(*II, SkippedBarrier);

    break;

  case Intrinsic::powi:

    if (ConstantInt *Power = dyn_cast<ConstantInt>(II->getArgOperand(1))) {

      // 0 and 1 are handled in instsimplify

      // powi(x, -1) -> 1/x

      if (Power->isMinusOne())

        return BinaryOperator::CreateFDivFMF(ConstantFP::get(CI.getType(), 1.0),

                                             II->getArgOperand(0), II);

      // powi(x, 2) -> x*x

      if (Power->equalsInt(2))

        return BinaryOperator::CreateFMulFMF(II->getArgOperand(0),

                                             II->getArgOperand(0), II);


      if (!Power->getValue()[0]) {

        Value *X;

        // If power is even:

        // powi(-x, p) -> powi(x, p)

        // powi(fabs(x), p) -> powi(x, p)

        // powi(copysign(x, y), p) -> powi(x, p)

        if (match(II->getArgOperand(0), m_FNeg(m_Value(X))) ||

            match(II->getArgOperand(0), m_FAbs(m_Value(X))) ||

            match(II->getArgOperand(0),

                  m_Intrinsic<Intrinsic::copysign>(m_Value(X), m_Value())))

          return replaceOperand(*II, 0, X);

      }

    }

    break;


  case Intrinsic::cttz:

  case Intrinsic::ctlz:

    if (auto *I = foldCttzCtlz(*II, *this))

      return I;

    break;


  case Intrinsic::ctpop:

    if (auto *I = foldCtpop(*II, *this))

      return I;

    break;


  case Intrinsic::fshl:

  case Intrinsic::fshr: {

    Value *Op0 = II->getArgOperand(0), *Op1 = II->getArgOperand(1);

    Type *Ty = II->getType();

    unsigned BitWidth = Ty->getScalarSizeInBits();

    Constant *ShAmtC;

    if (match(II->getArgOperand(2), m_ImmConstant(ShAmtC))) {

      // Canonicalize a shift amount constant operand to modulo the bit-width.

      Constant *WidthC = ConstantInt::get(Ty, BitWidth);

      Constant *ModuloC =

          ConstantFoldBinaryOpOperands(Instruction::URem, ShAmtC, WidthC, DL);

      if (!ModuloC)

        return nullptr;

      if (ModuloC != ShAmtC)

        return replaceOperand(*II, 2, ModuloC);


      assert(match(ConstantFoldCompareInstOperands(ICmpInst::ICMP_UGT, WidthC,

                                                   ShAmtC, DL),

                   m_One()) &&

             "Shift amount expected to be modulo bitwidth");


      // Canonicalize funnel shift right by constant to funnel shift left. This

      // is not entirely arbitrary. For historical reasons, the backend may

      // recognize rotate left patterns but miss rotate right patterns.

      if (IID == Intrinsic::fshr) {

        // fshr X, Y, C --> fshl X, Y, (BitWidth - C) if C is not zero.

        if (!isKnownNonZero(ShAmtC, SQ.getWithInstruction(II)))

          return nullptr;


        Constant *LeftShiftC = ConstantExpr::getSub(WidthC, ShAmtC);

        Module *Mod = II->getModule();

        Function *Fshl =

            Intrinsic::getOrInsertDeclaration(Mod, Intrinsic::fshl, Ty);

        return CallInst::Create(Fshl, { Op0, Op1, LeftShiftC });

      }

      assert(IID == Intrinsic::fshl &&

             "All funnel shifts by simple constants should go left");


      // fshl(X, 0, C) --> shl X, C

      // fshl(X, undef, C) --> shl X, C

      if (match(Op1, m_ZeroInt()) || match(Op1, m_Undef()))

        return BinaryOperator::CreateShl(Op0, ShAmtC);


      // fshl(0, X, C) --> lshr X, (BW-C)

      // fshl(undef, X, C) --> lshr X, (BW-C)

      if (match(Op0, m_ZeroInt()) || match(Op0, m_Undef()))

        return BinaryOperator::CreateLShr(Op1,

                                          ConstantExpr::getSub(WidthC, ShAmtC));


      // fshl i16 X, X, 8 --> bswap i16 X (reduce to more-specific form)

      if (Op0 == Op1 && BitWidth == 16 && match(ShAmtC, m_SpecificInt(8))) {

        Module *Mod = II->getModule();

        Function *Bswap =

            Intrinsic::getOrInsertDeclaration(Mod, Intrinsic::bswap, Ty);

        return CallInst::Create(Bswap, { Op0 });

      }

      if (Instruction *BitOp =

              matchBSwapOrBitReverse(*II, /*MatchBSwaps*/ true,

                                     /*MatchBitReversals*/ true))

        return BitOp;

    }


    // fshl(X, 0, Y) --> shl(X, and(Y, BitWidth - 1)) if bitwidth is a

    // power-of-2

    if (IID == Intrinsic::fshl && isPowerOf2_32(BitWidth) &&

        match(Op1, m_ZeroInt())) {

      Value *Op2 = II->getArgOperand(2);

      Value *And = Builder.CreateAnd(Op2, ConstantInt::get(Ty, BitWidth - 1));

      return BinaryOperator::CreateShl(Op0, And);

    }


    // Left or right might be masked.

    if (SimplifyDemandedInstructionBits(*II))

      return &CI;


    // The shift amount (operand 2) of a funnel shift is modulo the bitwidth,

    // so only the low bits of the shift amount are demanded if the bitwidth is

    // a power-of-2.

    if (!isPowerOf2_32(BitWidth))

      break;

    APInt Op2Demanded = APInt::getLowBitsSet(BitWidth, Log2_32_Ceil(BitWidth));

    KnownBits Op2Known(BitWidth);

    if (SimplifyDemandedBits(II, 2, Op2Demanded, Op2Known))

      return &CI;

    break;

  }

  case Intrinsic::ptrmask: {

    unsigned BitWidth = DL.getPointerTypeSizeInBits(II->getType());

    KnownBits Known(BitWidth);

    if (SimplifyDemandedInstructionBits(*II, Known))

      return II;


    Value *InnerPtr, *InnerMask;

    bool Changed = false;

    // Combine:

    // (ptrmask (ptrmask p, A), B)

    //    -> (ptrmask p, (and A, B))

    if (match(II->getArgOperand(0),

              m_OneUse(m_Intrinsic<Intrinsic::ptrmask>(m_Value(InnerPtr),

                                                       m_Value(InnerMask))))) {

      assert(II->getArgOperand(1)->getType() == InnerMask->getType() &&

             "Mask types must match");

      // TODO: If InnerMask == Op1, we could copy attributes from inner

      // callsite -> outer callsite.

      Value *NewMask = Builder.CreateAnd(II->getArgOperand(1), InnerMask);

      replaceOperand(CI, 0, InnerPtr);

      replaceOperand(CI, 1, NewMask);

      Changed = true;

    }


    // See if we can deduce non-null.

    if (!CI.hasRetAttr(Attribute::NonNull) &&

        (Known.isNonZero() ||

         isKnownNonZero(II, getSimplifyQuery().getWithInstruction(II)))) {

      CI.addRetAttr(Attribute::NonNull);

      Changed = true;

    }


    unsigned NewAlignmentLog =

        std::min(Value::MaxAlignmentExponent,

                 std::min(BitWidth - 1, Known.countMinTrailingZeros()));

    // Known bits will capture if we had alignment information associated with

    // the pointer argument.

    if (NewAlignmentLog > Log2(CI.getRetAlign().valueOrOne())) {

      CI.addRetAttr(Attribute::getWithAlignment(

          CI.getContext(), Align(uint64_t(1) << NewAlignmentLog)));

      Changed = true;

    }

    if (Changed)

      return &CI;

    break;

  }

  case Intrinsic::uadd_with_overflow:

  case Intrinsic::sadd_with_overflow: {

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;


    // Given 2 constant operands whose sum does not overflow:

    // uaddo (X +nuw C0), C1 -> uaddo X, C0 + C1

    // saddo (X +nsw C0), C1 -> saddo X, C0 + C1

    Value *X;

    const APInt *C0, *C1;

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    bool IsSigned = IID == Intrinsic::sadd_with_overflow;

    bool HasNWAdd = IsSigned

                        ? match(Arg0, m_NSWAddLike(m_Value(X), m_APInt(C0)))

                        : match(Arg0, m_NUWAddLike(m_Value(X), m_APInt(C0)));

    if (HasNWAdd && match(Arg1, m_APInt(C1))) {

      bool Overflow;

      APInt NewC =

          IsSigned ? C1->sadd_ov(*C0, Overflow) : C1->uadd_ov(*C0, Overflow);

      if (!Overflow)

        return replaceInstUsesWith(

            *II, Builder.CreateBinaryIntrinsic(

                     IID, X, ConstantInt::get(Arg1->getType(), NewC)));

    }

    break;

  }


  case Intrinsic::umul_with_overflow:

  case Intrinsic::smul_with_overflow:

  case Intrinsic::usub_with_overflow:

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;

    break;


  case Intrinsic::ssub_with_overflow: {

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;


    Constant *C;

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    // Given a constant C that is not the minimum signed value

    // for an integer of a given bit width:

    //

    // ssubo X, C -> saddo X, -C

    if (match(Arg1, m_Constant(C)) && C->isNotMinSignedValue()) {

      Value *NegVal = ConstantExpr::getNeg(C);

      // Build a saddo call that is equivalent to the discovered

      // ssubo call.

      return replaceInstUsesWith(

          *II, Builder.CreateBinaryIntrinsic(Intrinsic::sadd_with_overflow,

                                             Arg0, NegVal));

    }


    break;

  }


  case Intrinsic::uadd_sat:

  case Intrinsic::sadd_sat:

  case Intrinsic::usub_sat:

  case Intrinsic::ssub_sat: {

    SaturatingInst *SI = cast<SaturatingInst>(II);

    Type *Ty = SI->getType();

    Value *Arg0 = SI->getLHS();

    Value *Arg1 = SI->getRHS();


    // Make use of known overflow information.

    OverflowResult OR = computeOverflow(SI->getBinaryOp(), SI->isSigned(),

                                        Arg0, Arg1, SI);

    switch (OR) {

      case OverflowResult::MayOverflow:

        break;

      case OverflowResult::NeverOverflows:

        if (SI->isSigned())

          return BinaryOperator::CreateNSW(SI->getBinaryOp(), Arg0, Arg1);

        else

          return BinaryOperator::CreateNUW(SI->getBinaryOp(), Arg0, Arg1);

      case OverflowResult::AlwaysOverflowsLow: {

        unsigned BitWidth = Ty->getScalarSizeInBits();

        APInt Min = APSInt::getMinValue(BitWidth, !SI->isSigned());

        return replaceInstUsesWith(*SI, ConstantInt::get(Ty, Min));

      }

      case OverflowResult::AlwaysOverflowsHigh: {

        unsigned BitWidth = Ty->getScalarSizeInBits();

        APInt Max = APSInt::getMaxValue(BitWidth, !SI->isSigned());

        return replaceInstUsesWith(*SI, ConstantInt::get(Ty, Max));

      }

    }


    // usub_sat((sub nuw C, A), C1) -> usub_sat(usub_sat(C, C1), A)

    // which after that:

    // usub_sat((sub nuw C, A), C1) -> usub_sat(C - C1, A) if C1 u< C

    // usub_sat((sub nuw C, A), C1) -> 0 otherwise

    Constant *C, *C1;

    Value *A;

    if (IID == Intrinsic::usub_sat &&

        match(Arg0, m_NUWSub(m_ImmConstant(C), m_Value(A))) &&

        match(Arg1, m_ImmConstant(C1))) {

      auto *NewC = Builder.CreateBinaryIntrinsic(Intrinsic::usub_sat, C, C1);

      auto *NewSub =

          Builder.CreateBinaryIntrinsic(Intrinsic::usub_sat, NewC, A);

      return replaceInstUsesWith(*SI, NewSub);

    }


    // ssub.sat(X, C) -> sadd.sat(X, -C) if C != MIN

    if (IID == Intrinsic::ssub_sat && match(Arg1, m_Constant(C)) &&

        C->isNotMinSignedValue()) {

      Value *NegVal = ConstantExpr::getNeg(C);

      return replaceInstUsesWith(

          *II, Builder.CreateBinaryIntrinsic(

              Intrinsic::sadd_sat, Arg0, NegVal));

    }


    // sat(sat(X + Val2) + Val) -> sat(X + (Val+Val2))

    // sat(sat(X - Val2) - Val) -> sat(X - (Val+Val2))

    // if Val and Val2 have the same sign

    if (auto *Other = dyn_cast<IntrinsicInst>(Arg0)) {

      Value *X;

      const APInt *Val, *Val2;

      APInt NewVal;

      bool IsUnsigned =

          IID == Intrinsic::uadd_sat || IID == Intrinsic::usub_sat;

      if (Other->getIntrinsicID() == IID &&

          match(Arg1, m_APInt(Val)) &&

          match(Other->getArgOperand(0), m_Value(X)) &&

          match(Other->getArgOperand(1), m_APInt(Val2))) {

        if (IsUnsigned)

          NewVal = Val->uadd_sat(*Val2);

        else if (Val->isNonNegative() == Val2->isNonNegative()) {

          bool Overflow;

          NewVal = Val->sadd_ov(*Val2, Overflow);

          if (Overflow) {

            // Both adds together may add more than SignedMaxValue

            // without saturating the final result.

            break;

          }

        } else {

          // Cannot fold saturated addition with different signs.

          break;

        }


        return replaceInstUsesWith(

            *II, Builder.CreateBinaryIntrinsic(

                     IID, X, ConstantInt::get(II->getType(), NewVal)));

      }

    }

    break;

  }


  case Intrinsic::minnum:

  case Intrinsic::maxnum:

  case Intrinsic::minimum:

  case Intrinsic::maximum: {

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(Arg0, m_FNeg(m_Value(X))) && match(Arg1, m_FNeg(m_Value(Y))) &&

        (Arg0->hasOneUse() || Arg1->hasOneUse())) {

      // If both operands are negated, invert the call and negate the result:

      // min(-X, -Y) --> -(max(X, Y))

      // max(-X, -Y) --> -(min(X, Y))

      Intrinsic::ID NewIID;

      switch (IID) {

      case Intrinsic::maxnum:

        NewIID = Intrinsic::minnum;

        break;

      case Intrinsic::minnum:

        NewIID = Intrinsic::maxnum;

        break;

      case Intrinsic::maximum:

        NewIID = Intrinsic::minimum;

        break;

      case Intrinsic::minimum:

        NewIID = Intrinsic::maximum;

        break;

      default:

        llvm_unreachable("unexpected intrinsic ID");

      }

      Value *NewCall = Builder.CreateBinaryIntrinsic(NewIID, X, Y, II);

      Instruction *FNeg = UnaryOperator::CreateFNeg(NewCall);

      FNeg->copyIRFlags(II);

      return FNeg;

    }


    // m(m(X, C2), C1) -> m(X, C)

    const APFloat *C1, *C2;

    if (auto *M = dyn_cast<IntrinsicInst>(Arg0)) {

      if (M->getIntrinsicID() == IID && match(Arg1, m_APFloat(C1)) &&

          ((match(M->getArgOperand(0), m_Value(X)) &&

            match(M->getArgOperand(1), m_APFloat(C2))) ||

           (match(M->getArgOperand(1), m_Value(X)) &&

            match(M->getArgOperand(0), m_APFloat(C2))))) {

        APFloat Res(0.0);

        switch (IID) {

        case Intrinsic::maxnum:

          Res = maxnum(*C1, *C2);

          break;

        case Intrinsic::minnum:

          Res = minnum(*C1, *C2);

          break;

        case Intrinsic::maximum:

          Res = maximum(*C1, *C2);

          break;

        case Intrinsic::minimum:

          Res = minimum(*C1, *C2);

          break;

        default:

          llvm_unreachable("unexpected intrinsic ID");

        }

        // TODO: Conservatively intersecting FMF. If Res == C2, the transform

        //       was a simplification (so Arg0 and its original flags could

        //       propagate?)

        Value *V = Builder.CreateBinaryIntrinsic(

            IID, X, ConstantFP::get(Arg0->getType(), Res),

            FMFSource::intersect(II, M));

        return replaceInstUsesWith(*II, V);

      }

    }


    // m((fpext X), (fpext Y)) -> fpext (m(X, Y))

    if (match(Arg0, m_OneUse(m_FPExt(m_Value(X)))) &&

        match(Arg1, m_OneUse(m_FPExt(m_Value(Y)))) &&

        X->getType() == Y->getType()) {

      Value *NewCall =

          Builder.CreateBinaryIntrinsic(IID, X, Y, II, II->getName());

      return new FPExtInst(NewCall, II->getType());

    }


    // max X, -X --> fabs X

    // min X, -X --> -(fabs X)

    // TODO: Remove one-use limitation? That is obviously better for max,

    // hence why we don't check for one-use for that. However,

    // it would be an extra instruction for min (fnabs), but

    // that is still likely better for analysis and codegen.

    auto IsMinMaxOrXNegX = [IID, &X](Value *Op0, Value *Op1) {

      if (match(Op0, m_FNeg(m_Value(X))) && match(Op1, m_Specific(X)))

        return Op0->hasOneUse() ||

               (IID != Intrinsic::minimum && IID != Intrinsic::minnum);

      return false;

    };


    if (IsMinMaxOrXNegX(Arg0, Arg1) || IsMinMaxOrXNegX(Arg1, Arg0)) {

      Value *R = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, X, II);

      if (IID == Intrinsic::minimum || IID == Intrinsic::minnum)

        R = Builder.CreateFNegFMF(R, II);

      return replaceInstUsesWith(*II, R);

    }


    break;

  }

  case Intrinsic::matrix_multiply: {

    // Optimize negation in matrix multiplication.


    // -A * -B -> A * B

    Value *A, *B;

    if (match(II->getArgOperand(0), m_FNeg(m_Value(A))) &&

        match(II->getArgOperand(1), m_FNeg(m_Value(B)))) {

      replaceOperand(*II, 0, A);

      replaceOperand(*II, 1, B);

      return II;

    }


    Value *Op0 = II->getOperand(0);

    Value *Op1 = II->getOperand(1);

    Value *OpNotNeg, *NegatedOp;

    unsigned NegatedOpArg, OtherOpArg;

    if (match(Op0, m_FNeg(m_Value(OpNotNeg)))) {

      NegatedOp = Op0;

      NegatedOpArg = 0;

      OtherOpArg = 1;

    } else if (match(Op1, m_FNeg(m_Value(OpNotNeg)))) {

      NegatedOp = Op1;

      NegatedOpArg = 1;

      OtherOpArg = 0;

    } else

      // Multiplication doesn't have a negated operand.

      break;


    // Only optimize if the negated operand has only one use.

    if (!NegatedOp->hasOneUse())

      break;


    Value *OtherOp = II->getOperand(OtherOpArg);

    VectorType *RetTy = cast<VectorType>(II->getType());

    VectorType *NegatedOpTy = cast<VectorType>(NegatedOp->getType());

    VectorType *OtherOpTy = cast<VectorType>(OtherOp->getType());

    ElementCount NegatedCount = NegatedOpTy->getElementCount();

    ElementCount OtherCount = OtherOpTy->getElementCount();

    ElementCount RetCount = RetTy->getElementCount();

    // (-A) * B -> A * (-B), if it is cheaper to negate B and vice versa.

    if (ElementCount::isKnownGT(NegatedCount, OtherCount) &&

        ElementCount::isKnownLT(OtherCount, RetCount)) {

      Value *InverseOtherOp = Builder.CreateFNeg(OtherOp);

      replaceOperand(*II, NegatedOpArg, OpNotNeg);

      replaceOperand(*II, OtherOpArg, InverseOtherOp);

      return II;

    }

    // (-A) * B -> -(A * B), if it is cheaper to negate the result

    if (ElementCount::isKnownGT(NegatedCount, RetCount)) {

      SmallVector<Value *, 5> NewArgs(II->args());

      NewArgs[NegatedOpArg] = OpNotNeg;

      Instruction *NewMul =

          Builder.CreateIntrinsic(II->getType(), IID, NewArgs, II);

      return replaceInstUsesWith(*II, Builder.CreateFNegFMF(NewMul, II));

    }

    break;

  }

  case Intrinsic::fmuladd: {

    // Try to simplify the underlying FMul.

    if (Value *V =

            simplifyFMulInst(II->getArgOperand(0), II->getArgOperand(1),

                             II->getFastMathFlags(), SQ.getWithInstruction(II)))

      return BinaryOperator::CreateFAddFMF(V, II->getArgOperand(2),

                                           II->getFastMathFlags());


    [[fallthrough]];

  }

  case Intrinsic::fma: {

    // fma fneg(x), fneg(y), z -> fma x, y, z

    Value *Src0 = II->getArgOperand(0);

    Value *Src1 = II->getArgOperand(1);

    Value *Src2 = II->getArgOperand(2);

    Value *X, *Y;

    if (match(Src0, m_FNeg(m_Value(X))) && match(Src1, m_FNeg(m_Value(Y)))) {

      replaceOperand(*II, 0, X);

      replaceOperand(*II, 1, Y);

      return II;

    }


    // fma fabs(x), fabs(x), z -> fma x, x, z

    if (match(Src0, m_FAbs(m_Value(X))) &&

        match(Src1, m_FAbs(m_Specific(X)))) {

      replaceOperand(*II, 0, X);

      replaceOperand(*II, 1, X);

      return II;

    }


    // Try to simplify the underlying FMul. We can only apply simplifications

    // that do not require rounding.

    if (Value *V = simplifyFMAFMul(Src0, Src1, II->getFastMathFlags(),

                                   SQ.getWithInstruction(II)))

      return BinaryOperator::CreateFAddFMF(V, Src2, II->getFastMathFlags());


    // fma x, y, 0 -> fmul x, y

    // This is always valid for -0.0, but requires nsz for +0.0 as

    // -0.0 + 0.0 = 0.0, which would not be the same as the fmul on its own.

    if (match(Src2, m_NegZeroFP()) ||

        (match(Src2, m_PosZeroFP()) && II->getFastMathFlags().noSignedZeros()))

      return BinaryOperator::CreateFMulFMF(Src0, Src1, II);


    // fma x, -1.0, y -> fsub y, x

    if (match(Src1, m_SpecificFP(-1.0)))

      return BinaryOperator::CreateFSubFMF(Src2, Src0, II);


    break;

  }

  case Intrinsic::copysign: {

    Value *Mag = II->getArgOperand(0), *Sign = II->getArgOperand(1);

    if (std::optional<bool> KnownSignBit = computeKnownFPSignBit(

            Sign, /*Depth=*/0, getSimplifyQuery().getWithInstruction(II))) {

      if (*KnownSignBit) {

        // If we know that the sign argument is negative, reduce to FNABS:

        // copysign Mag, -Sign --> fneg (fabs Mag)

        Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Mag, II);

        return replaceInstUsesWith(*II, Builder.CreateFNegFMF(Fabs, II));

      }


      // If we know that the sign argument is positive, reduce to FABS:

      // copysign Mag, +Sign --> fabs Mag

      Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Mag, II);

      return replaceInstUsesWith(*II, Fabs);

    }


    // Propagate sign argument through nested calls:

    // copysign Mag, (copysign ?, X) --> copysign Mag, X

    Value *X;

    if (match(Sign, m_Intrinsic<Intrinsic::copysign>(m_Value(), m_Value(X)))) {

      Value *CopySign =

          Builder.CreateCopySign(Mag, X, FMFSource::intersect(II, Sign));

      return replaceInstUsesWith(*II, CopySign);

    }


    // Clear sign-bit of constant magnitude:

    // copysign -MagC, X --> copysign MagC, X

    // TODO: Support constant folding for fabs

    const APFloat *MagC;

    if (match(Mag, m_APFloat(MagC)) && MagC->isNegative()) {

      APFloat PosMagC = *MagC;

      PosMagC.clearSign();

      return replaceOperand(*II, 0, ConstantFP::get(Mag->getType(), PosMagC));

    }


    // Peek through changes of magnitude's sign-bit. This call rewrites those:

    // copysign (fabs X), Sign --> copysign X, Sign

    // copysign (fneg X), Sign --> copysign X, Sign

    if (match(Mag, m_FAbs(m_Value(X))) || match(Mag, m_FNeg(m_Value(X))))

      return replaceOperand(*II, 0, X);


    break;

  }

  case Intrinsic::fabs: {

    Value *Cond, *TVal, *FVal;

    Value *Arg = II->getArgOperand(0);

    Value *X;

    // fabs (-X) --> fabs (X)

    if (match(Arg, m_FNeg(m_Value(X)))) {

        CallInst *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, X, II);

        return replaceInstUsesWith(CI, Fabs);

    }


    if (match(Arg, m_Select(m_Value(Cond), m_Value(TVal), m_Value(FVal)))) {

      // fabs (select Cond, TrueC, FalseC) --> select Cond, AbsT, AbsF

      if (isa<Constant>(TVal) || isa<Constant>(FVal)) {

        CallInst *AbsT = Builder.CreateCall(II->getCalledFunction(), {TVal});

        CallInst *AbsF = Builder.CreateCall(II->getCalledFunction(), {FVal});

        SelectInst *SI = SelectInst::Create(Cond, AbsT, AbsF);

        FastMathFlags FMF1 = II->getFastMathFlags();

        FastMathFlags FMF2 = cast<SelectInst>(Arg)->getFastMathFlags();

        FMF2.setNoSignedZeros(false);

        SI->setFastMathFlags(FMF1 | FMF2);

        return SI;

      }

      // fabs (select Cond, -FVal, FVal) --> fabs FVal

      if (match(TVal, m_FNeg(m_Specific(FVal))))

        return replaceOperand(*II, 0, FVal);

      // fabs (select Cond, TVal, -TVal) --> fabs TVal

      if (match(FVal, m_FNeg(m_Specific(TVal))))

        return replaceOperand(*II, 0, TVal);

    }


    Value *Magnitude, *Sign;

    if (match(II->getArgOperand(0),

              m_CopySign(m_Value(Magnitude), m_Value(Sign)))) {

      // fabs (copysign x, y) -> (fabs x)

      CallInst *AbsSign =

          Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Magnitude, II);

      return replaceInstUsesWith(*II, AbsSign);

    }


    [[fallthrough]];

  }

  case Intrinsic::ceil:

  case Intrinsic::floor:

  case Intrinsic::round:

  case Intrinsic::roundeven:

  case Intrinsic::nearbyint:

  case Intrinsic::rint:

  case Intrinsic::trunc: {

    Value *ExtSrc;

    if (match(II->getArgOperand(0), m_OneUse(m_FPExt(m_Value(ExtSrc))))) {

      // Narrow the call: intrinsic (fpext x) -> fpext (intrinsic x)

      Value *NarrowII = Builder.CreateUnaryIntrinsic(IID, ExtSrc, II);

      return new FPExtInst(NarrowII, II->getType());

    }

    break;

  }

  case Intrinsic::cos:

  case Intrinsic::amdgcn_cos: {

    Value *X, *Sign;

    Value *Src = II->getArgOperand(0);

    if (match(Src, m_FNeg(m_Value(X))) || match(Src, m_FAbs(m_Value(X))) ||

        match(Src, m_CopySign(m_Value(X), m_Value(Sign)))) {

      // cos(-x) --> cos(x)

      // cos(fabs(x)) --> cos(x)

      // cos(copysign(x, y)) --> cos(x)

      return replaceOperand(*II, 0, X);

    }

    break;

  }

  case Intrinsic::sin:

  case Intrinsic::amdgcn_sin: {

    Value *X;

    if (match(II->getArgOperand(0), m_OneUse(m_FNeg(m_Value(X))))) {

      // sin(-x) --> -sin(x)

      Value *NewSin = Builder.CreateUnaryIntrinsic(IID, X, II);

      return UnaryOperator::CreateFNegFMF(NewSin, II);

    }

    break;

  }

  case Intrinsic::ldexp: {

    // ldexp(ldexp(x, a), b) -> ldexp(x, a + b)

    //

    // The danger is if the first ldexp would overflow to infinity or underflow

    // to zero, but the combined exponent avoids it. We ignore this with

    // reassoc.

    //

    // It's also safe to fold if we know both exponents are >= 0 or <= 0 since

    // it would just double down on the overflow/underflow which would occur

    // anyway.

    //

    // TODO: Could do better if we had range tracking for the input value

    // exponent. Also could broaden sign check to cover == 0 case.

    Value *Src = II->getArgOperand(0);

    Value *Exp = II->getArgOperand(1);

    Value *InnerSrc;

    Value *InnerExp;

    if (match(Src, m_OneUse(m_Intrinsic<Intrinsic::ldexp>(

                       m_Value(InnerSrc), m_Value(InnerExp)))) &&

        Exp->getType() == InnerExp->getType()) {

      FastMathFlags FMF = II->getFastMathFlags();

      FastMathFlags InnerFlags = cast<FPMathOperator>(Src)->getFastMathFlags();


      if ((FMF.allowReassoc() && InnerFlags.allowReassoc()) ||

          signBitMustBeTheSame(Exp, InnerExp, SQ.getWithInstruction(II))) {

        // TODO: Add nsw/nuw probably safe if integer type exceeds exponent

        // width.

        Value *NewExp = Builder.CreateAdd(InnerExp, Exp);

        II->setArgOperand(1, NewExp);

        II->setFastMathFlags(InnerFlags); // Or the inner flags.

        return replaceOperand(*II, 0, InnerSrc);

      }

    }


    // ldexp(x, zext(i1 y)) -> fmul x, (select y, 2.0, 1.0)

    // ldexp(x, sext(i1 y)) -> fmul x, (select y, 0.5, 1.0)

    Value *ExtSrc;

    if (match(Exp, m_ZExt(m_Value(ExtSrc))) &&

        ExtSrc->getType()->getScalarSizeInBits() == 1) {

      Value *Select =

          Builder.CreateSelect(ExtSrc, ConstantFP::get(II->getType(), 2.0),

                               ConstantFP::get(II->getType(), 1.0));

      return BinaryOperator::CreateFMulFMF(Src, Select, II);

    }

    if (match(Exp, m_SExt(m_Value(ExtSrc))) &&

        ExtSrc->getType()->getScalarSizeInBits() == 1) {

      Value *Select =

          Builder.CreateSelect(ExtSrc, ConstantFP::get(II->getType(), 0.5),

                               ConstantFP::get(II->getType(), 1.0));

      return BinaryOperator::CreateFMulFMF(Src, Select, II);

    }


    // ldexp(x, c ? exp : 0) -> c ? ldexp(x, exp) : x

    // ldexp(x, c ? 0 : exp) -> c ? x : ldexp(x, exp)

    ///

    // TODO: If we cared, should insert a canonicalize for x

    Value *SelectCond, *SelectLHS, *SelectRHS;

    if (match(II->getArgOperand(1),

              m_OneUse(m_Select(m_Value(SelectCond), m_Value(SelectLHS),

                                m_Value(SelectRHS))))) {

      Value *NewLdexp = nullptr;

      Value *Select = nullptr;

      if (match(SelectRHS, m_ZeroInt())) {

        NewLdexp = Builder.CreateLdexp(Src, SelectLHS, II);

        Select = Builder.CreateSelect(SelectCond, NewLdexp, Src);

      } else if (match(SelectLHS, m_ZeroInt())) {

        NewLdexp = Builder.CreateLdexp(Src, SelectRHS, II);

        Select = Builder.CreateSelect(SelectCond, Src, NewLdexp);

      }


      if (NewLdexp) {

        Select->takeName(II);

        return replaceInstUsesWith(*II, Select);

      }

    }


    break;

  }

  case Intrinsic::ptrauth_auth:

  case Intrinsic::ptrauth_resign: {

    // (sign|resign) + (auth|resign) can be folded by omitting the middle

    // sign+auth component if the key and discriminator match.

    bool NeedSign = II->getIntrinsicID() == Intrinsic::ptrauth_resign;

    Value *Ptr = II->getArgOperand(0);

    Value *Key = II->getArgOperand(1);

    Value *Disc = II->getArgOperand(2);


    // AuthKey will be the key we need to end up authenticating against in

    // whatever we replace this sequence with.

    Value *AuthKey = nullptr, *AuthDisc = nullptr, *BasePtr;

    if (const auto *CI = dyn_cast<CallBase>(Ptr)) {

      BasePtr = CI->getArgOperand(0);

      if (CI->getIntrinsicID() == Intrinsic::ptrauth_sign) {

        if (CI->getArgOperand(1) != Key || CI->getArgOperand(2) != Disc)

          break;

      } else if (CI->getIntrinsicID() == Intrinsic::ptrauth_resign) {

        if (CI->getArgOperand(3) != Key || CI->getArgOperand(4) != Disc)

          break;

        AuthKey = CI->getArgOperand(1);

        AuthDisc = CI->getArgOperand(2);

      } else

        break;

    } else if (const auto *PtrToInt = dyn_cast<PtrToIntOperator>(Ptr)) {

      // ptrauth constants are equivalent to a call to @llvm.ptrauth.sign for

      // our purposes, so check for that too.

      const auto *CPA = dyn_cast<ConstantPtrAuth>(PtrToInt->getOperand(0));

      if (!CPA || !CPA->isKnownCompatibleWith(Key, Disc, DL))

        break;


      // resign(ptrauth(p,ks,ds),ks,ds,kr,dr) -> ptrauth(p,kr,dr)

      if (NeedSign && isa<ConstantInt>(II->getArgOperand(4))) {

        auto *SignKey = cast<ConstantInt>(II->getArgOperand(3));

        auto *SignDisc = cast<ConstantInt>(II->getArgOperand(4));

        auto *SignAddrDisc = ConstantPointerNull::get(Builder.getPtrTy());

        auto *NewCPA = ConstantPtrAuth::get(CPA->getPointer(), SignKey,

                                            SignDisc, SignAddrDisc);

        replaceInstUsesWith(

            *II, ConstantExpr::getPointerCast(NewCPA, II->getType()));

        return eraseInstFromFunction(*II);

      }


      // auth(ptrauth(p,k,d),k,d) -> p

      BasePtr = Builder.CreatePtrToInt(CPA->getPointer(), II->getType());

    } else

      break;


    unsigned NewIntrin;

    if (AuthKey && NeedSign) {

      // resign(0,1) + resign(1,2) = resign(0, 2)

      NewIntrin = Intrinsic::ptrauth_resign;

    } else if (AuthKey) {

      // resign(0,1) + auth(1) = auth(0)

      NewIntrin = Intrinsic::ptrauth_auth;

    } else if (NeedSign) {

      // sign(0) + resign(0, 1) = sign(1)

      NewIntrin = Intrinsic::ptrauth_sign;

    } else {

      // sign(0) + auth(0) = nop

      replaceInstUsesWith(*II, BasePtr);

      return eraseInstFromFunction(*II);

    }


    SmallVector<Value *, 4> CallArgs;

    CallArgs.push_back(BasePtr);

    if (AuthKey) {

      CallArgs.push_back(AuthKey);

      CallArgs.push_back(AuthDisc);

    }


    if (NeedSign) {

      CallArgs.push_back(II->getArgOperand(3));

      CallArgs.push_back(II->getArgOperand(4));

    }


    Function *NewFn =

        Intrinsic::getOrInsertDeclaration(II->getModule(), NewIntrin);

    return CallInst::Create(NewFn, CallArgs);

  }

  case Intrinsic::arm_neon_vtbl1:

  case Intrinsic::aarch64_neon_tbl1:

    if (Value *V = simplifyNeonTbl1(*II, Builder))

      return replaceInstUsesWith(*II, V);

    break;


  case Intrinsic::arm_neon_vmulls:

  case Intrinsic::arm_neon_vmullu:

  case Intrinsic::aarch64_neon_smull:

  case Intrinsic::aarch64_neon_umull: {

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);


    // Handle mul by zero first:

    if (isa<ConstantAggregateZero>(Arg0) || isa<ConstantAggregateZero>(Arg1)) {

      return replaceInstUsesWith(CI, ConstantAggregateZero::get(II->getType()));

    }


    // Check for constant LHS & RHS - in this case we just simplify.

    bool Zext = (IID == Intrinsic::arm_neon_vmullu ||

                 IID == Intrinsic::aarch64_neon_umull);

    VectorType *NewVT = cast<VectorType>(II->getType());

    if (Constant *CV0 = dyn_cast<Constant>(Arg0)) {

      if (Constant *CV1 = dyn_cast<Constant>(Arg1)) {

        Value *V0 = Builder.CreateIntCast(CV0, NewVT, /*isSigned=*/!Zext);

        Value *V1 = Builder.CreateIntCast(CV1, NewVT, /*isSigned=*/!Zext);

        return replaceInstUsesWith(CI, Builder.CreateMul(V0, V1));

      }


      // Couldn't simplify - canonicalize constant to the RHS.

      std::swap(Arg0, Arg1);

    }


    // Handle mul by one:

    if (Constant *CV1 = dyn_cast<Constant>(Arg1))

      if (ConstantInt *Splat =

              dyn_cast_or_null<ConstantInt>(CV1->getSplatValue()))

        if (Splat->isOne())

          return CastInst::CreateIntegerCast(Arg0, II->getType(),

                                             /*isSigned=*/!Zext);


    break;

  }

  case Intrinsic::arm_neon_aesd:

  case Intrinsic::arm_neon_aese:

  case Intrinsic::aarch64_crypto_aesd:

  case Intrinsic::aarch64_crypto_aese: {

    Value *DataArg = II->getArgOperand(0);

    Value *KeyArg  = II->getArgOperand(1);


    // Try to use the builtin XOR in AESE and AESD to eliminate a prior XOR

    Value *Data, *Key;

    if (match(KeyArg, m_ZeroInt()) &&

        match(DataArg, m_Xor(m_Value(Data), m_Value(Key)))) {

      replaceOperand(*II, 0, Data);

      replaceOperand(*II, 1, Key);

      return II;

    }

    break;

  }

  case Intrinsic::hexagon_V6_vandvrt:

  case Intrinsic::hexagon_V6_vandvrt_128B: {

    // Simplify Q -> V -> Q conversion.

    if (auto Op0 = dyn_cast<IntrinsicInst>(II->getArgOperand(0))) {

      Intrinsic::ID ID0 = Op0->getIntrinsicID();

      if (ID0 != Intrinsic::hexagon_V6_vandqrt &&

          ID0 != Intrinsic::hexagon_V6_vandqrt_128B)

        break;

      Value *Bytes = Op0->getArgOperand(1), *Mask = II->getArgOperand(1);

      uint64_t Bytes1 = computeKnownBits(Bytes, 0, Op0).One.getZExtValue();

      uint64_t Mask1 = computeKnownBits(Mask, 0, II).One.getZExtValue();

      // Check if every byte has common bits in Bytes and Mask.

      uint64_t C = Bytes1 & Mask1;

      if ((C & 0xFF) && (C & 0xFF00) && (C & 0xFF0000) && (C & 0xFF000000))

        return replaceInstUsesWith(*II, Op0->getArgOperand(0));

    }

    break;

  }

  case Intrinsic::stackrestore: {

    enum class ClassifyResult {

      None,

      Alloca,

      StackRestore,

      CallWithSideEffects,

    };

    auto Classify = [](const Instruction *I) {

      if (isa<AllocaInst>(I))

        return ClassifyResult::Alloca;


      if (auto *CI = dyn_cast<CallInst>(I)) {

        if (auto *II = dyn_cast<IntrinsicInst>(CI)) {

          if (II->getIntrinsicID() == Intrinsic::stackrestore)

            return ClassifyResult::StackRestore;


          if (II->mayHaveSideEffects())

            return ClassifyResult::CallWithSideEffects;

        } else {

          // Consider all non-intrinsic calls to be side effects

          return ClassifyResult::CallWithSideEffects;

        }

      }


      return ClassifyResult::None;

    };


    // If the stacksave and the stackrestore are in the same BB, and there is

    // no intervening call, alloca, or stackrestore of a different stacksave,

    // remove the restore. This can happen when variable allocas are DCE'd.

    if (IntrinsicInst *SS = dyn_cast<IntrinsicInst>(II->getArgOperand(0))) {

      if (SS->getIntrinsicID() == Intrinsic::stacksave &&

          SS->getParent() == II->getParent()) {

        BasicBlock::iterator BI(SS);

        bool CannotRemove = false;

        for (++BI; &*BI != II; ++BI) {

          switch (Classify(&*BI)) {

          case ClassifyResult::None:

            // So far so good, look at next instructions.

            break;


          case ClassifyResult::StackRestore:

            // If we found an intervening stackrestore for a different

            // stacksave, we can't remove the stackrestore. Otherwise, continue.

            if (cast<IntrinsicInst>(*BI).getArgOperand(0) != SS)

              CannotRemove = true;

            break;


          case ClassifyResult::Alloca:

          case ClassifyResult::CallWithSideEffects:

            // If we found an alloca, a non-intrinsic call, or an intrinsic

            // call with side effects, we can't remove the stackrestore.

            CannotRemove = true;

            break;

          }

          if (CannotRemove)

            break;

        }


        if (!CannotRemove)

          return eraseInstFromFunction(CI);

      }

    }


    // Scan down this block to see if there is another stack restore in the

    // same block without an intervening call/alloca.

    BasicBlock::iterator BI(II);

    Instruction *TI = II->getParent()->getTerminator();

    bool CannotRemove = false;

    for (++BI; &*BI != TI; ++BI) {

      switch (Classify(&*BI)) {

      case ClassifyResult::None:

        // So far so good, look at next instructions.

        break;


      case ClassifyResult::StackRestore:

        // If there is a stackrestore below this one, remove this one.

        return eraseInstFromFunction(CI);


      case ClassifyResult::Alloca:

      case ClassifyResult::CallWithSideEffects:

        // If we found an alloca, a non-intrinsic call, or an intrinsic call

        // with side effects (such as llvm.stacksave and llvm.read_register),

        // we can't remove the stack restore.

        CannotRemove = true;

        break;

      }

      if (CannotRemove)

        break;

    }


    // If the stack restore is in a return, resume, or unwind block and if there

    // are no allocas or calls between the restore and the return, nuke the

    // restore.

    if (!CannotRemove && (isa<ReturnInst>(TI) || isa<ResumeInst>(TI)))

      return eraseInstFromFunction(CI);

    break;

  }

  case Intrinsic::lifetime_end:

    // Asan needs to poison memory to detect invalid access which is possible

    // even for empty lifetime range.

    if (II->getFunction()->hasFnAttribute(Attribute::SanitizeAddress) ||

        II->getFunction()->hasFnAttribute(Attribute::SanitizeMemory) ||

        II->getFunction()->hasFnAttribute(Attribute::SanitizeHWAddress))

      break;


    if (removeTriviallyEmptyRange(*II, *this, [](const IntrinsicInst &I) {

          return I.getIntrinsicID() == Intrinsic::lifetime_start;

        }))

      return nullptr;

    break;

  case Intrinsic::assume: {

    Value *IIOperand = II->getArgOperand(0);

    SmallVector<OperandBundleDef, 4> OpBundles;

    II->getOperandBundlesAsDefs(OpBundles);


    /// This will remove the boolean Condition from the assume given as

    /// argument and remove the assume if it becomes useless.

    /// always returns nullptr for use as a return values.

    auto RemoveConditionFromAssume = [&](Instruction *Assume) -> Instruction * {

      assert(isa<AssumeInst>(Assume));

      if (isAssumeWithEmptyBundle(*cast<AssumeInst>(II)))

        return eraseInstFromFunction(CI);

      replaceUse(II->getOperandUse(0), ConstantInt::getTrue(II->getContext()));

      return nullptr;

    };

    // Remove an assume if it is followed by an identical assume.

    // TODO: Do we need this? Unless there are conflicting assumptions, the

    // computeKnownBits(IIOperand) below here eliminates redundant assumes.

    Instruction *Next = II->getNextNonDebugInstruction();

    if (match(Next, m_Intrinsic<Intrinsic::assume>(m_Specific(IIOperand))))

      return RemoveConditionFromAssume(Next);


    // Canonicalize assume(a && b) -> assume(a); assume(b);

    // Note: New assumption intrinsics created here are registered by

    // the InstCombineIRInserter object.

    FunctionType *AssumeIntrinsicTy = II->getFunctionType();

    Value *AssumeIntrinsic = II->getCalledOperand();

    Value *A, *B;

    if (match(IIOperand, m_LogicalAnd(m_Value(A), m_Value(B)))) {

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic, A, OpBundles,

                         II->getName());

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic, B, II->getName());

      return eraseInstFromFunction(*II);

    }

    // assume(!(a || b)) -> assume(!a); assume(!b);

    if (match(IIOperand, m_Not(m_LogicalOr(m_Value(A), m_Value(B))))) {

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic,

                         Builder.CreateNot(A), OpBundles, II->getName());

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic,

                         Builder.CreateNot(B), II->getName());

      return eraseInstFromFunction(*II);

    }


    // assume( (load addr) != null ) -> add 'nonnull' metadata to load

    // (if assume is valid at the load)

    Instruction *LHS;

    if (match(IIOperand, m_SpecificICmp(ICmpInst::ICMP_NE, m_Instruction(LHS),

                                        m_Zero())) &&

        LHS->getOpcode() == Instruction::Load &&

        LHS->getType()->isPointerTy() &&

        isValidAssumeForContext(II, LHS, &DT)) {

      MDNode *MD = MDNode::get(II->getContext(), {});

      LHS->setMetadata(LLVMContext::MD_nonnull, MD);

      LHS->setMetadata(LLVMContext::MD_noundef, MD);

      return RemoveConditionFromAssume(II);


      // TODO: apply nonnull return attributes to calls and invokes

      // TODO: apply range metadata for range check patterns?

    }


    // Separate storage assumptions apply to the underlying allocations, not any

    // particular pointer within them. When evaluating the hints for AA purposes

    // we getUnderlyingObject them; by precomputing the answers here we can

    // avoid having to do so repeatedly there.

    for (unsigned Idx = 0; Idx < II->getNumOperandBundles(); Idx++) {

      OperandBundleUse OBU = II->getOperandBundleAt(Idx);

      if (OBU.getTagName() == "separate_storage") {

        assert(OBU.Inputs.size() == 2);

        auto MaybeSimplifyHint = [&](const Use &U) {

          Value *Hint = U.get();

          // Not having a limit is safe because InstCombine removes unreachable

          // code.

          Value *UnderlyingObject = getUnderlyingObject(Hint, /*MaxLookup*/ 0);

          if (Hint != UnderlyingObject)

            replaceUse(const_cast<Use &>(U), UnderlyingObject);

        };

        MaybeSimplifyHint(OBU.Inputs[0]);

        MaybeSimplifyHint(OBU.Inputs[1]);

      }

    }


    // Convert nonnull assume like:

    // %A = icmp ne i32* %PTR, null

    // call void @llvm.assume(i1 %A)

    // into

    // call void @llvm.assume(i1 true) [ "nonnull"(i32* %PTR) ]

    if (EnableKnowledgeRetention &&

        match(IIOperand,

              m_SpecificICmp(ICmpInst::ICMP_NE, m_Value(A), m_Zero())) &&

        A->getType()->isPointerTy()) {

      if (auto *Replacement = buildAssumeFromKnowledge(

              {RetainedKnowledge{Attribute::NonNull, 0, A}}, Next, &AC, &DT)) {


        Replacement->insertBefore(Next);

        AC.registerAssumption(Replacement);

        return RemoveConditionFromAssume(II);

      }

    }


    // Convert alignment assume like:

    // %B = ptrtoint i32* %A to i64

    // %C = and i64 %B, Constant

    // %D = icmp eq i64 %C, 0

    // call void @llvm.assume(i1 %D)

    // into

    // call void @llvm.assume(i1 true) [ "align"(i32* [[A]], i64  Constant + 1)]

    uint64_t AlignMask = 1;

    if (EnableKnowledgeRetention &&

        (match(IIOperand, m_Not(m_Trunc(m_Value(A)))) ||

         match(IIOperand,

               m_SpecificICmp(ICmpInst::ICMP_EQ,

                              m_And(m_Value(A), m_ConstantInt(AlignMask)),

                              m_Zero())))) {

      if (isPowerOf2_64(AlignMask + 1)) {

        uint64_t Offset = 0;

        match(A, m_Add(m_Value(A), m_ConstantInt(Offset)));

        if (match(A, m_PtrToInt(m_Value(A)))) {

          /// Note: this doesn't preserve the offset information but merges

          /// offset and alignment.

          /// TODO: we can generate a GEP instead of merging the alignment with

          /// the offset.

          RetainedKnowledge RK{Attribute::Alignment,

                               (unsigned)MinAlign(Offset, AlignMask + 1), A};

          if (auto *Replacement =

                  buildAssumeFromKnowledge(RK, Next, &AC, &DT)) {


            Replacement->insertAfter(II);

            AC.registerAssumption(Replacement);

          }

          return RemoveConditionFromAssume(II);

        }

      }

    }


    /// Canonicalize Knowledge in operand bundles.

    if (EnableKnowledgeRetention && II->hasOperandBundles()) {

      for (unsigned Idx = 0; Idx < II->getNumOperandBundles(); Idx++) {

        auto &BOI = II->bundle_op_info_begin()[Idx];

        RetainedKnowledge RK =

          llvm::getKnowledgeFromBundle(cast<AssumeInst>(*II), BOI);

        if (BOI.End - BOI.Begin > 2)

          continue; // Prevent reducing knowledge in an align with offset since

                    // extracting a RetainedKnowledge from them looses offset

                    // information

        RetainedKnowledge CanonRK =

          llvm::simplifyRetainedKnowledge(cast<AssumeInst>(II), RK,

                                          &getAssumptionCache(),

                                          &getDominatorTree());

        if (CanonRK == RK)

          continue;

        if (!CanonRK) {

          if (BOI.End - BOI.Begin > 0) {

            Worklist.pushValue(II->op_begin()[BOI.Begin]);

            Value::dropDroppableUse(II->op_begin()[BOI.Begin]);

          }

          continue;

        }

        assert(RK.AttrKind == CanonRK.AttrKind);

        if (BOI.End - BOI.Begin > 0)

          II->op_begin()[BOI.Begin].set(CanonRK.WasOn);

        if (BOI.End - BOI.Begin > 1)

          II->op_begin()[BOI.Begin + 1].set(ConstantInt::get(

              Type::getInt64Ty(II->getContext()), CanonRK.ArgValue));

        if (RK.WasOn)

          Worklist.pushValue(RK.WasOn);

        return II;

      }

    }


    // If there is a dominating assume with the same condition as this one,

    // then this one is redundant, and should be removed.

    KnownBits Known(1);

    computeKnownBits(IIOperand, Known, 0, II);

    if (Known.isAllOnes() && isAssumeWithEmptyBundle(cast<AssumeInst>(*II)))

      return eraseInstFromFunction(*II);


    // assume(false) is unreachable.

    if (match(IIOperand, m_CombineOr(m_Zero(), m_Undef()))) {

      CreateNonTerminatorUnreachable(II);

      return eraseInstFromFunction(*II);

    }


    // Update the cache of affected values for this assumption (we might be

    // here because we just simplified the condition).

    AC.updateAffectedValues(cast<AssumeInst>(II));

    break;

  }

  case Intrinsic::experimental_guard: {

    // Is this guard followed by another guard?  We scan forward over a small

    // fixed window of instructions to handle common cases with conditions

    // computed between guards.

    Instruction *NextInst = II->getNextNonDebugInstruction();

    for (unsigned i = 0; i < GuardWideningWindow; i++) {

      // Note: Using context-free form to avoid compile time blow up

      if (!isSafeToSpeculativelyExecute(NextInst))

        break;

      NextInst = NextInst->getNextNonDebugInstruction();

    }

    Value *NextCond = nullptr;

    if (match(NextInst,

              m_Intrinsic<Intrinsic::experimental_guard>(m_Value(NextCond)))) {

      Value *CurrCond = II->getArgOperand(0);


      // Remove a guard that it is immediately preceded by an identical guard.

      // Otherwise canonicalize guard(a); guard(b) -> guard(a & b).

      if (CurrCond != NextCond) {

        Instruction *MoveI = II->getNextNonDebugInstruction();

        while (MoveI != NextInst) {

          auto *Temp = MoveI;

          MoveI = MoveI->getNextNonDebugInstruction();

          Temp->moveBefore(II);

        }

        replaceOperand(*II, 0, Builder.CreateAnd(CurrCond, NextCond));

      }

      eraseInstFromFunction(*NextInst);

      return II;

    }

    break;

  }

  case Intrinsic::vector_insert: {

    Value *Vec = II->getArgOperand(0);

    Value *SubVec = II->getArgOperand(1);

    Value *Idx = II->getArgOperand(2);

    auto *DstTy = dyn_cast<FixedVectorType>(II->getType());

    auto *VecTy = dyn_cast<FixedVectorType>(Vec->getType());

    auto *SubVecTy = dyn_cast<FixedVectorType>(SubVec->getType());


    // Only canonicalize if the destination vector, Vec, and SubVec are all

    // fixed vectors.

    if (DstTy && VecTy && SubVecTy) {

      unsigned DstNumElts = DstTy->getNumElements();

      unsigned VecNumElts = VecTy->getNumElements();

      unsigned SubVecNumElts = SubVecTy->getNumElements();

      unsigned IdxN = cast<ConstantInt>(Idx)->getZExtValue();


      // An insert that entirely overwrites Vec with SubVec is a nop.

      if (VecNumElts == SubVecNumElts)

        return replaceInstUsesWith(CI, SubVec);


      // Widen SubVec into a vector of the same width as Vec, since

      // shufflevector requires the two input vectors to be the same width.

      // Elements beyond the bounds of SubVec within the widened vector are

      // undefined.

      SmallVector<int, 8> WidenMask;

      unsigned i;

      for (i = 0; i != SubVecNumElts; ++i)

        WidenMask.push_back(i);

      for (; i != VecNumElts; ++i)

        WidenMask.push_back(PoisonMaskElem);


      Value *WidenShuffle = Builder.CreateShuffleVector(SubVec, WidenMask);


      SmallVector<int, 8> Mask;

      for (unsigned i = 0; i != IdxN; ++i)

        Mask.push_back(i);

      for (unsigned i = DstNumElts; i != DstNumElts + SubVecNumElts; ++i)

        Mask.push_back(i);

      for (unsigned i = IdxN + SubVecNumElts; i != DstNumElts; ++i)

        Mask.push_back(i);


      Value *Shuffle = Builder.CreateShuffleVector(Vec, WidenShuffle, Mask);

      return replaceInstUsesWith(CI, Shuffle);

    }

    break;

  }

  case Intrinsic::vector_extract: {

    Value *Vec = II->getArgOperand(0);

    Value *Idx = II->getArgOperand(1);


    Type *ReturnType = II->getType();

    // (extract_vector (insert_vector InsertTuple, InsertValue, InsertIdx),

    // ExtractIdx)

    unsigned ExtractIdx = cast<ConstantInt>(Idx)->getZExtValue();

    Value *InsertTuple, *InsertIdx, *InsertValue;

    if (match(Vec, m_Intrinsic<Intrinsic::vector_insert>(m_Value(InsertTuple),

                                                         m_Value(InsertValue),

                                                         m_Value(InsertIdx))) &&

        InsertValue->getType() == ReturnType) {

      unsigned Index = cast<ConstantInt>(InsertIdx)->getZExtValue();

      // Case where we get the same index right after setting it.

      // extract.vector(insert.vector(InsertTuple, InsertValue, Idx), Idx) -->

      // InsertValue

      if (ExtractIdx == Index)

        return replaceInstUsesWith(CI, InsertValue);

      // If we are getting a different index than what was set in the

      // insert.vector intrinsic. We can just set the input tuple to the one up

      // in the chain. extract.vector(insert.vector(InsertTuple, InsertValue,

      // InsertIndex), ExtractIndex)

      // --> extract.vector(InsertTuple, ExtractIndex)

      else

        return replaceOperand(CI, 0, InsertTuple);

    }


    auto *DstTy = dyn_cast<VectorType>(ReturnType);

    auto *VecTy = dyn_cast<VectorType>(Vec->getType());


    if (DstTy && VecTy) {

      auto DstEltCnt = DstTy->getElementCount();

      auto VecEltCnt = VecTy->getElementCount();

      unsigned IdxN = cast<ConstantInt>(Idx)->getZExtValue();


      // Extracting the entirety of Vec is a nop.

      if (DstEltCnt == VecTy->getElementCount()) {

        replaceInstUsesWith(CI, Vec);

        return eraseInstFromFunction(CI);

      }


      // Only canonicalize to shufflevector if the destination vector and

      // Vec are fixed vectors.

      if (VecEltCnt.isScalable() || DstEltCnt.isScalable())

        break;


      SmallVector<int, 8> Mask;

      for (unsigned i = 0; i != DstEltCnt.getKnownMinValue(); ++i)

        Mask.push_back(IdxN + i);


      Value *Shuffle = Builder.CreateShuffleVector(Vec, Mask);

      return replaceInstUsesWith(CI, Shuffle);

    }

    break;

  }

  case Intrinsic::vector_reverse: {

    Value *BO0, *BO1, *X, *Y;

    Value *Vec = II->getArgOperand(0);

    if (match(Vec, m_OneUse(m_BinOp(m_Value(BO0), m_Value(BO1))))) {

      auto *OldBinOp = cast<BinaryOperator>(Vec);

      if (match(BO0, m_VecReverse(m_Value(X)))) {

        // rev(binop rev(X), rev(Y)) --> binop X, Y

        if (match(BO1, m_VecReverse(m_Value(Y))))

          return replaceInstUsesWith(CI, BinaryOperator::CreateWithCopiedFlags(

                                             OldBinOp->getOpcode(), X, Y,

                                             OldBinOp, OldBinOp->getName(),

                                             II->getIterator()));

        // rev(binop rev(X), BO1Splat) --> binop X, BO1Splat

        if (isSplatValue(BO1))

          return replaceInstUsesWith(CI, BinaryOperator::CreateWithCopiedFlags(

                                             OldBinOp->getOpcode(), X, BO1,

                                             OldBinOp, OldBinOp->getName(),

                                             II->getIterator()));

      }

      // rev(binop BO0Splat, rev(Y)) --> binop BO0Splat, Y

      if (match(BO1, m_VecReverse(m_Value(Y))) && isSplatValue(BO0))

        return replaceInstUsesWith(CI,

                                   BinaryOperator::CreateWithCopiedFlags(

                                       OldBinOp->getOpcode(), BO0, Y, OldBinOp,

                                       OldBinOp->getName(), II->getIterator()));

    }

    // rev(unop rev(X)) --> unop X

    if (match(Vec, m_OneUse(m_UnOp(m_VecReverse(m_Value(X)))))) {

      auto *OldUnOp = cast<UnaryOperator>(Vec);

      auto *NewUnOp = UnaryOperator::CreateWithCopiedFlags(

          OldUnOp->getOpcode(), X, OldUnOp, OldUnOp->getName(),

          II->getIterator());

      return replaceInstUsesWith(CI, NewUnOp);

    }

    break;

  }

  case Intrinsic::vector_reduce_or:

  case Intrinsic::vector_reduce_and: {

    // Canonicalize logical or/and reductions:

    // Or reduction for i1 is represented as:

    // %val = bitcast <ReduxWidth x i1> to iReduxWidth

    // %res = cmp ne iReduxWidth %val, 0

    // And reduction for i1 is represented as:

    // %val = bitcast <ReduxWidth x i1> to iReduxWidth

    // %res = cmp eq iReduxWidth %val, 11111

    Value *Arg = II->getArgOperand(0);

    Value *Vect;


    if (Value *NewOp =

            simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

      replaceUse(II->getOperandUse(0), NewOp);

      return II;

    }


    if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

      if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

        if (FTy->getElementType() == Builder.getInt1Ty()) {

          Value *Res = Builder.CreateBitCast(

              Vect, Builder.getIntNTy(FTy->getNumElements()));

          if (IID == Intrinsic::vector_reduce_and) {

            Res = Builder.CreateICmpEQ(

                Res, ConstantInt::getAllOnesValue(Res->getType()));

          } else {

            assert(IID == Intrinsic::vector_reduce_or &&

                   "Expected or reduction.");

            Res = Builder.CreateIsNotNull(Res);

          }

          if (Arg != Vect)

            Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                     II->getType());

          return replaceInstUsesWith(CI, Res);

        }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_add: {

    if (IID == Intrinsic::vector_reduce_add) {

      // Convert vector_reduce_add(ZExt(<n x i1>)) to

      // ZExtOrTrunc(ctpop(bitcast <n x i1> to in)).

      // Convert vector_reduce_add(SExt(<n x i1>)) to

      // -ZExtOrTrunc(ctpop(bitcast <n x i1> to in)).

      // Convert vector_reduce_add(<n x i1>) to

      // Trunc(ctpop(bitcast <n x i1> to in)).

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

          if (FTy->getElementType() == Builder.getInt1Ty()) {

            Value *V = Builder.CreateBitCast(

                Vect, Builder.getIntNTy(FTy->getNumElements()));

            Value *Res = Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, V);

            if (Res->getType() != II->getType())

              Res = Builder.CreateZExtOrTrunc(Res, II->getType());

            if (Arg != Vect &&

                cast<Instruction>(Arg)->getOpcode() == Instruction::SExt)

              Res = Builder.CreateNeg(Res);

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_xor: {

    if (IID == Intrinsic::vector_reduce_xor) {

      // Exclusive disjunction reduction over the vector with

      // (potentially-extended) i1 element type is actually a

      // (potentially-extended) arithmetic `add` reduction over the original

      // non-extended value:

      //   vector_reduce_xor(?ext(<n x i1>))

      //     -->

      //   ?ext(vector_reduce_add(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = Builder.CreateAddReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                       II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_mul: {

    if (IID == Intrinsic::vector_reduce_mul) {

      // Multiplicative reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially zero-extended)

      // logical `and` reduction over the original non-extended value:

      //   vector_reduce_mul(?ext(<n x i1>))

      //     -->

      //   zext(vector_reduce_and(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = Builder.CreateAndReduce(Vect);

            if (Res->getType() != II->getType())

              Res = Builder.CreateZExt(Res, II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_umin:

  case Intrinsic::vector_reduce_umax: {

    if (IID == Intrinsic::vector_reduce_umin ||

        IID == Intrinsic::vector_reduce_umax) {

      // UMin/UMax reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially-extended)

      // logical `and`/`or` reduction over the original non-extended value:

      //   vector_reduce_u{min,max}(?ext(<n x i1>))

      //     -->

      //   ?ext(vector_reduce_{and,or}(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = IID == Intrinsic::vector_reduce_umin

                             ? Builder.CreateAndReduce(Vect)

                             : Builder.CreateOrReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                       II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_smin:

  case Intrinsic::vector_reduce_smax: {

    if (IID == Intrinsic::vector_reduce_smin ||

        IID == Intrinsic::vector_reduce_smax) {

      // SMin/SMax reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially-extended)

      // logical `and`/`or` reduction over the original non-extended value:

      //   vector_reduce_s{min,max}(<n x i1>)

      //     -->

      //   vector_reduce_{or,and}(<n x i1>)

      // and

      //   vector_reduce_s{min,max}(sext(<n x i1>))

      //     -->

      //   sext(vector_reduce_{or,and}(<n x i1>))

      // and

      //   vector_reduce_s{min,max}(zext(<n x i1>))

      //     -->

      //   zext(vector_reduce_{and,or}(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Instruction::CastOps ExtOpc = Instruction::CastOps::CastOpsEnd;

            if (Arg != Vect)

              ExtOpc = cast<CastInst>(Arg)->getOpcode();

            Value *Res = ((IID == Intrinsic::vector_reduce_smin) ==

                          (ExtOpc == Instruction::CastOps::ZExt))

                             ? Builder.CreateAndReduce(Vect)

                             : Builder.CreateOrReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(ExtOpc, Res, II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_fmax:

  case Intrinsic::vector_reduce_fmin:

  case Intrinsic::vector_reduce_fadd:

  case Intrinsic::vector_reduce_fmul: {

    bool CanReorderLanes = (IID != Intrinsic::vector_reduce_fadd &&

                            IID != Intrinsic::vector_reduce_fmul) ||

                           II->hasAllowReassoc();

    const unsigned ArgIdx = (IID == Intrinsic::vector_reduce_fadd ||

                             IID == Intrinsic::vector_reduce_fmul)

                                ? 1

                                : 0;

    Value *Arg = II->getArgOperand(ArgIdx);

    if (Value *NewOp = simplifyReductionOperand(Arg, CanReorderLanes)) {

      replaceUse(II->getOperandUse(ArgIdx), NewOp);

      return nullptr;

    }

    break;

  }

  case Intrinsic::is_fpclass: {

    if (Instruction *I = foldIntrinsicIsFPClass(*II))

      return I;

    break;

  }

  case Intrinsic::threadlocal_address: {

    Align MinAlign = getKnownAlignment(II->getArgOperand(0), DL, II, &AC, &DT);

    MaybeAlign Align = II->getRetAlign();

    if (MinAlign > Align.valueOrOne()) {

      II->addRetAttr(Attribute::getWithAlignment(II->getContext(), MinAlign));

      return II;

    }

    break;

  }

  default: {

    // Handle target specific intrinsics

    std::optional<Instruction *> V = targetInstCombineIntrinsic(*II);

    if (V)

      return *V;

    break;

  }

  }


  // Try to fold intrinsic into select operands. This is legal if:

  //  * The intrinsic is speculatable.

  //  * The select condition is not a vector, or the intrinsic does not

  //    perform cross-lane operations.

  if (isSafeToSpeculativelyExecuteWithVariableReplaced(&CI) &&

      isNotCrossLaneOperation(II))

    for (Value *Op : II->args())

      if (auto *Sel = dyn_cast<SelectInst>(Op))

        if (Instruction *R = FoldOpIntoSelect(*II, Sel))

          return R;


  if (Instruction *Shuf = foldShuffledIntrinsicOperands(II, Builder))

    return Shuf;


  // Some intrinsics (like experimental_gc_statepoint) can be used in invoke

  // context, so it is handled in visitCallBase and we should trigger it.

  return visitCallBase(*II);

}


// Fence instruction simplification

Instruction *InstCombinerImpl::visitFenceInst(FenceInst &FI) {

  auto *NFI = dyn_cast<FenceInst>(FI.getNextNonDebugInstruction());

  // This check is solely here to handle arbitrary target-dependent syncscopes.

  // TODO: Can remove if does not matter in practice.

  if (NFI && FI.isIdenticalTo(NFI))

    return eraseInstFromFunction(FI);


  // Returns true if FI1 is identical or stronger fence than FI2.

  auto isIdenticalOrStrongerFence = [](FenceInst *FI1, FenceInst *FI2) {

    auto FI1SyncScope = FI1->getSyncScopeID();

    // Consider same scope, where scope is global or single-thread.

    if (FI1SyncScope != FI2->getSyncScopeID() ||

        (FI1SyncScope != SyncScope::System &&

         FI1SyncScope != SyncScope::SingleThread))

      return false;


    return isAtLeastOrStrongerThan(FI1->getOrdering(), FI2->getOrdering());

  };

  if (NFI && isIdenticalOrStrongerFence(NFI, &FI))

    return eraseInstFromFunction(FI);


  if (auto *PFI = dyn_cast_or_null<FenceInst>(FI.getPrevNonDebugInstruction()))

    if (isIdenticalOrStrongerFence(PFI, &FI))

      return eraseInstFromFunction(FI);

  return nullptr;

}


// InvokeInst simplification

Instruction *InstCombinerImpl::visitInvokeInst(InvokeInst &II) {

  return visitCallBase(II);

}


// CallBrInst simplification

Instruction *InstCombinerImpl::visitCallBrInst(CallBrInst &CBI) {

  return visitCallBase(CBI);

}


Instruction *InstCombinerImpl::tryOptimizeCall(CallInst *CI) {

  if (!CI->getCalledFunction()) return nullptr;


  // Skip optimizing notail and musttail calls so

  // LibCallSimplifier::optimizeCall doesn't have to preserve those invariants.

  // LibCallSimplifier::optimizeCall should try to preserve tail calls though.

  if (CI->isMustTailCall() || CI->isNoTailCall())

    return nullptr;


  auto InstCombineRAUW = [this](Instruction *From, Value *With) {

    replaceInstUsesWith(*From, With);

  };

  auto InstCombineErase = [this](Instruction *I) {

    eraseInstFromFunction(*I);

  };

  LibCallSimplifier Simplifier(DL, &TLI, &DT, &DC, &AC, ORE, BFI, PSI,

                               InstCombineRAUW, InstCombineErase);

  if (Value *With = Simplifier.optimizeCall(CI, Builder)) {

    ++NumSimplified;

    return CI->use_empty() ? CI : replaceInstUsesWith(*CI, With);

  }


  return nullptr;

}


static IntrinsicInst *findInitTrampolineFromAlloca(Value *TrampMem) {

  // Strip off at most one level of pointer casts, looking for an alloca.  This

  // is good enough in practice and simpler than handling any number of casts.

  Value *Underlying = TrampMem->stripPointerCasts();

  if (Underlying != TrampMem &&

      (!Underlying->hasOneUse() || Underlying->user_back() != TrampMem))

    return nullptr;

  if (!isa<AllocaInst>(Underlying))

    return nullptr;


  IntrinsicInst *InitTrampoline = nullptr;

  for (User *U : TrampMem->users()) {

    IntrinsicInst *II = dyn_cast<IntrinsicInst>(U);

    if (!II)

      return nullptr;

    if (II->getIntrinsicID() == Intrinsic::init_trampoline) {

      if (InitTrampoline)

        // More than one init_trampoline writes to this value.  Give up.

        return nullptr;

      InitTrampoline = II;

      continue;

    }

    if (II->getIntrinsicID() == Intrinsic::adjust_trampoline)

      // Allow any number of calls to adjust.trampoline.

      continue;

    return nullptr;

  }


  // No call to init.trampoline found.

  if (!InitTrampoline)

    return nullptr;


  // Check that the alloca is being used in the expected way.

  if (InitTrampoline->getOperand(0) != TrampMem)

    return nullptr;


  return InitTrampoline;

}


static IntrinsicInst *findInitTrampolineFromBB(IntrinsicInst *AdjustTramp,

                                               Value *TrampMem) {

  // Visit all the previous instructions in the basic block, and try to find a

  // init.trampoline which has a direct path to the adjust.trampoline.

  for (BasicBlock::iterator I = AdjustTramp->getIterator(),

                            E = AdjustTramp->getParent()->begin();

       I != E;) {

    Instruction *Inst = &*--I;

    if (IntrinsicInst *II = dyn_cast<IntrinsicInst>(I))

      if (II->getIntrinsicID() == Intrinsic::init_trampoline &&

          II->getOperand(0) == TrampMem)

        return II;

    if (Inst->mayWriteToMemory())

      return nullptr;

  }

  return nullptr;

}


// Given a call to llvm.adjust.trampoline, find and return the corresponding

// call to llvm.init.trampoline if the call to the trampoline can be optimized

// to a direct call to a function.  Otherwise return NULL.

static IntrinsicInst *findInitTrampoline(Value *Callee) {

  Callee = Callee->stripPointerCasts();

  IntrinsicInst *AdjustTramp = dyn_cast<IntrinsicInst>(Callee);

  if (!AdjustTramp ||

      AdjustTramp->getIntrinsicID() != Intrinsic::adjust_trampoline)

    return nullptr;


  Value *TrampMem = AdjustTramp->getOperand(0);


  if (IntrinsicInst *IT = findInitTrampolineFromAlloca(TrampMem))

    return IT;

  if (IntrinsicInst *IT = findInitTrampolineFromBB(AdjustTramp, TrampMem))

    return IT;

  return nullptr;

}


bool InstCombinerImpl::annotateAnyAllocSite(CallBase &Call,

                                            const TargetLibraryInfo *TLI) {

  // Note: We only handle cases which can't be driven from generic attributes

  // here.  So, for example, nonnull and noalias (which are common properties

  // of some allocation functions) are expected to be handled via annotation

  // of the respective allocator declaration with generic attributes.

  bool Changed = false;


  if (!Call.getType()->isPointerTy())

    return Changed;


  std::optional<APInt> Size = getAllocSize(&Call, TLI);

  if (Size && *Size != 0) {

    // TODO: We really should just emit deref_or_null here and then

    // let the generic inference code combine that with nonnull.

    if (Call.hasRetAttr(Attribute::NonNull)) {

      Changed = !Call.hasRetAttr(Attribute::Dereferenceable);

      Call.addRetAttr(Attribute::getWithDereferenceableBytes(

          Call.getContext(), Size->getLimitedValue()));

    } else {

      Changed = !Call.hasRetAttr(Attribute::DereferenceableOrNull);

      Call.addRetAttr(Attribute::getWithDereferenceableOrNullBytes(

          Call.getContext(), Size->getLimitedValue()));

    }

  }


  // Add alignment attribute if alignment is a power of two constant.

  Value *Alignment = getAllocAlignment(&Call, TLI);

  if (!Alignment)

    return Changed;


  ConstantInt *AlignOpC = dyn_cast<ConstantInt>(Alignment);

  if (AlignOpC && AlignOpC->getValue().ult(llvm::Value::MaximumAlignment)) {

    uint64_t AlignmentVal = AlignOpC->getZExtValue();

    if (llvm::isPowerOf2_64(AlignmentVal)) {

      Align ExistingAlign = Call.getRetAlign().valueOrOne();

      Align NewAlign = Align(AlignmentVal);

      if (NewAlign > ExistingAlign) {

        Call.addRetAttr(

            Attribute::getWithAlignment(Call.getContext(), NewAlign));

        Changed = true;

      }

    }

  }

  return Changed;

}


/// Improvements for call, callbr and invoke instructions.

Instruction *InstCombinerImpl::visitCallBase(CallBase &Call) {

  bool Changed = annotateAnyAllocSite(Call, &TLI);


  // Mark any parameters that are known to be non-null with the nonnull

  // attribute.  This is helpful for inlining calls to functions with null

  // checks on their arguments.

  SmallVector<unsigned, 4> ArgNos;

  unsigned ArgNo = 0;


  for (Value *V : Call.args()) {

    if (V->getType()->isPointerTy() &&

        !Call.paramHasAttr(ArgNo, Attribute::NonNull) &&

        isKnownNonZero(V, getSimplifyQuery().getWithInstruction(&Call)))

      ArgNos.push_back(ArgNo);

    ArgNo++;

  }


  assert(ArgNo == Call.arg_size() && "Call arguments not processed correctly.");


  if (!ArgNos.empty()) {

    AttributeList AS = Call.getAttributes();

    LLVMContext &Ctx = Call.getContext();

    AS = AS.addParamAttribute(Ctx, ArgNos,

                              Attribute::get(Ctx, Attribute::NonNull));

    Call.setAttributes(AS);

    Changed = true;

  }


  // If the callee is a pointer to a function, attempt to move any casts to the

  // arguments of the call/callbr/invoke.

  Value *Callee = Call.getCalledOperand();

  Function *CalleeF = dyn_cast<Function>(Callee);

  if ((!CalleeF || CalleeF->getFunctionType() != Call.getFunctionType()) &&

      transformConstExprCastCall(Call))

    return nullptr;


  if (CalleeF) {

    // Remove the convergent attr on calls when the callee is not convergent.

    if (Call.isConvergent() && !CalleeF->isConvergent() &&

        !CalleeF->isIntrinsic()) {

      LLVM_DEBUG(dbgs() << "Removing convergent attr from instr " << Call

                        << "\n");

      Call.setNotConvergent();

      return &Call;

    }


    // If the call and callee calling conventions don't match, and neither one

    // of the calling conventions is compatible with C calling convention

    // this call must be unreachable, as the call is undefined.

    if ((CalleeF->getCallingConv() != Call.getCallingConv() &&

         !(CalleeF->getCallingConv() == llvm::CallingConv::C &&

           TargetLibraryInfoImpl::isCallingConvCCompatible(&Call)) &&

         !(Call.getCallingConv() == llvm::CallingConv::C &&

           TargetLibraryInfoImpl::isCallingConvCCompatible(CalleeF))) &&

        // Only do this for calls to a function with a body.  A prototype may

        // not actually end up matching the implementation's calling conv for a

        // variety of reasons (e.g. it may be written in assembly).

        !CalleeF->isDeclaration()) {

      Instruction *OldCall = &Call;

      CreateNonTerminatorUnreachable(OldCall);

      // If OldCall does not return void then replaceInstUsesWith poison.

      // This allows ValueHandlers and custom metadata to adjust itself.

      if (!OldCall->getType()->isVoidTy())

        replaceInstUsesWith(*OldCall, PoisonValue::get(OldCall->getType()));

      if (isa<CallInst>(OldCall))

        return eraseInstFromFunction(*OldCall);


      // We cannot remove an invoke or a callbr, because it would change thexi

      // CFG, just change the callee to a null pointer.

      cast<CallBase>(OldCall)->setCalledFunction(

          CalleeF->getFunctionType(),

          Constant::getNullValue(CalleeF->getType()));

      return nullptr;

    }

  }


  // Calling a null function pointer is undefined if a null address isn't

  // dereferenceable.

  if ((isa<ConstantPointerNull>(Callee) &&

       !NullPointerIsDefined(Call.getFunction())) ||

      isa<UndefValue>(Callee)) {

    // If Call does not return void then replaceInstUsesWith poison.

    // This allows ValueHandlers and custom metadata to adjust itself.

    if (!Call.getType()->isVoidTy())

      replaceInstUsesWith(Call, PoisonValue::get(Call.getType()));


    if (Call.isTerminator()) {

      // Can't remove an invoke or callbr because we cannot change the CFG.

      return nullptr;

    }


    // This instruction is not reachable, just remove it.

    CreateNonTerminatorUnreachable(&Call);

    return eraseInstFromFunction(Call);

  }


  if (IntrinsicInst *II = findInitTrampoline(Callee))

    return transformCallThroughTrampoline(Call, *II);


  if (isa<InlineAsm>(Callee) && !Call.doesNotThrow()) {

    InlineAsm *IA = cast<InlineAsm>(Callee);

    if (!IA->canThrow()) {

      // Normal inline asm calls cannot throw - mark them

      // 'nounwind'.

      Call.setDoesNotThrow();

      Changed = true;

    }

  }


  // Try to optimize the call if possible, we require DataLayout for most of

  // this.  None of these calls are seen as possibly dead so go ahead and

  // delete the instruction now.

  if (CallInst *CI = dyn_cast<CallInst>(&Call)) {

    Instruction *I = tryOptimizeCall(CI);

    // If we changed something return the result, etc. Otherwise let

    // the fallthrough check.

    if (I) return eraseInstFromFunction(*I);

  }


  if (!Call.use_empty() && !Call.isMustTailCall())

    if (Value *ReturnedArg = Call.getReturnedArgOperand()) {

      Type *CallTy = Call.getType();

      Type *RetArgTy = ReturnedArg->getType();

      if (RetArgTy->canLosslesslyBitCastTo(CallTy))

        return replaceInstUsesWith(

            Call, Builder.CreateBitOrPointerCast(ReturnedArg, CallTy));

    }


  // Drop unnecessary kcfi operand bundles from calls that were converted

  // into direct calls.

  auto Bundle = Call.getOperandBundle(LLVMContext::OB_kcfi);

  if (Bundle && !Call.isIndirectCall()) {

    DEBUG_WITH_TYPE(DEBUG_TYPE "-kcfi", {

      if (CalleeF) {

        ConstantInt *FunctionType = nullptr;

        ConstantInt *ExpectedType = cast<ConstantInt>(Bundle->Inputs[0]);


        if (MDNode *MD = CalleeF->getMetadata(LLVMContext::MD_kcfi_type))

          FunctionType = mdconst::extract<ConstantInt>(MD->getOperand(0));


        if (FunctionType &&

            FunctionType->getZExtValue() != ExpectedType->getZExtValue())

          dbgs() << Call.getModule()->getName()

                 << ": warning: kcfi: " << Call.getCaller()->getName()

                 << ": call to " << CalleeF->getName()

                 << " using a mismatching function pointer type\n";

      }

    });


    return CallBase::removeOperandBundle(&Call, LLVMContext::OB_kcfi);

  }


  if (isRemovableAlloc(&Call, &TLI))

    return visitAllocSite(Call);


  // Handle intrinsics which can be used in both call and invoke context.

  switch (Call.getIntrinsicID()) {

  case Intrinsic::experimental_gc_statepoint: {

    GCStatepointInst &GCSP = *cast<GCStatepointInst>(&Call);

    SmallPtrSet<Value *, 32> LiveGcValues;

    for (const GCRelocateInst *Reloc : GCSP.getGCRelocates()) {

      GCRelocateInst &GCR = *const_cast<GCRelocateInst *>(Reloc);


      // Remove the relocation if unused.

      if (GCR.use_empty()) {

        eraseInstFromFunction(GCR);

        continue;

      }


      Value *DerivedPtr = GCR.getDerivedPtr();

      Value *BasePtr = GCR.getBasePtr();


      // Undef is undef, even after relocation.

      if (isa<UndefValue>(DerivedPtr) || isa<UndefValue>(BasePtr)) {

        replaceInstUsesWith(GCR, UndefValue::get(GCR.getType()));

        eraseInstFromFunction(GCR);

        continue;

      }


      if (auto *PT = dyn_cast<PointerType>(GCR.getType())) {

        // The relocation of null will be null for most any collector.

        // TODO: provide a hook for this in GCStrategy.  There might be some

        // weird collector this property does not hold for.

        if (isa<ConstantPointerNull>(DerivedPtr)) {

          // Use null-pointer of gc_relocate's type to replace it.

          replaceInstUsesWith(GCR, ConstantPointerNull::get(PT));

          eraseInstFromFunction(GCR);

          continue;

        }


        // isKnownNonNull -> nonnull attribute

        if (!GCR.hasRetAttr(Attribute::NonNull) &&

            isKnownNonZero(DerivedPtr,

                           getSimplifyQuery().getWithInstruction(&Call))) {

          GCR.addRetAttr(Attribute::NonNull);

          // We discovered new fact, re-check users.

          Worklist.pushUsersToWorkList(GCR);

        }

      }


      // If we have two copies of the same pointer in the statepoint argument

      // list, canonicalize to one.  This may let us common gc.relocates.

      if (GCR.getBasePtr() == GCR.getDerivedPtr() &&

          GCR.getBasePtrIndex() != GCR.getDerivedPtrIndex()) {

        auto *OpIntTy = GCR.getOperand(2)->getType();

        GCR.setOperand(2, ConstantInt::get(OpIntTy, GCR.getBasePtrIndex()));

      }


      // TODO: bitcast(relocate(p)) -> relocate(bitcast(p))

      // Canonicalize on the type from the uses to the defs


      // TODO: relocate((gep p, C, C2, ...)) -> gep(relocate(p), C, C2, ...)

      LiveGcValues.insert(BasePtr);

      LiveGcValues.insert(DerivedPtr);

    }

    std::optional<OperandBundleUse> Bundle =

        GCSP.getOperandBundle(LLVMContext::OB_gc_live);

    unsigned NumOfGCLives = LiveGcValues.size();

    if (!Bundle || NumOfGCLives == Bundle->Inputs.size())

      break;

    // We can reduce the size of gc live bundle.

    DenseMap<Value *, unsigned> Val2Idx;

    std::vector<Value *> NewLiveGc;

    for (Value *V : Bundle->Inputs) {

      auto [It, Inserted] = Val2Idx.try_emplace(V);

      if (!Inserted)

        continue;

      if (LiveGcValues.count(V)) {

        It->second = NewLiveGc.size();

        NewLiveGc.push_back(V);

      } else

        It->second = NumOfGCLives;

    }

    // Update all gc.relocates

    for (const GCRelocateInst *Reloc : GCSP.getGCRelocates()) {

      GCRelocateInst &GCR = *const_cast<GCRelocateInst *>(Reloc);

      Value *BasePtr = GCR.getBasePtr();

      assert(Val2Idx.count(BasePtr) && Val2Idx[BasePtr] != NumOfGCLives &&

             "Missed live gc for base pointer");

      auto *OpIntTy1 = GCR.getOperand(1)->getType();

      GCR.setOperand(1, ConstantInt::get(OpIntTy1, Val2Idx[BasePtr]));

      Value *DerivedPtr = GCR.getDerivedPtr();

      assert(Val2Idx.count(DerivedPtr) && Val2Idx[DerivedPtr] != NumOfGCLives &&

             "Missed live gc for derived pointer");

      auto *OpIntTy2 = GCR.getOperand(2)->getType();

      GCR.setOperand(2, ConstantInt::get(OpIntTy2, Val2Idx[DerivedPtr]));

    }

    // Create new statepoint instruction.

    OperandBundleDef NewBundle("gc-live", NewLiveGc);

    return CallBase::Create(&Call, NewBundle);

  }

  default: { break; }

  }


  return Changed ? &Call : nullptr;

}


/// If the callee is a constexpr cast of a function, attempt to move the cast to

/// the arguments of the call/invoke.

/// CallBrInst is not supported.

bool InstCombinerImpl::transformConstExprCastCall(CallBase &Call) {

  auto *Callee =

      dyn_cast<Function>(Call.getCalledOperand()->stripPointerCasts());

  if (!Callee)

    return false;


  assert(!isa<CallBrInst>(Call) &&

         "CallBr's don't have a single point after a def to insert at");


  // Don't perform the transform for declarations, which may not be fully

  // accurate. For example, void @foo() is commonly used as a placeholder for

  // unknown prototypes.

  if (Callee->isDeclaration())

    return false;


  // If this is a call to a thunk function, don't remove the cast. Thunks are

  // used to transparently forward all incoming parameters and outgoing return

  // values, so it's important to leave the cast in place.

  if (Callee->hasFnAttribute("thunk"))

    return false;


  // If this is a call to a naked function, the assembly might be

  // using an argument, or otherwise rely on the frame layout,

  // the function prototype will mismatch.

  if (Callee->hasFnAttribute(Attribute::Naked))

    return false;


  // If this is a musttail call, the callee's prototype must match the caller's

  // prototype with the exception of pointee types. The code below doesn't

  // implement that, so we can't do this transform.

  // TODO: Do the transform if it only requires adding pointer casts.

  if (Call.isMustTailCall())

    return false;


  Instruction *Caller = &Call;

  const AttributeList &CallerPAL = Call.getAttributes();


  // Okay, this is a cast from a function to a different type.  Unless doing so

  // would cause a type conversion of one of our arguments, change this call to

  // be a direct call with arguments casted to the appropriate types.

  FunctionType *FT = Callee->getFunctionType();

  Type *OldRetTy = Caller->getType();

  Type *NewRetTy = FT->getReturnType();


  // Check to see if we are changing the return type...

  if (OldRetTy != NewRetTy) {


    if (NewRetTy->isStructTy())

      return false; // TODO: Handle multiple return values.


    if (!CastInst::isBitOrNoopPointerCastable(NewRetTy, OldRetTy, DL)) {

      if (!Caller->use_empty())

        return false;   // Cannot transform this return value.

    }


    if (!CallerPAL.isEmpty() && !Caller->use_empty()) {

      AttrBuilder RAttrs(FT->getContext(), CallerPAL.getRetAttrs());

      if (RAttrs.overlaps(AttributeFuncs::typeIncompatible(

              NewRetTy, CallerPAL.getRetAttrs())))

        return false;   // Attribute not compatible with transformed value.

    }


    // If the callbase is an invoke instruction, and the return value is

    // used by a PHI node in a successor, we cannot change the return type of

    // the call because there is no place to put the cast instruction (without

    // breaking the critical edge).  Bail out in this case.

    if (!Caller->use_empty()) {

      BasicBlock *PhisNotSupportedBlock = nullptr;

      if (auto *II = dyn_cast<InvokeInst>(Caller))

        PhisNotSupportedBlock = II->getNormalDest();

      if (PhisNotSupportedBlock)

        for (User *U : Caller->users())

          if (PHINode *PN = dyn_cast<PHINode>(U))

            if (PN->getParent() == PhisNotSupportedBlock)

              return false;

    }

  }


  unsigned NumActualArgs = Call.arg_size();

  unsigned NumCommonArgs = std::min(FT->getNumParams(), NumActualArgs);


  // Prevent us turning:

  // declare void @takes_i32_inalloca(i32* inalloca)

  //  call void bitcast (void (i32*)* @takes_i32_inalloca to void (i32)*)(i32 0)

  //

  // into:

  //  call void @takes_i32_inalloca(i32* null)

  //

  //  Similarly, avoid folding away bitcasts of byval calls.

  if (Callee->getAttributes().hasAttrSomewhere(Attribute::InAlloca) ||

      Callee->getAttributes().hasAttrSomewhere(Attribute::Preallocated))

    return false;


  auto AI = Call.arg_begin();

  for (unsigned i = 0, e = NumCommonArgs; i != e; ++i, ++AI) {

    Type *ParamTy = FT->getParamType(i);

    Type *ActTy = (*AI)->getType();


    if (!CastInst::isBitOrNoopPointerCastable(ActTy, ParamTy, DL))

      return false;   // Cannot transform this parameter value.


    // Check if there are any incompatible attributes we cannot drop safely.

    if (AttrBuilder(FT->getContext(), CallerPAL.getParamAttrs(i))

            .overlaps(AttributeFuncs::typeIncompatible(

                ParamTy, CallerPAL.getParamAttrs(i),

                AttributeFuncs::ASK_UNSAFE_TO_DROP)))

      return false;   // Attribute not compatible with transformed value.


    if (Call.isInAllocaArgument(i) ||

        CallerPAL.hasParamAttr(i, Attribute::Preallocated))

      return false; // Cannot transform to and from inalloca/preallocated.


    if (CallerPAL.hasParamAttr(i, Attribute::SwiftError))

      return false;


    if (CallerPAL.hasParamAttr(i, Attribute::ByVal) !=

        Callee->getAttributes().hasParamAttr(i, Attribute::ByVal))

      return false; // Cannot transform to or from byval.

  }


  if (FT->getNumParams() < NumActualArgs && FT->isVarArg() &&

      !CallerPAL.isEmpty()) {

    // In this case we have more arguments than the new function type, but we

    // won't be dropping them.  Check that these extra arguments have attributes

    // that are compatible with being a vararg call argument.

    unsigned SRetIdx;

    if (CallerPAL.hasAttrSomewhere(Attribute::StructRet, &SRetIdx) &&

        SRetIdx - AttributeList::FirstArgIndex >= FT->getNumParams())

      return false;

  }


  // Okay, we decided that this is a safe thing to do: go ahead and start

  // inserting cast instructions as necessary.

  SmallVector<Value *, 8> Args;

  SmallVector<AttributeSet, 8> ArgAttrs;

  Args.reserve(NumActualArgs);

  ArgAttrs.reserve(NumActualArgs);


  // Get any return attributes.

  AttrBuilder RAttrs(FT->getContext(), CallerPAL.getRetAttrs());


  // If the return value is not being used, the type may not be compatible

  // with the existing attributes.  Wipe out any problematic attributes.

  RAttrs.remove(

      AttributeFuncs::typeIncompatible(NewRetTy, CallerPAL.getRetAttrs()));


  LLVMContext &Ctx = Call.getContext();

  AI = Call.arg_begin();

  for (unsigned i = 0; i != NumCommonArgs; ++i, ++AI) {

    Type *ParamTy = FT->getParamType(i);


    Value *NewArg = *AI;

    if ((*AI)->getType() != ParamTy)

      NewArg = Builder.CreateBitOrPointerCast(*AI, ParamTy);

    Args.push_back(NewArg);


    // Add any parameter attributes except the ones incompatible with the new

    // type. Note that we made sure all incompatible ones are safe to drop.

    AttributeMask IncompatibleAttrs = AttributeFuncs::typeIncompatible(

        ParamTy, CallerPAL.getParamAttrs(i), AttributeFuncs::ASK_SAFE_TO_DROP);

    ArgAttrs.push_back(

        CallerPAL.getParamAttrs(i).removeAttributes(Ctx, IncompatibleAttrs));

  }


  // If the function takes more arguments than the call was taking, add them

  // now.

  for (unsigned i = NumCommonArgs; i != FT->getNumParams(); ++i) {

    Args.push_back(Constant::getNullValue(FT->getParamType(i)));

    ArgAttrs.push_back(AttributeSet());

  }


  // If we are removing arguments to the function, emit an obnoxious warning.

  if (FT->getNumParams() < NumActualArgs) {

    // TODO: if (!FT->isVarArg()) this call may be unreachable. PR14722

    if (FT->isVarArg()) {

      // Add all of the arguments in their promoted form to the arg list.

      for (unsigned i = FT->getNumParams(); i != NumActualArgs; ++i, ++AI) {

        Type *PTy = getPromotedType((*AI)->getType());

        Value *NewArg = *AI;

        if (PTy != (*AI)->getType()) {

          // Must promote to pass through va_arg area!

          Instruction::CastOps opcode =

            CastInst::getCastOpcode(*AI, false, PTy, false);

          NewArg = Builder.CreateCast(opcode, *AI, PTy);

        }

        Args.push_back(NewArg);


        // Add any parameter attributes.

        ArgAttrs.push_back(CallerPAL.getParamAttrs(i));

      }

    }

  }


  AttributeSet FnAttrs = CallerPAL.getFnAttrs();


  if (NewRetTy->isVoidTy())

    Caller->setName("");   // Void type should not have a name.


  assert((ArgAttrs.size() == FT->getNumParams() || FT->isVarArg()) &&

         "missing argument attributes");

  AttributeList NewCallerPAL = AttributeList::get(

      Ctx, FnAttrs, AttributeSet::get(Ctx, RAttrs), ArgAttrs);


  SmallVector<OperandBundleDef, 1> OpBundles;

  Call.getOperandBundlesAsDefs(OpBundles);


  CallBase *NewCall;

  if (InvokeInst *II = dyn_cast<InvokeInst>(Caller)) {

    NewCall = Builder.CreateInvoke(Callee, II->getNormalDest(),

                                   II->getUnwindDest(), Args, OpBundles);

  } else {

    NewCall = Builder.CreateCall(Callee, Args, OpBundles);

    cast<CallInst>(NewCall)->setTailCallKind(

        cast<CallInst>(Caller)->getTailCallKind());

  }

  NewCall->takeName(Caller);

  NewCall->setCallingConv(Call.getCallingConv());

  NewCall->setAttributes(NewCallerPAL);


  // Preserve prof metadata if any.

  NewCall->copyMetadata(*Caller, {LLVMContext::MD_prof});


  // Insert a cast of the return type as necessary.

  Instruction *NC = NewCall;

  Value *NV = NC;

  if (OldRetTy != NV->getType() && !Caller->use_empty()) {

    assert(!NV->getType()->isVoidTy());

    NV = NC = CastInst::CreateBitOrPointerCast(NC, OldRetTy);

    NC->setDebugLoc(Caller->getDebugLoc());


    auto OptInsertPt = NewCall->getInsertionPointAfterDef();

    assert(OptInsertPt && "No place to insert cast");

    InsertNewInstBefore(NC, *OptInsertPt);

    Worklist.pushUsersToWorkList(*Caller);

  }


  if (!Caller->use_empty())

    replaceInstUsesWith(*Caller, NV);

  else if (Caller->hasValueHandle()) {

    if (OldRetTy == NV->getType())

      ValueHandleBase::ValueIsRAUWd(Caller, NV);

    else

      // We cannot call ValueIsRAUWd with a different type, and the

      // actual tracked value will disappear.

      ValueHandleBase::ValueIsDeleted(Caller);

  }


  eraseInstFromFunction(*Caller);

  return true;

}


/// Turn a call to a function created by init_trampoline / adjust_trampoline

/// intrinsic pair into a direct call to the underlying function.

Instruction *

InstCombinerImpl::transformCallThroughTrampoline(CallBase &Call,

                                                 IntrinsicInst &Tramp) {

  FunctionType *FTy = Call.getFunctionType();

  AttributeList Attrs = Call.getAttributes();


  // If the call already has the 'nest' attribute somewhere then give up -

  // otherwise 'nest' would occur twice after splicing in the chain.

  if (Attrs.hasAttrSomewhere(Attribute::Nest))

    return nullptr;


  Function *NestF = cast<Function>(Tramp.getArgOperand(1)->stripPointerCasts());

  FunctionType *NestFTy = NestF->getFunctionType();


  AttributeList NestAttrs = NestF->getAttributes();

  if (!NestAttrs.isEmpty()) {

    unsigned NestArgNo = 0;

    Type *NestTy = nullptr;

    AttributeSet NestAttr;


    // Look for a parameter marked with the 'nest' attribute.

    for (FunctionType::param_iterator I = NestFTy->param_begin(),

                                      E = NestFTy->param_end();

         I != E; ++NestArgNo, ++I) {

      AttributeSet AS = NestAttrs.getParamAttrs(NestArgNo);

      if (AS.hasAttribute(Attribute::Nest)) {

        // Record the parameter type and any other attributes.

        NestTy = *I;

        NestAttr = AS;

        break;

      }

    }


    if (NestTy) {

      std::vector<Value*> NewArgs;

      std::vector<AttributeSet> NewArgAttrs;

      NewArgs.reserve(Call.arg_size() + 1);

      NewArgAttrs.reserve(Call.arg_size());


      // Insert the nest argument into the call argument list, which may

      // mean appending it.  Likewise for attributes.


      {

        unsigned ArgNo = 0;

        auto I = Call.arg_begin(), E = Call.arg_end();

        do {

          if (ArgNo == NestArgNo) {

            // Add the chain argument and attributes.

            Value *NestVal = Tramp.getArgOperand(2);

            if (NestVal->getType() != NestTy)

              NestVal = Builder.CreateBitCast(NestVal, NestTy, "nest");

            NewArgs.push_back(NestVal);

            NewArgAttrs.push_back(NestAttr);

          }


          if (I == E)

            break;


          // Add the original argument and attributes.

          NewArgs.push_back(*I);

          NewArgAttrs.push_back(Attrs.getParamAttrs(ArgNo));


          ++ArgNo;

          ++I;

        } while (true);

      }


      // The trampoline may have been bitcast to a bogus type (FTy).

      // Handle this by synthesizing a new function type, equal to FTy

      // with the chain parameter inserted.


      std::vector<Type*> NewTypes;

      NewTypes.reserve(FTy->getNumParams()+1);


      // Insert the chain's type into the list of parameter types, which may

      // mean appending it.

      {

        unsigned ArgNo = 0;

        FunctionType::param_iterator I = FTy->param_begin(),

          E = FTy->param_end();


        do {

          if (ArgNo == NestArgNo)

            // Add the chain's type.

            NewTypes.push_back(NestTy);


          if (I == E)

            break;


          // Add the original type.

          NewTypes.push_back(*I);


          ++ArgNo;

          ++I;

        } while (true);

      }


      // Replace the trampoline call with a direct call.  Let the generic

      // code sort out any function type mismatches.

      FunctionType *NewFTy =

          FunctionType::get(FTy->getReturnType(), NewTypes, FTy->isVarArg());

      AttributeList NewPAL =

          AttributeList::get(FTy->getContext(), Attrs.getFnAttrs(),

                             Attrs.getRetAttrs(), NewArgAttrs);


      SmallVector<OperandBundleDef, 1> OpBundles;

      Call.getOperandBundlesAsDefs(OpBundles);


      Instruction *NewCaller;

      if (InvokeInst *II = dyn_cast<InvokeInst>(&Call)) {

        NewCaller = InvokeInst::Create(NewFTy, NestF, II->getNormalDest(),

                                       II->getUnwindDest(), NewArgs, OpBundles);

        cast<InvokeInst>(NewCaller)->setCallingConv(II->getCallingConv());

        cast<InvokeInst>(NewCaller)->setAttributes(NewPAL);

      } else if (CallBrInst *CBI = dyn_cast<CallBrInst>(&Call)) {

        NewCaller =

            CallBrInst::Create(NewFTy, NestF, CBI->getDefaultDest(),

                               CBI->getIndirectDests(), NewArgs, OpBundles);

        cast<CallBrInst>(NewCaller)->setCallingConv(CBI->getCallingConv());

        cast<CallBrInst>(NewCaller)->setAttributes(NewPAL);

      } else {

        NewCaller = CallInst::Create(NewFTy, NestF, NewArgs, OpBundles);

        cast<CallInst>(NewCaller)->setTailCallKind(

            cast<CallInst>(Call).getTailCallKind());

        cast<CallInst>(NewCaller)->setCallingConv(

            cast<CallInst>(Call).getCallingConv());

        cast<CallInst>(NewCaller)->setAttributes(NewPAL);

      }

      NewCaller->setDebugLoc(Call.getDebugLoc());


      return NewCaller;

    }

  }


  // Replace the trampoline call with a direct call.  Since there is no 'nest'

  // parameter, there is no need to adjust the argument list.  Let the generic

  // code sort out any function type mismatches.

  Call.setCalledFunction(FTy, NestF);

  return &Call;

}

Intr
unsigned Intr
Definition: AMDGPUBaseInfo.cpp:2958

Select
AMDGPU Register Bank Select
Definition: AMDGPURegBankSelect.cpp:59

APFloat.h
This file declares a class to represent arbitrary precision floating point values and provide a varie...

APInt.h
This file implements a class to represent arbitrary precision integral constant values and operations...

APSInt.h
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

IT
static cl::opt< ITMode > IT(cl::desc("IT block support"), cl::Hidden, cl::init(DefaultIT), cl::values(clEnumValN(DefaultIT, "arm-default-it", "Generate any type of IT block"), clEnumValN(RestrictedIT, "arm-restrict-it", "Disallow complex IT blocks")))

AliasAnalysis.h

ArrayRef.h

AssumeBundleBuilder.h

AssumeBundleQueries.h

AssumptionCache.h

AtomicOrdering.h
Atomic ordering constants.

AttributeMask.h

Attributes.h
This file contains the simple types necessary to represent the attributes associated with functions a...

From
BlockVerifier::State From
Definition: BlockVerifier.cpp:57

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

Casting.h

CommandLine.h

Compiler.h

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

foldBitOrderCrossLogicOp
static SDValue foldBitOrderCrossLogicOp(SDNode *N, SelectionDAG &DAG)
Definition: DAGCombiner.cpp:10455

DataLayout.h

RetTy
return RetTy
Definition: DeadArgumentElimination.cpp:361

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:353

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition: Debug.h:106

DEBUG_WITH_TYPE
#define DEBUG_WITH_TYPE(TYPE,...)
DEBUG_WITH_TYPE macro - This macro should be used by passes to emit debug information.
Definition: Debug.h:64

DerivedTypes.h

Size
uint64_t Size
Definition: ELFObjHandler.cpp:81

X
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")

DEBUG_TYPE
#define DEBUG_TYPE
Definition: GenericCycleImpl.h:31

GlobalVariable.h

MI
IRTranslator LLVM IR MI
Definition: IRTranslator.cpp:112

BasicBlock.h

Constant.h

Function.h

Instruction.h

IntrinsicInst.h

Type.h

User.h

Value.h

InlineAsm.h

getPromotedType
static Type * getPromotedType(Type *Ty)
Return the specified type promoted as it would be to pass though a va_arg area.
Definition: InstCombineCalls.cpp:94

createOverflowTuple
static Instruction * createOverflowTuple(IntrinsicInst *II, Value *Result, Constant *Overflow)
Creates a result tuple for an overflow intrinsic II with a given Result and a constant Overflow value...
Definition: InstCombineCalls.cpp:839

findInitTrampolineFromAlloca
static IntrinsicInst * findInitTrampolineFromAlloca(Value *TrampMem)
Definition: InstCombineCalls.cpp:3861

removeTriviallyEmptyRange
static bool removeTriviallyEmptyRange(IntrinsicInst &EndI, InstCombinerImpl &IC, std::function< bool(const IntrinsicInst &)> IsStart)
Definition: InstCombineCalls.cpp:791

inputDenormalIsDAZ
static bool inputDenormalIsDAZ(const Function &F, const Type *Ty)
Definition: InstCombineCalls.cpp:892

reassociateMinMaxWithConstantInOperand
static Instruction * reassociateMinMaxWithConstantInOperand(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If this min/max has a matching min/max operand with a constant, try to push the constant operand into...
Definition: InstCombineCalls.cpp:1312

signBitMustBeTheSame
static bool signBitMustBeTheSame(Value *Op0, Value *Op1, const SimplifyQuery &SQ)
Return true if two values Op0 and Op1 are known to have the same sign.
Definition: InstCombineCalls.cpp:1125

moveAddAfterMinMax
static Instruction * moveAddAfterMinMax(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
Try to canonicalize min/max(X + C0, C1) as min/max(X, C1 - C0) + C0.
Definition: InstCombineCalls.cpp:1138

simplifyInvariantGroupIntrinsic
static Instruction * simplifyInvariantGroupIntrinsic(IntrinsicInst &II, InstCombinerImpl &IC)
This function transforms launder.invariant.group and strip.invariant.group like: launder(launder(x)) ...
Definition: InstCombineCalls.cpp:449

haveSameOperands
static bool haveSameOperands(const IntrinsicInst &I, const IntrinsicInst &E, unsigned NumOperands)
Definition: InstCombineCalls.cpp:771

getKnownSign
static std::optional< bool > getKnownSign(Value *Op, const SimplifyQuery &SQ)
Definition: InstCombineCalls.cpp:1098

GuardWideningWindow
static cl::opt< unsigned > GuardWideningWindow("instcombine-guard-widening-window", cl::init(3), cl::desc("How wide an instruction window to bypass looking for " "another guard"))

hasUndefSource
static bool hasUndefSource(AnyMemTransferInst *MI)
Recognize a memcpy/memmove from a trivially otherwise unused alloca.
Definition: InstCombineCalls.cpp:105

foldShuffledIntrinsicOperands
static Instruction * foldShuffledIntrinsicOperands(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If all arguments of the intrinsic are unary shuffles with the same mask, try to shuffle after the int...
Definition: InstCombineCalls.cpp:1400

factorizeMinMaxTree
static Instruction * factorizeMinMaxTree(IntrinsicInst *II)
Reduce a sequence of min/max intrinsics with a common operand.
Definition: InstCombineCalls.cpp:1340

simplifyNeonTbl1
static Value * simplifyNeonTbl1(const IntrinsicInst &II, InstCombiner::BuilderTy &Builder)
Convert a table lookup to shufflevector if the mask is constant.
Definition: InstCombineCalls.cpp:735

foldClampRangeOfTwo
static Instruction * foldClampRangeOfTwo(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If we have a clamp pattern like max (min X, 42), 41 – where the output can only be one of two possibl...
Definition: InstCombineCalls.cpp:1238

simplifyReductionOperand
static Value * simplifyReductionOperand(Value *Arg, bool CanReorderLanes)
Definition: InstCombineCalls.cpp:1486

findInitTrampolineFromBB
static IntrinsicInst * findInitTrampolineFromBB(IntrinsicInst *AdjustTramp, Value *TrampMem)
Definition: InstCombineCalls.cpp:3900

foldIntrinsicUsingDistributiveLaws
static Value * foldIntrinsicUsingDistributiveLaws(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
Definition: InstCombineCalls.cpp:1570

getKnownSignOrZero
static std::optional< bool > getKnownSignOrZero(Value *Op, const SimplifyQuery &SQ)
Definition: InstCombineCalls.cpp:1112

foldMinimumOverTrailingOrLeadingZeroCount
static Value * foldMinimumOverTrailingOrLeadingZeroCount(Value *I0, Value *I1, const DataLayout &DL, InstCombiner::BuilderTy &Builder)
Fold an unsigned minimum of trailing or leading zero bits counts: umin(cttz(CtOp, ZeroUndef),...
Definition: InstCombineCalls.cpp:1519

foldCtpop
static Instruction * foldCtpop(IntrinsicInst &II, InstCombinerImpl &IC)
Definition: InstCombineCalls.cpp:643

foldCttzCtlz
static Instruction * foldCttzCtlz(IntrinsicInst &II, InstCombinerImpl &IC)
Definition: InstCombineCalls.cpp:479

findInitTrampoline
static IntrinsicInst * findInitTrampoline(Value *Callee)
Definition: InstCombineCalls.cpp:3921

fpclassTestIsFCmp0
static FCmpInst::Predicate fpclassTestIsFCmp0(FPClassTest Mask, const Function &F, Type *Ty)
Definition: InstCombineCalls.cpp:900

leftDistributesOverRight
static bool leftDistributesOverRight(Instruction::BinaryOps LOp, bool HasNUW, bool HasNSW, Intrinsic::ID ROp)
Return whether "X LOp (Y ROp Z)" is always equal to "(X LOp Y) ROp (X LOp Z)".
Definition: InstCombineCalls.cpp:1552

reassociateMinMaxWithConstants
static Value * reassociateMinMaxWithConstants(IntrinsicInst *II, IRBuilderBase &Builder, const SimplifyQuery &SQ)
If this min/max has a constant operand and an operand that is a matching min/max with a constant oper...
Definition: InstCombineCalls.cpp:1278

canonicalizeConstantArg0ToArg1
static CallInst * canonicalizeConstantArg0ToArg1(CallInst &Call)
Definition: InstCombineCalls.cpp:826

InstCombineInternal.h
This file provides internal interfaces used to implement the InstCombine.

InstCombiner.h
This file provides the interface for the instcombine pass implementation.

InstrTypes.h

InstructionSimplify.h

InstructionWorklist.h

Instructions.h

Intrinsics.h

KnownBits.h

LLVMContext.h

Loads.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

MathExtras.h

MemoryBuiltins.h

Metadata.h
This file contains the declarations for metadata subclasses.

Range
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))

II
uint64_t IntrinsicInst * II
Definition: NVVMIntrRange.cpp:51

Y
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")

PatternMatch.h

Cond
const SmallVectorImpl< MachineOperand > & Cond
Definition: RISCVRedundantCopyElimination.cpp:75

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

STLFunctionalExtras.h

SimplifyLibCalls.h

SmallBitVector.h
This file implements the SmallBitVector class.

SmallVector.h
This file defines the SmallVector class.

Statepoint.h

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

STATISTIC
#define STATISTIC(VARNAME, DESC)
Definition: Statistic.h:166

Ptr
@ Ptr
Definition: TargetLibraryInfo.cpp:77

Struct
@ Struct
Definition: TargetLibraryInfo.cpp:78

Local.h

getOpcode
static std::optional< unsigned > getOpcode(ArrayRef< VPValue * > Values)
Returns the opcode of Values or ~0 if they do not all agree.
Definition: VPlanSLP.cpp:191

ValueHandle.h

inputDenormalIsIEEE
static bool inputDenormalIsIEEE(const Function &F, const Type *Ty)
Return true if it's possible to assume IEEE treatment of input denormals in F for Val.
Definition: ValueTracking.cpp:4388

ValueTracking.h

VectorUtils.h

RHS
Value * RHS
Definition: X86PartialReduction.cpp:74

LHS
Value * LHS
Definition: X86PartialReduction.cpp:73

FunctionType
Definition: ItaniumDemangle.h:823

VectorType
Definition: ItaniumDemangle.h:1173

llvm::AAResults::getModRefInfoMask
ModRefInfo getModRefInfoMask(const MemoryLocation &Loc, bool IgnoreLocals=false)
Returns a bitmask that should be unconditionally applied to the ModRef info of a memory location.
Definition: AliasAnalysis.cpp:149

llvm::APFloat
Definition: APFloat.h:904

llvm::APFloat::isNegative
bool isNegative() const
Definition: APFloat.h:1445

llvm::APFloat::clearSign
void clearSign()
Definition: APFloat.h:1300

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:78

llvm::APInt::getAllOnes
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition: APInt.h:234

llvm::APInt::getSignMask
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition: APInt.h:229

llvm::APInt::usub_ov
APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1922

llvm::APInt::isZero
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition: APInt.h:380

llvm::APInt::getBitWidth
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition: APInt.h:1468

llvm::APInt::ult
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition: APInt.h:1111

llvm::APInt::sadd_ov
APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1902

llvm::APInt::uadd_ov
APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1909

llvm::APInt::getSplat
static APInt getSplat(unsigned NewLen, const APInt &V)
Return a value containing V broadcasted over NewLen bits.
Definition: APInt.cpp:624

llvm::APInt::getSignedMinValue
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition: APInt.h:219

llvm::APInt::uadd_sat
APInt uadd_sat(const APInt &RHS) const
Definition: APInt.cpp:2010

llvm::APInt::isNonNegative
bool isNonNegative() const
Determine if this APInt Value is non-negative (>= 0)
Definition: APInt.h:334

llvm::APInt::getLowBitsSet
static APInt getLowBitsSet(unsigned numBits, unsigned loBitsSet)
Constructs an APInt value that has the bottom loBitsSet bits set.
Definition: APInt.h:306

llvm::APInt::getZero
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition: APInt.h:200

llvm::APInt::ssub_ov
APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1915

llvm::APSInt::getMinValue
static APSInt getMinValue(uint32_t numBits, bool Unsigned)
Return the APSInt representing the minimum integer value with the given bit width and signedness.
Definition: APSInt.h:311

llvm::APSInt::getMaxValue
static APSInt getMaxValue(uint32_t numBits, bool Unsigned)
Return the APSInt representing the maximum integer value with the given bit width and signedness.
Definition: APSInt.h:303

llvm::AnyMemSetInst
This class represents any memset intrinsic.
Definition: IntrinsicInst.h:1393

llvm::AnyMemTransferInst
Definition: IntrinsicInst.h:1413

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::AssumptionCache::registerAssumption
void registerAssumption(AssumeInst *CI)
Add an @llvm.assume intrinsic to this function's cache.
Definition: AssumptionCache.cpp:185

llvm::AssumptionCache::updateAffectedValues
void updateAffectedValues(AssumeInst *CI)
Update the cache of values being affected by this assumption (i.e.
Definition: AssumptionCache.cpp:97

llvm::AssumptionCache::assumptionsFor
MutableArrayRef< ResultElem > assumptionsFor(const Value *V)
Access the list of assumptions which affect this value.
Definition: AssumptionCache.h:157

llvm::AttrBuilder
Definition: Attributes.h:1064

llvm::AttrBuilder::overlaps
bool overlaps(const AttributeMask &AM) const
Return true if the builder has any attribute that's in the specified builder.
Definition: Attributes.cpp:2300

llvm::AttributeList
Definition: Attributes.h:490

llvm::AttributeList::getFnAttrs
AttributeSet getFnAttrs() const
The function attributes are returned.
Definition: Attributes.cpp:1860

llvm::AttributeList::get
static AttributeList get(LLVMContext &C, ArrayRef< std::pair< unsigned, Attribute > > Attrs)
Create an AttributeList with the specified parameters in it.
Definition: Attributes.cpp:1499

llvm::AttributeList::isEmpty
bool isEmpty() const
Return true if there are no attributes.
Definition: Attributes.h:1025

llvm::AttributeList::getRetAttrs
AttributeSet getRetAttrs() const
The attributes for the ret value are returned.
Definition: Attributes.cpp:1856

llvm::AttributeList::hasAttrSomewhere
bool hasAttrSomewhere(Attribute::AttrKind Kind, unsigned *Index=nullptr) const
Return true if the specified attribute is set for at least one parameter or for the return value.
Definition: Attributes.cpp:1885

llvm::AttributeList::hasParamAttr
bool hasParamAttr(unsigned ArgNo, Attribute::AttrKind Kind) const
Return true if the attribute exists for the given argument.
Definition: Attributes.h:833

llvm::AttributeList::getParamAttrs
AttributeSet getParamAttrs(unsigned ArgNo) const
The attributes for the argument or parameter at the given index are returned.
Definition: Attributes.cpp:1852

llvm::AttributeList::addParamAttribute
AttributeList addParamAttribute(LLVMContext &C, unsigned ArgNo, Attribute::AttrKind Kind) const
Add an argument attribute to the list.
Definition: Attributes.h:628

llvm::AttributeList::FirstArgIndex
@ FirstArgIndex
Definition: Attributes.h:495

llvm::AttributeMask
Definition: AttributeMask.h:29

llvm::AttributeSet
Definition: Attributes.h:345

llvm::AttributeSet::hasAttribute
bool hasAttribute(Attribute::AttrKind Kind) const
Return true if the attribute exists in this set.
Definition: Attributes.cpp:1107

llvm::AttributeSet::removeAttributes
AttributeSet removeAttributes(LLVMContext &C, const AttributeMask &AttrsToRemove) const
Remove the specified attributes from this set.
Definition: Attributes.cpp:962

llvm::AttributeSet::get
static AttributeSet get(LLVMContext &C, const AttrBuilder &B)
Definition: Attributes.cpp:910

llvm::Attribute::get
static Attribute get(LLVMContext &Context, AttrKind Kind, uint64_t Val=0)
Return a uniquified Attribute object.
Definition: Attributes.cpp:95

llvm::Attribute::getWithDereferenceableBytes
static Attribute getWithDereferenceableBytes(LLVMContext &Context, uint64_t Bytes)
Definition: Attributes.cpp:244

llvm::Attribute::getWithDereferenceableOrNullBytes
static Attribute getWithDereferenceableOrNullBytes(LLVMContext &Context, uint64_t Bytes)
Definition: Attributes.cpp:250

llvm::Attribute::getWithAlignment
static Attribute getWithAlignment(LLVMContext &Context, Align Alignment)
Return a uniquified Attribute object that has the specific alignment set.
Definition: Attributes.cpp:234

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:61

llvm::BasicBlock::reverse_iterator
InstListType::reverse_iterator reverse_iterator
Definition: BasicBlock.h:179

llvm::BasicBlock::iterator
InstListType::iterator iterator
Instruction iterators...
Definition: BasicBlock.h:177

llvm::BinaryOpIntrinsic::getRHS
Value * getRHS() const
Definition: IntrinsicInst.h:914

llvm::BinaryOpIntrinsic::isSigned
bool isSigned() const
Whether the intrinsic is signed or unsigned.
Definition: IntrinsicInst.cpp:822

llvm::BinaryOpIntrinsic::getBinaryOp
Instruction::BinaryOps getBinaryOp() const
Returns the binary operation underlying the intrinsic.
Definition: IntrinsicInst.cpp:802

llvm::BinaryOpIntrinsic::getLHS
Value * getLHS() const
Definition: IntrinsicInst.h:913

llvm::BinaryOperator
Definition: InstrTypes.h:170

llvm::BinaryOperator::CreateFAddFMF
static BinaryOperator * CreateFAddFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition: InstrTypes.h:235

llvm::BinaryOperator::CreateNeg
static BinaryOperator * CreateNeg(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Helper functions to construct and inspect unary operations (NEG and NOT) via binary operators SUB and...
Definition: Instructions.cpp:2647

llvm::BinaryOperator::CreateNSW
static BinaryOperator * CreateNSW(BinaryOps Opc, Value *V1, Value *V2, const Twine &Name="")
Definition: InstrTypes.h:278

llvm::BinaryOperator::CreateNot
static BinaryOperator * CreateNot(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition: Instructions.cpp:2660

llvm::BinaryOperator::Create
static BinaryOperator * Create(BinaryOps Op, Value *S1, Value *S2, const Twine &Name=Twine(), InsertPosition InsertBefore=nullptr)
Construct a binary instruction, given the opcode and the two operands.
Definition: Instructions.cpp:2639

llvm::BinaryOperator::CreateNUW
static BinaryOperator * CreateNUW(BinaryOps Opc, Value *V1, Value *V2, const Twine &Name="")
Definition: InstrTypes.h:293

llvm::BinaryOperator::CreateFMulFMF
static BinaryOperator * CreateFMulFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition: InstrTypes.h:243

llvm::BinaryOperator::CreateFDivFMF
static BinaryOperator * CreateFDivFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition: InstrTypes.h:247

llvm::BinaryOperator::CreateFSubFMF
static BinaryOperator * CreateFSubFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition: InstrTypes.h:239

llvm::BinaryOperator::CreateWithCopiedFlags
static BinaryOperator * CreateWithCopiedFlags(BinaryOps Opc, Value *V1, Value *V2, Value *CopyO, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition: InstrTypes.h:218

llvm::BinaryOperator::CreateNSWNeg
static BinaryOperator * CreateNSWNeg(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition: Instructions.cpp:2654

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition: InstrTypes.h:1112

llvm::CallBase::setCallingConv
void setCallingConv(CallingConv::ID CC)
Definition: InstrTypes.h:1403

llvm::CallBase::setDoesNotThrow
void setDoesNotThrow()
Definition: InstrTypes.h:1926

llvm::CallBase::getRetAlign
MaybeAlign getRetAlign() const
Extract the alignment of the return value.
Definition: InstrTypes.h:1739

llvm::CallBase::getOperandBundle
std::optional< OperandBundleUse > getOperandBundle(StringRef Name) const
Return an operand bundle by name, if present.
Definition: InstrTypes.h:2053

llvm::CallBase::getCalledFunction
Function * getCalledFunction() const
Returns the function called, or null if this is an indirect function invocation or the function signa...
Definition: InstrTypes.h:1341

llvm::CallBase::hasRetAttr
bool hasRetAttr(Attribute::AttrKind Kind) const
Determine whether the return value has the given attribute.
Definition: InstrTypes.h:1573

llvm::CallBase::getCalledOperand
Value * getCalledOperand() const
Definition: InstrTypes.h:1334

llvm::CallBase::setAttributes
void setAttributes(AttributeList A)
Set the attributes for this call.
Definition: InstrTypes.h:1420

llvm::CallBase::doesNotThrow
bool doesNotThrow() const
Determine if the call cannot unwind.
Definition: InstrTypes.h:1925

llvm::CallBase::addRetAttr
void addRetAttr(Attribute::AttrKind Kind)
Adds the attribute to the return value.
Definition: InstrTypes.h:1484

llvm::CallBase::getArgOperand
Value * getArgOperand(unsigned i) const
Definition: InstrTypes.h:1286

llvm::CallBase::getIntrinsicID
Intrinsic::ID getIntrinsicID() const
Returns the intrinsic ID of the intrinsic called or Intrinsic::not_intrinsic if the called function i...
Definition: Instructions.cpp:356

llvm::CallBase::Create
static CallBase * Create(CallBase *CB, ArrayRef< OperandBundleDef > Bundles, InsertPosition InsertPt=nullptr)
Create a clone of CB with a different set of operand bundles and insert it before InsertPt.
Definition: Instructions.cpp:301

llvm::CallBase::args
iterator_range< User::op_iterator > args()
Iteration adapter for range-for loops.
Definition: InstrTypes.h:1277

llvm::CallBase::removeOperandBundle
static CallBase * removeOperandBundle(CallBase *CB, uint32_t ID, InsertPosition InsertPt=nullptr)
Create a clone of CB with operand bundle ID removed.
Definition: Instructions.cpp:574

llvm::CallBase::arg_size
unsigned arg_size() const
Definition: InstrTypes.h:1284

llvm::CallBase::setCalledFunction
void setCalledFunction(Function *Fn)
Sets the function called, including updating the function type.
Definition: InstrTypes.h:1380

llvm::CallBrInst
CallBr instruction, tracking function calls that may not return control but instead transfer it to a ...
Definition: Instructions.h:3830

llvm::CallBrInst::Create
static CallBrInst * Create(FunctionType *Ty, Value *Func, BasicBlock *DefaultDest, ArrayRef< BasicBlock * > IndirectDests, ArrayRef< Value * > Args, const Twine &NameStr, InsertPosition InsertBefore=nullptr)
Definition: Instructions.h:3864

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1479

llvm::CallInst::isNoTailCall
bool isNoTailCall() const
Definition: Instructions.h:1596

llvm::CallInst::setTailCallKind
void setTailCallKind(TailCallKind TCK)
Definition: Instructions.h:1598

llvm::CallInst::Create
static CallInst * Create(FunctionType *Ty, Value *F, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Definition: Instructions.h:1514

llvm::CallInst::isMustTailCall
bool isMustTailCall() const
Definition: Instructions.h:1594

llvm::CastInst::getCastOpcode
static Instruction::CastOps getCastOpcode(const Value *Val, bool SrcIsSigned, Type *Ty, bool DstIsSigned)
Returns the opcode necessary to cast Val into Ty using usual casting rules.
Definition: Instructions.cpp:3144

llvm::CastInst::CreateIntegerCast
static CastInst * CreateIntegerCast(Value *S, Type *Ty, bool isSigned, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Create a ZExt, BitCast, or Trunc for int -> int casts.
Definition: Instructions.cpp:3058

llvm::CastInst::isBitOrNoopPointerCastable
static bool isBitOrNoopPointerCastable(Type *SrcTy, Type *DestTy, const DataLayout &DL)
Check whether a bitcast, inttoptr, or ptrtoint cast between these types is valid and a no-op.
Definition: Instructions.cpp:3122

llvm::CastInst::CreateBitOrPointerCast
static CastInst * CreateBitOrPointerCast(Value *S, Type *Ty, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Create a BitCast, a PtrToInt, or an IntToPTr cast instruction.
Definition: Instructions.cpp:3047

llvm::CastInst::Create
static CastInst * Create(Instruction::CastOps, Value *S, Type *Ty, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Provides a way to construct any of the CastInst subclasses using an opcode instead of the subclass's ...
Definition: Instructions.cpp:2972

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition: InstrTypes.h:673

llvm::CmpInst::FCMP_OEQ
@ FCMP_OEQ
0 0 0 1 True if ordered and equal
Definition: InstrTypes.h:676

llvm::CmpInst::BAD_ICMP_PREDICATE
@ BAD_ICMP_PREDICATE
Definition: InstrTypes.h:706

llvm::CmpInst::ICMP_SLT
@ ICMP_SLT
signed less than
Definition: InstrTypes.h:702

llvm::CmpInst::ICMP_SLE
@ ICMP_SLE
signed less or equal
Definition: InstrTypes.h:703

llvm::CmpInst::FCMP_OLT
@ FCMP_OLT
0 1 0 0 True if ordered and less than
Definition: InstrTypes.h:679

llvm::CmpInst::FCMP_OGT
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
Definition: InstrTypes.h:677

llvm::CmpInst::FCMP_OGE
@ FCMP_OGE
0 0 1 1 True if ordered and greater than or equal
Definition: InstrTypes.h:678

llvm::CmpInst::ICMP_UGT
@ ICMP_UGT
unsigned greater than
Definition: InstrTypes.h:696

llvm::CmpInst::ICMP_SGT
@ ICMP_SGT
signed greater than
Definition: InstrTypes.h:700

llvm::CmpInst::FCMP_ONE
@ FCMP_ONE
0 1 1 0 True if ordered and operands are unequal
Definition: InstrTypes.h:681

llvm::CmpInst::FCMP_UEQ
@ FCMP_UEQ
1 0 0 1 True if unordered or equal
Definition: InstrTypes.h:684

llvm::CmpInst::ICMP_ULT
@ ICMP_ULT
unsigned less than
Definition: InstrTypes.h:698

llvm::CmpInst::FCMP_OLE
@ FCMP_OLE
0 1 0 1 True if ordered and less than or equal
Definition: InstrTypes.h:680

llvm::CmpInst::ICMP_EQ
@ ICMP_EQ
equal
Definition: InstrTypes.h:694

llvm::CmpInst::ICMP_NE
@ ICMP_NE
not equal
Definition: InstrTypes.h:695

llvm::CmpInst::FCMP_UNE
@ FCMP_UNE
1 1 1 0 True if unordered or not equal
Definition: InstrTypes.h:689

llvm::CmpInst::BAD_FCMP_PREDICATE
@ BAD_FCMP_PREDICATE
Definition: InstrTypes.h:693

llvm::CmpInst::getSwappedPredicate
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition: InstrTypes.h:825

llvm::CmpInst::getNonStrictPredicate
Predicate getNonStrictPredicate() const
For example, SGT -> SGE, SLT -> SLE, ULT -> ULE, UGT -> UGE.
Definition: InstrTypes.h:869

llvm::CmpInst::getUnorderedPredicate
Predicate getUnorderedPredicate() const
Definition: InstrTypes.h:809

llvm::ConstantAggregateZero::get
static ConstantAggregateZero * get(Type *Ty)
Definition: Constants.cpp:1672

llvm::ConstantExpr::getPointerCast
static Constant * getPointerCast(Constant *C, Type *Ty)
Create a BitCast, AddrSpaceCast, or a PtrToInt cast constant expression.
Definition: Constants.cpp:2253

llvm::ConstantExpr::getSub
static Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
Definition: Constants.cpp:2645

llvm::ConstantExpr::getNeg
static Constant * getNeg(Constant *C, bool HasNSW=false)
Definition: Constants.cpp:2626

llvm::ConstantFP::getInfinity
static Constant * getInfinity(Type *Ty, bool Negative=false)
Definition: Constants.cpp:1103

llvm::ConstantFP::getZero
static Constant * getZero(Type *Ty, bool Negative=false)
Definition: Constants.cpp:1057

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition: Constants.h:83

llvm::ConstantInt::getLimitedValue
uint64_t getLimitedValue(uint64_t Limit=~0ULL) const
getLimitedValue - If the value is smaller than the specified limit, return it, otherwise return the l...
Definition: Constants.h:258

llvm::ConstantInt::getTrue
static ConstantInt * getTrue(LLVMContext &Context)
Definition: Constants.cpp:866

llvm::ConstantInt::getFalse
static ConstantInt * getFalse(LLVMContext &Context)
Definition: Constants.cpp:873

llvm::ConstantInt::getZExtValue
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
Definition: Constants.h:157

llvm::ConstantInt::getValue
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition: Constants.h:148

llvm::ConstantInt::getBool
static ConstantInt * getBool(LLVMContext &Context, bool V)
Definition: Constants.cpp:880

llvm::ConstantPointerNull::get
static ConstantPointerNull * get(PointerType *T)
Static factory methods - Return objects of the specified value.
Definition: Constants.cpp:1826

llvm::ConstantPtrAuth::get
static ConstantPtrAuth * get(Constant *Ptr, ConstantInt *Key, ConstantInt *Disc, Constant *AddrDisc)
Return a pointer signed with the specified parameters.
Definition: Constants.cpp:2072

llvm::ConstantRange
This class represents a range of values.
Definition: ConstantRange.h:47

llvm::ConstantRange::Unsigned
@ Unsigned
Definition: ConstantRange.h:327

llvm::ConstantRange::isFullSet
bool isFullSet() const
Return true if this set contains all of the elements possible for this data-type.
Definition: ConstantRange.cpp:414

llvm::ConstantRange::icmp
bool icmp(CmpInst::Predicate Pred, const ConstantRange &Other) const
Does the predicate Pred hold between ranges this and Other? NOTE: false does not mean that inverse pr...
Definition: ConstantRange.cpp:243

llvm::ConstantRange::contains
bool contains(const APInt &Val) const
Return true if the specified value is in the set.
Definition: ConstantRange.cpp:507

llvm::ConstantRange::intersectWith
ConstantRange intersectWith(const ConstantRange &CR, PreferredRangeType Type=Smallest) const
Return the range that results from the intersection of this range with another range.
Definition: ConstantRange.cpp:581

llvm::ConstantStruct::get
static Constant * get(StructType *T, ArrayRef< Constant * > V)
Definition: Constants.cpp:1378

llvm::Constant
This is an important base class in LLVM.
Definition: Constant.h:42

llvm::Constant::getIntegerValue
static Constant * getIntegerValue(Type *Ty, const APInt &V)
Return the value for an integer or pointer constant, or a vector thereof, with the given scalar value...
Definition: Constants.cpp:403

llvm::Constant::getAllOnesValue
static Constant * getAllOnesValue(Type *Ty)
Definition: Constants.cpp:420

llvm::Constant::getNullValue
static Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
Definition: Constants.cpp:373

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:32

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition: DataLayout.h:63

llvm::DataLayout::getPointerTypeSizeInBits
unsigned getPointerTypeSizeInBits(Type *) const
Layout pointer size, in bits, based on the type.
Definition: DataLayout.cpp:743

llvm::DenseMapBase::try_emplace
std::pair< iterator, bool > try_emplace(KeyT &&Key, Ts &&...Args)
Definition: DenseMap.h:226

llvm::DenseMapBase::count
size_type count(const_arg_type_t< KeyT > Val) const
Return 1 if the specified key is in the map, 0 otherwise.
Definition: DenseMap.h:152

llvm::DenseMap
Definition: DenseMap.h:727

llvm::ElementCount
Definition: TypeSize.h:300

llvm::FMFSource::intersect
static FMFSource intersect(Value *A, Value *B)
Intersect the FMF from two instructions.
Definition: IRBuilder.h:106

llvm::FPExtInst
This class represents an extension of floating point types.
Definition: Instructions.h:4661

llvm::FastMathFlags
Convenience struct for specifying and reasoning about fast-math flags.
Definition: FMF.h:20

llvm::FastMathFlags::setNoSignedZeros
void setNoSignedZeros(bool B=true)
Definition: FMF.h:85

llvm::FastMathFlags::allowReassoc
bool allowReassoc() const
Flag queries.
Definition: FMF.h:65

llvm::FenceInst
An instruction for ordering other memory operations.
Definition: Instructions.h:424

llvm::FenceInst::getSyncScopeID
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this fence instruction.
Definition: Instructions.h:460

llvm::FenceInst::getOrdering
AtomicOrdering getOrdering() const
Returns the ordering constraint of this fence instruction.
Definition: Instructions.h:449

llvm::FunctionType
Class to represent function types.
Definition: DerivedTypes.h:105

llvm::FunctionType::param_iterator
Type::subtype_iterator param_iterator
Definition: DerivedTypes.h:128

llvm::FunctionType::get
static FunctionType * get(Type *Result, ArrayRef< Type * > Params, bool isVarArg)
This static method is the primary way of constructing a FunctionType.

llvm::Function
Definition: Function.h:63

llvm::Function::isConvergent
bool isConvergent() const
Determine if the call is convergent.
Definition: Function.h:611

llvm::Function::getFunctionType
FunctionType * getFunctionType() const
Returns the FunctionType for me.
Definition: Function.h:216

llvm::Function::getCallingConv
CallingConv::ID getCallingConv() const
getCallingConv()/setCallingConv(CC) - These method get and set the calling convention of this functio...
Definition: Function.h:277

llvm::Function::getAttributes
AttributeList getAttributes() const
Return the attribute list for this Function.
Definition: Function.h:353

llvm::Function::doesNotThrow
bool doesNotThrow() const
Determine if the function cannot unwind.
Definition: Function.h:595

llvm::Function::isIntrinsic
bool isIntrinsic() const
isIntrinsic - Returns true if the function's name starts with "llvm.".
Definition: Function.h:256

llvm::GCRelocateInst
Represents calls to the gc.relocate intrinsic.
Definition: IntrinsicInst.h:1802

llvm::GCRelocateInst::getBasePtr
Value * getBasePtr() const
Definition: IntrinsicInst.cpp:867

llvm::GCRelocateInst::getBasePtrIndex
unsigned getBasePtrIndex() const
The index into the associate statepoint's argument list which contains the base pointer of the pointe...
Definition: IntrinsicInst.h:1815

llvm::GCRelocateInst::getDerivedPtr
Value * getDerivedPtr() const
Definition: IntrinsicInst.cpp:878

llvm::GCRelocateInst::getDerivedPtrIndex
unsigned getDerivedPtrIndex() const
The index into the associate statepoint's argument list which contains the pointer whose relocation t...
Definition: IntrinsicInst.h:1821

llvm::GCStatepointInst
Represents a gc.statepoint intrinsic call.
Definition: Statepoint.h:61

llvm::GCStatepointInst::getGCRelocates
std::vector< const GCRelocateInst * > getGCRelocates() const
Get list of all gc reloactes linked to this statepoint May contain several relocations for the same b...
Definition: Statepoint.h:206

llvm::GlobalObject::getMetadata
MDNode * getMetadata(unsigned KindID) const
Get the current metadata attachments for the given kind, if any.
Definition: Value.h:565

llvm::GlobalValue::isDeclaration
bool isDeclaration() const
Return true if the primary definition of this global value is outside of the current translation unit...
Definition: Globals.cpp:296

llvm::GlobalValue::getType
PointerType * getType() const
Global values are always pointers.
Definition: GlobalValue.h:295

llvm::GlobalVariable
Definition: GlobalVariable.h:39

llvm::IRBuilderBase
Common base class shared among various IRBuilders.
Definition: IRBuilder.h:113

llvm::IRBuilderBase::CreateFCmpONE
Value * CreateFCmpONE(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2335

llvm::IRBuilderBase::CreateLdexp
Value * CreateLdexp(Value *Src, Value *Exp, FMFSource FMFSource={}, const Twine &Name="")
Create call to the ldexp intrinsic.
Definition: IRBuilder.h:1057

llvm::IRBuilderBase::CreateLaunderInvariantGroup
Value * CreateLaunderInvariantGroup(Value *Ptr)
Create a launder.invariant.group intrinsic call.
Definition: IRBuilder.cpp:1086

llvm::IRBuilderBase::CreateFCmp
Value * CreateFCmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2390

llvm::IRBuilderBase::getInt1Ty
IntegerType * getInt1Ty()
Fetch the type representing a single bit.
Definition: IRBuilder.h:530

llvm::IRBuilderBase::CreateExtractElement
Value * CreateExtractElement(Value *Vec, Value *Idx, const Twine &Name="")
Definition: IRBuilder.h:2499

llvm::IRBuilderBase::getIntNTy
IntegerType * getIntNTy(unsigned N)
Fetch the type representing an N-bit integer.
Definition: IRBuilder.h:558

llvm::IRBuilderBase::CreateAlignedLoad
LoadInst * CreateAlignedLoad(Type *Ty, Value *Ptr, MaybeAlign Align, const char *Name)
Definition: IRBuilder.h:1815

llvm::IRBuilderBase::CreateFCmpORD
Value * CreateFCmpORD(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2340

llvm::IRBuilderBase::CreateZExtOrTrunc
Value * CreateZExtOrTrunc(Value *V, Type *DestTy, const Twine &Name="")
Create a ZExt or Trunc from the integer value V to DestTy.
Definition: IRBuilder.h:2051

llvm::IRBuilderBase::CreateAndReduce
CallInst * CreateAndReduce(Value *Src)
Create a vector int AND reduction intrinsic of the source vector.
Definition: IRBuilder.cpp:420

llvm::IRBuilderBase::CreateAssumption
CallInst * CreateAssumption(Value *Cond, ArrayRef< OperandBundleDef > OpBundles={})
Create an assume intrinsic call that allows the optimizer to assume that the provided condition will ...
Definition: IRBuilder.cpp:521

llvm::IRBuilderBase::CreateVectorSplat
Value * CreateVectorSplat(unsigned NumElts, Value *V, const Twine &Name="")
Return a vector value that contains.
Definition: IRBuilder.cpp:1163

llvm::IRBuilderBase::getTrue
ConstantInt * getTrue()
Get the constant value for i1 true.
Definition: IRBuilder.h:485

llvm::IRBuilderBase::CreateSelect
Value * CreateSelect(Value *C, Value *True, Value *False, const Twine &Name="", Instruction *MDFrom=nullptr)
Definition: IRBuilder.cpp:1053

llvm::IRBuilderBase::CreateInvoke
InvokeInst * CreateInvoke(FunctionType *Ty, Value *Callee, BasicBlock *NormalDest, BasicBlock *UnwindDest, ArrayRef< Value * > Args, ArrayRef< OperandBundleDef > OpBundles, const Twine &Name="")
Create an invoke instruction.
Definition: IRBuilder.h:1202

llvm::IRBuilderBase::CreateFCmpUNE
Value * CreateFCmpUNE(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2375

llvm::IRBuilderBase::CreateAddReduce
CallInst * CreateAddReduce(Value *Src)
Create a vector int add reduction intrinsic of the source vector.
Definition: IRBuilder.cpp:412

llvm::IRBuilderBase::CreateLShr
Value * CreateLShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
Definition: IRBuilder.h:1480

llvm::IRBuilderBase::getInt32Ty
IntegerType * getInt32Ty()
Fetch the type representing a 32-bit integer.
Definition: IRBuilder.h:545

llvm::IRBuilderBase::CreateCast
Value * CreateCast(Instruction::CastOps Op, Value *V, Type *DestTy, const Twine &Name="", MDNode *FPMathTag=nullptr, FMFSource FMFSource={})
Definition: IRBuilder.h:2186

llvm::IRBuilderBase::CreateNSWMul
Value * CreateNSWMul(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1413

llvm::IRBuilderBase::CreateICmpNE
Value * CreateICmpNE(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2274

llvm::IRBuilderBase::CreateNeg
Value * CreateNeg(Value *V, const Twine &Name="", bool HasNSW=false)
Definition: IRBuilder.h:1733

llvm::IRBuilderBase::CreateOrReduce
CallInst * CreateOrReduce(Value *Src)
Create a vector int OR reduction intrinsic of the source vector.
Definition: IRBuilder.cpp:424

llvm::IRBuilderBase::CreateBinaryIntrinsic
Value * CreateBinaryIntrinsic(Intrinsic::ID ID, Value *LHS, Value *RHS, FMFSource FMFSource={}, const Twine &Name="")
Create a call to intrinsic ID with 2 operands which is mangled on the first type.
Definition: IRBuilder.cpp:889

llvm::IRBuilderBase::CreateIntrinsic
CallInst * CreateIntrinsic(Intrinsic::ID ID, ArrayRef< Type * > Types, ArrayRef< Value * > Args, FMFSource FMFSource={}, const Twine &Name="")
Create a call to intrinsic ID with Args, mangled using Types.
Definition: IRBuilder.cpp:900

llvm::IRBuilderBase::getInt32
ConstantInt * getInt32(uint32_t C)
Get a constant 32-bit value.
Definition: IRBuilder.h:505

llvm::IRBuilderBase::CreateBitOrPointerCast
Value * CreateBitOrPointerCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2234

llvm::IRBuilderBase::CreateNot
Value * CreateNot(Value *V, const Twine &Name="")
Definition: IRBuilder.h:1757

llvm::IRBuilderBase::CreateICmpEQ
Value * CreateICmpEQ(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2270

llvm::IRBuilderBase::CreateFCmpUEQ
Value * CreateFCmpUEQ(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2350

llvm::IRBuilderBase::CreateSub
Value * CreateSub(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1387

llvm::IRBuilderBase::CreateBitCast
Value * CreateBitCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2152

llvm::IRBuilderBase::CreateCopySign
Value * CreateCopySign(Value *LHS, Value *RHS, FMFSource FMFSource={}, const Twine &Name="")
Create call to the copysign intrinsic.
Definition: IRBuilder.h:1050

llvm::IRBuilderBase::CreateUnaryIntrinsic
CallInst * CreateUnaryIntrinsic(Intrinsic::ID ID, Value *V, FMFSource FMFSource={}, const Twine &Name="")
Create a call to intrinsic ID with 1 operand which is mangled on its type.
Definition: IRBuilder.cpp:881

llvm::IRBuilderBase::CreateLoad
LoadInst * CreateLoad(Type *Ty, Value *Ptr, const char *Name)
Provided to resolve 'CreateLoad(Ty, Ptr, "...")' correctly, instead of converting the string to 'bool...
Definition: IRBuilder.h:1798

llvm::IRBuilderBase::CreateZExt
Value * CreateZExt(Value *V, Type *DestTy, const Twine &Name="", bool IsNonNeg=false)
Definition: IRBuilder.h:2033

llvm::IRBuilderBase::CreateShuffleVector
Value * CreateShuffleVector(Value *V1, Value *V2, Value *Mask, const Twine &Name="")
Definition: IRBuilder.h:2533

llvm::IRBuilderBase::CreateFCmpOEQ
Value * CreateFCmpOEQ(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2310

llvm::IRBuilderBase::CreateAnd
Value * CreateAnd(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1518

llvm::IRBuilderBase::CreateStore
StoreInst * CreateStore(Value *Val, Value *Ptr, bool isVolatile=false)
Definition: IRBuilder.h:1811

llvm::IRBuilderBase::CreateAdd
Value * CreateAdd(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1370

llvm::IRBuilderBase::CreatePtrToInt
Value * CreatePtrToInt(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2142

llvm::IRBuilderBase::getFalse
ConstantInt * getFalse()
Get the constant value for i1 false.
Definition: IRBuilder.h:490

llvm::IRBuilderBase::CreateIsNotNull
Value * CreateIsNotNull(Value *Arg, const Twine &Name="")
Return a boolean value testing if Arg != 0.
Definition: IRBuilder.h:2588

llvm::IRBuilderBase::CreateCall
CallInst * CreateCall(FunctionType *FTy, Value *Callee, ArrayRef< Value * > Args={}, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2449

llvm::IRBuilderBase::CreateTrunc
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
Definition: IRBuilder.h:2019

llvm::IRBuilderBase::CreateOr
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1540

llvm::IRBuilderBase::getPtrTy
PointerType * getPtrTy(unsigned AddrSpace=0)
Fetch the type representing a pointer.
Definition: IRBuilder.h:588

llvm::IRBuilderBase::CreateBinOp
Value * CreateBinOp(Instruction::BinaryOps Opc, Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:1671

llvm::IRBuilderBase::CreateElementCount
Value * CreateElementCount(Type *DstType, ElementCount EC)
Create an expression which evaluates to the number of elements in EC at runtime.
Definition: IRBuilder.cpp:98

llvm::IRBuilderBase::CreateIntCast
Value * CreateIntCast(Value *V, Type *DestTy, bool isSigned, const Twine &Name="")
Definition: IRBuilder.h:2225

llvm::IRBuilderBase::CreateFCmpUNO
Value * CreateFCmpUNO(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2345

llvm::IRBuilderBase::CreateIsNull
Value * CreateIsNull(Value *Arg, const Twine &Name="")
Return a boolean value testing if Arg == 0.
Definition: IRBuilder.h:2583

llvm::IRBuilderBase::CreateFNegFMF
Value * CreateFNegFMF(Value *V, FMFSource FMFSource, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:1747

llvm::IRBuilderBase::CreateICmp
Value * CreateICmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2380

llvm::IRBuilderBase::CreateFNeg
Value * CreateFNeg(Value *V, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:1742

llvm::IRBuilderBase::CreateAddrSpaceCast
Value * CreateAddrSpaceCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2157

llvm::IRBuilderBase::CreateMul
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1404

llvm::IRBuilderBase::CreateStripInvariantGroup
Value * CreateStripInvariantGroup(Value *Ptr)
Create a strip.invariant.group intrinsic call.
Definition: IRBuilder.cpp:1102

llvm::IRBuilder< TargetFolder, IRBuilderCallbackInserter >

llvm::InlineAsm
Definition: InlineAsm.h:34

llvm::InsertValueInst::Create
static InsertValueInst * Create(Value *Agg, Value *Val, ArrayRef< unsigned > Idxs, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Definition: Instructions.h:2519

llvm::InstCombinerImpl
Definition: InstCombineInternal.h:61

llvm::InstCombinerImpl::FoldOpIntoSelect
Instruction * FoldOpIntoSelect(Instruction &Op, SelectInst *SI, bool FoldWithMultiUse=false)
Given an instruction with a select as one operand and a constant as the other operand,...
Definition: InstructionCombining.cpp:1687

llvm::InstCombinerImpl::computeKnownFPClass
KnownFPClass computeKnownFPClass(Value *Val, FastMathFlags FMF, FPClassTest Interested=fcAllFlags, const Instruction *CtxI=nullptr, unsigned Depth=0) const
Definition: InstCombineInternal.h:200

llvm::InstCombinerImpl::SimplifyDemandedVectorElts
Value * SimplifyDemandedVectorElts(Value *V, APInt DemandedElts, APInt &PoisonElts, unsigned Depth=0, bool AllowMultipleUsers=false) override
The specified value produces a vector with any number of elements.
Definition: InstCombineSimplifyDemanded.cpp:1393

llvm::InstCombinerImpl::SimplifyAnyMemSet
Instruction * SimplifyAnyMemSet(AnyMemSetInst *MI)
Definition: InstCombineCalls.cpp:217

llvm::InstCombinerImpl::getLosslessUnsignedTrunc
Constant * getLosslessUnsignedTrunc(Constant *C, Type *TruncTy)
Definition: InstCombineInternal.h:231

llvm::InstCombinerImpl::visitFree
Instruction * visitFree(CallInst &FI, Value *FreedOp)
Definition: InstructionCombining.cpp:3547

llvm::InstCombinerImpl::visitCallBrInst
Instruction * visitCallBrInst(CallBrInst &CBI)
Definition: InstCombineCalls.cpp:3832

llvm::InstCombinerImpl::eraseInstFromFunction
Instruction * eraseInstFromFunction(Instruction &I) override
Combiner aware instruction erasure.
Definition: InstCombineInternal.h:474

llvm::InstCombinerImpl::SimplifyDemandedBits
bool SimplifyDemandedBits(Instruction *I, unsigned Op, const APInt &DemandedMask, KnownBits &Known, unsigned Depth, const SimplifyQuery &Q) override
This form of SimplifyDemandedBits simplifies the specified instruction operand if possible,...
Definition: InstCombineSimplifyDemanded.cpp:95

llvm::InstCombinerImpl::tryGetLog2
Value * tryGetLog2(Value *Op, bool AssumeNonZero)
Definition: InstCombineInternal.h:795

llvm::InstCombinerImpl::visitFenceInst
Instruction * visitFenceInst(FenceInst &FI)
Definition: InstCombineCalls.cpp:3799

llvm::InstCombinerImpl::visitInvokeInst
Instruction * visitInvokeInst(InvokeInst &II)
Definition: InstCombineCalls.cpp:3827

llvm::InstCombinerImpl::getLosslessSignedTrunc
Constant * getLosslessSignedTrunc(Constant *C, Type *TruncTy)
Definition: InstCombineInternal.h:235

llvm::InstCombinerImpl::SimplifyDemandedInstructionBits
bool SimplifyDemandedInstructionBits(Instruction &Inst)
Tries to simplify operands to an integer instruction based on its demanded bits.
Definition: InstCombineSimplifyDemanded.cpp:87

llvm::InstCombinerImpl::CreateNonTerminatorUnreachable
void CreateNonTerminatorUnreachable(Instruction *InsertAt)
Create and insert the idiom we use to indicate a block is unreachable without having to rewrite the C...
Definition: InstCombineInternal.h:461

llvm::InstCombinerImpl::visitVAEndInst
Instruction * visitVAEndInst(VAEndInst &I)
Definition: InstCombineCalls.cpp:818

llvm::InstCombinerImpl::matchBSwapOrBitReverse
Instruction * matchBSwapOrBitReverse(Instruction &I, bool MatchBSwaps, bool MatchBitReversals)
Given an initial instruction, check to see if it is the root of a bswap/bitreverse idiom.
Definition: InstCombineAndOrXor.cpp:2861

llvm::InstCombinerImpl::visitAllocSite
Instruction * visitAllocSite(Instruction &FI)
Definition: InstructionCombining.cpp:3331

llvm::InstCombinerImpl::SimplifyAnyMemTransfer
Instruction * SimplifyAnyMemTransfer(AnyMemTransferInst *MI)
Definition: InstCombineCalls.cpp:115

llvm::InstCombinerImpl::computeOverflow
OverflowResult computeOverflow(Instruction::BinaryOps BinaryOp, bool IsSigned, Value *LHS, Value *RHS, Instruction *CxtI) const
Definition: InstCombineCompares.cpp:6264

llvm::InstCombinerImpl::visitCallInst
Instruction * visitCallInst(CallInst &CI)
CallInst simplification.
Definition: InstCombineCalls.cpp:1623

llvm::InstCombiner::SQ
SimplifyQuery SQ
Definition: InstCombiner.h:77

llvm::InstCombiner::isFreeToInvert
bool isFreeToInvert(Value *V, bool WillInvertAllUses, bool &DoesConsume)
Return true if the specified value is free to invert (apply ~ to).
Definition: InstCombiner.h:228

llvm::InstCombiner::getDominatorTree
DominatorTree & getDominatorTree() const
Definition: InstCombiner.h:336

llvm::InstCombiner::BFI
BlockFrequencyInfo * BFI
Definition: InstCombiner.h:79

llvm::InstCombiner::TLI
TargetLibraryInfo & TLI
Definition: InstCombiner.h:74

llvm::InstCombiner::isKnownToBeAPowerOfTwo
bool isKnownToBeAPowerOfTwo(const Value *V, bool OrZero=false, unsigned Depth=0, const Instruction *CxtI=nullptr)
Definition: InstCombiner.h:443

llvm::InstCombiner::InsertNewInstBefore
Instruction * InsertNewInstBefore(Instruction *New, BasicBlock::iterator Old)
Inserts an instruction New before instruction Old.
Definition: InstCombiner.h:368

llvm::InstCombiner::AA
AAResults * AA
Definition: InstCombiner.h:70

llvm::InstCombiner::replaceInstUsesWith
Instruction * replaceInstUsesWith(Instruction &I, Value *V)
A combiner-aware RAUW-like routine.
Definition: InstCombiner.h:388

llvm::InstCombiner::replaceUse
void replaceUse(Use &U, Value *NewValue)
Replace use and add the previously used value to the worklist.
Definition: InstCombiner.h:420

llvm::InstCombiner::Worklist
InstructionWorklist & Worklist
A worklist of the instructions that need to be simplified.
Definition: InstCombiner.h:65

llvm::InstCombiner::DL
const DataLayout & DL
Definition: InstCombiner.h:76

llvm::InstCombiner::DC
DomConditionCache DC
Definition: InstCombiner.h:82

llvm::InstCombiner::targetInstCombineIntrinsic
std::optional< Instruction * > targetInstCombineIntrinsic(IntrinsicInst &II)
Definition: InstructionCombining.cpp:156

llvm::InstCombiner::AC
AssumptionCache & AC
Definition: InstCombiner.h:73

llvm::InstCombiner::replaceOperand
Instruction * replaceOperand(Instruction &I, unsigned OpNum, Value *V)
Replace operand of instruction and add old operand to the worklist.
Definition: InstCombiner.h:412

llvm::InstCombiner::DT
DominatorTree & DT
Definition: InstCombiner.h:75

llvm::InstCombiner::PSI
ProfileSummaryInfo * PSI
Definition: InstCombiner.h:81

llvm::InstCombiner::computeKnownBits
void computeKnownBits(const Value *V, KnownBits &Known, unsigned Depth, const Instruction *CxtI) const
Definition: InstCombiner.h:433

llvm::InstCombiner::Builder
BuilderTy & Builder
Definition: InstCombiner.h:61

llvm::InstCombiner::getAssumptionCache
AssumptionCache & getAssumptionCache() const
Definition: InstCombiner.h:334

llvm::InstCombiner::MaskedValueIsZero
bool MaskedValueIsZero(const Value *V, const APInt &Mask, unsigned Depth=0, const Instruction *CxtI=nullptr) const
Definition: InstCombiner.h:450

llvm::InstCombiner::ORE
OptimizationRemarkEmitter & ORE
Definition: InstCombiner.h:78

llvm::InstCombiner::getFreelyInverted
Value * getFreelyInverted(Value *V, bool WillInvertAllUses, BuilderTy *Builder, bool &DoesConsume)
Definition: InstCombiner.h:209

llvm::InstCombiner::getSimplifyQuery
const SimplifyQuery & getSimplifyQuery() const
Definition: InstCombiner.h:338

llvm::InstCombiner::ComputeMaxSignificantBits
unsigned ComputeMaxSignificantBits(const Value *Op, unsigned Depth=0, const Instruction *CxtI=nullptr) const
Definition: InstCombiner.h:460

llvm::InstructionWorklist::pushValue
void pushValue(Value *V)
Definition: InstructionWorklist.h:68

llvm::InstructionWorklist::pushUsersToWorkList
void pushUsersToWorkList(Instruction &I)
When an instruction is simplified, add all users of the instruction to the work lists because they mi...
Definition: InstructionWorklist.h:106

llvm::InstructionWorklist::add
void add(Instruction *I)
Add instruction to the worklist.
Definition: InstructionWorklist.h:44

llvm::Instruction
Definition: Instruction.h:68

llvm::Instruction::setHasNoUnsignedWrap
void setHasNoUnsignedWrap(bool b=true)
Set or clear the nuw flag on this instruction, which must be an operator which supports this flag.
Definition: Instruction.cpp:365

llvm::Instruction::mayWriteToMemory
bool mayWriteToMemory() const LLVM_READONLY
Return true if this instruction may modify memory.
Definition: Instruction.cpp:997

llvm::Instruction::copyIRFlags
void copyIRFlags(const Value *V, bool IncludeWrapFlags=true)
Convenience method to copy supported exact, fast-math, and (optionally) wrapping flags from V to this...
Definition: Instruction.cpp:646

llvm::Instruction::setHasNoSignedWrap
void setHasNoSignedWrap(bool b=true)
Set or clear the nsw flag on this instruction, which must be an operator which supports this flag.
Definition: Instruction.cpp:372

llvm::Instruction::getModule
const Module * getModule() const
Return the module owning the function this instruction belongs to or nullptr it the function does not...
Definition: Instruction.cpp:68

llvm::Instruction::setAAMetadata
void setAAMetadata(const AAMDNodes &N)
Sets the AA metadata on this instruction from the AAMDNodes structure.
Definition: Metadata.cpp:1764

llvm::Instruction::getPrevNonDebugInstruction
const Instruction * getPrevNonDebugInstruction(bool SkipPseudoOp=false) const
Return a pointer to the previous non-debug instruction in the same basic block as 'this',...
Definition: Instruction.cpp:1220

llvm::Instruction::getFunction
const Function * getFunction() const
Return the function this instruction belongs to.
Definition: Instruction.cpp:72

llvm::Instruction::getNextNonDebugInstruction
const Instruction * getNextNonDebugInstruction(bool SkipPseudoOp=false) const
Return a pointer to the next non-debug instruction in the same basic block as 'this',...
Definition: Instruction.cpp:1212

llvm::Instruction::setMetadata
void setMetadata(unsigned KindID, MDNode *Node)
Set the metadata of the specified kind to the specified node.
Definition: Metadata.cpp:1679

llvm::Instruction::getOpcode
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
Definition: Instruction.h:274

llvm::Instruction::BinaryOps
BinaryOps
Definition: Instruction.h:972

llvm::Instruction::getInsertionPointAfterDef
std::optional< InstListType::iterator > getInsertionPointAfterDef()
Get the first insertion point at which the result of this instruction is defined.
Definition: Instruction.cpp:330

llvm::Instruction::isIdenticalTo
bool isIdenticalTo(const Instruction *I) const LLVM_READONLY
Return true if the specified instruction is exactly identical to the current one.
Definition: Instruction.cpp:900

llvm::Instruction::setDebugLoc
void setDebugLoc(DebugLoc Loc)
Set the debug location information for this instruction.
Definition: Instruction.h:472

llvm::Instruction::copyMetadata
void copyMetadata(const Instruction &SrcInst, ArrayRef< unsigned > WL=ArrayRef< unsigned >())
Copy metadata from SrcInst to this instruction.
Definition: Instruction.cpp:1331

llvm::Instruction::moveBefore
void moveBefore(Instruction *MovePos)
Unlink this instruction from its current basic block and insert it into the basic block that MovePos ...
Definition: Instruction.cpp:169

llvm::Instruction::CastOps
CastOps
Definition: Instruction.h:986

llvm::IntegerType
Class to represent integer types.
Definition: DerivedTypes.h:42

llvm::IntegerType::get
static IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition: Type.cpp:311

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:48

llvm::IntrinsicInst::getIntrinsicID
Intrinsic::ID getIntrinsicID() const
Return the intrinsic ID of this intrinsic.
Definition: IntrinsicInst.h:55

llvm::InvokeInst
Invoke instruction.
Definition: Instructions.h:3670

llvm::InvokeInst::Create
static InvokeInst * Create(FunctionType *Ty, Value *Func, BasicBlock *IfNormal, BasicBlock *IfException, ArrayRef< Value * > Args, const Twine &NameStr, InsertPosition InsertBefore=nullptr)
Definition: Instructions.h:3710

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67

llvm::LLVMContext::OB_kcfi
@ OB_kcfi
Definition: LLVMContext.h:97

llvm::LLVMContext::OB_gc_live
@ OB_gc_live
Definition: LLVMContext.h:94

llvm::LibCallSimplifier
LibCallSimplifier - This class implements a collection of optimizations that replace well formed call...
Definition: SimplifyLibCalls.h:103

llvm::LoadInst
An instruction for reading from memory.
Definition: Instructions.h:176

llvm::MDNode
Metadata node.
Definition: Metadata.h:1073

llvm::MDNode::get
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
Definition: Metadata.h:1549

llvm::MinMaxIntrinsic::getPredicate
ICmpInst::Predicate getPredicate() const
Returns the comparison predicate underlying the intrinsic.
Definition: IntrinsicInst.h:798

llvm::MinMaxIntrinsic::isSigned
bool isSigned() const
Whether the intrinsic is signed or unsigned.
Definition: IntrinsicInst.h:808

llvm::Module
A Module instance is used to store all the information related to an LLVM module.
Definition: Module.h:65

llvm::OperandBundleDefT
A container for an operand bundle being viewed as a set of values rather than a set of uses.
Definition: InstrTypes.h:1065

llvm::Operator::getOpcode
unsigned getOpcode() const
Return the opcode for this Instruction or ConstantExpr.
Definition: Operator.h:42

llvm::OverflowingBinaryOperator
Utility class for integer operators which may exhibit overflow - Add, Sub, Mul, and Shl.
Definition: Operator.h:77

llvm::OverflowingBinaryOperator::hasNoSignedWrap
bool hasNoSignedWrap() const
Test whether this operation is known to never undergo signed overflow, aka the nsw property.
Definition: Operator.h:110

llvm::OverflowingBinaryOperator::hasNoUnsignedWrap
bool hasNoUnsignedWrap() const
Test whether this operation is known to never undergo unsigned overflow, aka the nuw property.
Definition: Operator.h:104

llvm::OverflowingBinaryOperator::isCommutative
bool isCommutative() const
Return true if the instruction is commutative.
Definition: Operator.h:127

llvm::PHINode
Definition: Instructions.h:2600

llvm::PoisonValue::get
static PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Definition: Constants.cpp:1878

llvm::SaturatingInst
Represents a saturating add/sub intrinsic.
Definition: IntrinsicInst.h:948

llvm::SelectInst
This class represents the LLVM 'select' instruction.
Definition: Instructions.h:1657

llvm::SelectInst::Create
static SelectInst * Create(Value *C, Value *S1, Value *S2, const Twine &NameStr="", InsertPosition InsertBefore=nullptr, Instruction *MDFrom=nullptr)
Definition: Instructions.h:1682

llvm::ShuffleVectorInst
This instruction constructs a fixed permutation of two input vectors.
Definition: Instructions.h:1901

llvm::SmallBitVector
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
Definition: SmallBitVector.h:35

llvm::SmallBitVector::set
SmallBitVector & set()
Definition: SmallBitVector.h:366

llvm::SmallBitVector::test
bool test(unsigned Idx) const
Definition: SmallBitVector.h:472

llvm::SmallBitVector::all
bool all() const
Returns true if all bits are set.
Definition: SmallBitVector.h:216

llvm::SmallPtrSetImplBase::size
size_type size() const
Definition: SmallPtrSet.h:94

llvm::SmallPtrSetImpl::count
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
Definition: SmallPtrSet.h:452

llvm::SmallPtrSetImpl::insert
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
Definition: SmallPtrSet.h:384

llvm::SmallPtrSet
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
Definition: SmallPtrSet.h:519

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:81

llvm::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:78

llvm::SmallVectorImpl::reserve
void reserve(size_type N)
Definition: SmallVector.h:663

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:413

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196

llvm::StoreInst
An instruction for storing to memory.
Definition: Instructions.h:292

llvm::StoreInst::setVolatile
void setVolatile(bool V)
Specify whether this is a volatile store or not.
Definition: Instructions.h:328

llvm::StoreInst::setAlignment
void setAlignment(Align Align)
Definition: Instructions.h:337

llvm::StoreInst::setOrdering
void setOrdering(AtomicOrdering Ordering)
Sets the ordering constraint of this store instruction.
Definition: Instructions.h:348

llvm::StructType
Class to represent struct types.
Definition: DerivedTypes.h:218

llvm::TargetLibraryInfoImpl::isCallingConvCCompatible
static bool isCallingConvCCompatible(CallBase *CI)
Returns true if call site / callee has cdecl-compatible calling conventions.
Definition: TargetLibraryInfo.cpp:152

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition: TargetLibraryInfo.h:280

llvm::TruncInst
This class represents a truncation of integer types.
Definition: Instructions.h:4503

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::getIntegerBitWidth
unsigned getIntegerBitWidth() const

llvm::Type::getFltSemantics
const fltSemantics & getFltSemantics() const

llvm::Type::isPointerTy
bool isPointerTy() const
True if this is an instance of PointerType.
Definition: Type.h:264

llvm::Type::getScalarSizeInBits
unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.

llvm::Type::isStructTy
bool isStructTy() const
True if this is an instance of StructType.
Definition: Type.h:258

llvm::Type::getWithNewBitWidth
Type * getWithNewBitWidth(unsigned NewBitWidth) const
Given an integer or vector type, change the lane bitwidth to NewBitwidth, whilst keeping the old numb...

llvm::Type::getContext
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition: Type.h:128

llvm::Type::canLosslesslyBitCastTo
bool canLosslesslyBitCastTo(Type *Ty) const
Return true if this type could be converted with a lossless BitCast to type 'Ty'.

llvm::Type::getInt32Ty
static IntegerType * getInt32Ty(LLVMContext &C)

llvm::Type::getInt64Ty
static IntegerType * getInt64Ty(LLVMContext &C)

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition: Type.h:237

llvm::Type::isVoidTy
bool isVoidTy() const
Return true if this is 'void'.
Definition: Type.h:139

llvm::Type::getScalarType
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition: Type.h:355

llvm::UnaryOperator::CreateWithCopiedFlags
static UnaryOperator * CreateWithCopiedFlags(UnaryOps Opc, Value *V, Instruction *CopyO, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition: InstrTypes.h:138

llvm::UnaryOperator::CreateFNegFMF
static UnaryOperator * CreateFNegFMF(Value *Op, Instruction *FMFSource, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition: InstrTypes.h:146

llvm::UndefValue::get
static UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
Definition: Constants.cpp:1859

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition: Use.h:43

llvm::User
Definition: User.h:44

llvm::User::setOperand
void setOperand(unsigned i, Value *Val)
Definition: User.h:233

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition: User.h:228

llvm::VAEndInst
This represents the llvm.va_end intrinsic.
Definition: IntrinsicInst.h:1485

llvm::ValueHandleBase::ValueIsDeleted
static void ValueIsDeleted(Value *V)
Definition: Value.cpp:1202

llvm::ValueHandleBase::ValueIsRAUWd
static void ValueIsRAUWd(Value *Old, Value *New)
Definition: Value.cpp:1255

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Value::MaximumAlignment
static constexpr uint64_t MaximumAlignment
Definition: Value.h:811

llvm::Value::setMetadata
void setMetadata(unsigned KindID, MDNode *Node)
Set a particular kind of metadata attachment.
Definition: Metadata.cpp:1531

llvm::Value::hasOneUse
bool hasOneUse() const
Return true if there is exactly one use of this value.
Definition: Value.h:434

llvm::Value::users
iterator_range< user_iterator > users()
Definition: Value.h:421

llvm::Value::dropDroppableUse
static void dropDroppableUse(Use &U)
Remove the droppable use U.
Definition: Value.cpp:217

llvm::Value::stripPointerCasts
const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Definition: Value.cpp:694

llvm::Value::use_empty
bool use_empty() const
Definition: Value.h:344

llvm::Value::getContext
LLVMContext & getContext() const
All values hold a context through their type.
Definition: Value.cpp:1075

llvm::Value::MaxAlignmentExponent
static constexpr unsigned MaxAlignmentExponent
The maximum alignment for instructions.
Definition: Value.h:810

llvm::Value::getName
StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:309

llvm::Value::takeName
void takeName(Value *V)
Transfer the name from V to this value.
Definition: Value.cpp:383

llvm::VectorType
Base class of all SIMD vector types.
Definition: DerivedTypes.h:427

llvm::VectorType::getElementCount
ElementCount getElementCount() const
Return an ElementCount instance to represent the (possibly scalable) number of elements in the vector...
Definition: DerivedTypes.h:665

llvm::WithOverflowInst
Represents an op.with.overflow intrinsic.
Definition: IntrinsicInst.h:927

llvm::cl::opt
Definition: CommandLine.h:1423

llvm::details::FixedOrScalableQuantity< ElementCount, unsigned >::isKnownLT
static constexpr bool isKnownLT(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition: TypeSize.h:218

llvm::details::FixedOrScalableQuantity< ElementCount, unsigned >::isKnownGT
static constexpr bool isKnownGT(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition: TypeSize.h:225

llvm::ilist_detail::node_parent_access::getParent
const ParentTy * getParent() const
Definition: ilist_node.h:32

llvm::ilist_node_impl::getIterator
self_iterator getIterator()
Definition: ilist_node.h:132

uint32_t

uint64_t

unsigned

DebugInfo.h

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::AArch64PACKey::IA
@ IA
Definition: AArch64BaseInfo.h:875

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition: AMDGPUMetadata.h:395

llvm::AMDGPU::HSAMD::Kernel::Key::Attrs
constexpr char Attrs[]
Key for Kernel::Metadata::mAttrs.
Definition: AMDGPUMetadata.h:393

llvm::AttributeFuncs::ASK_UNSAFE_TO_DROP
@ ASK_UNSAFE_TO_DROP
Definition: Attributes.h:1297

llvm::AttributeFuncs::ASK_SAFE_TO_DROP
@ ASK_SAFE_TO_DROP
Definition: Attributes.h:1296

llvm::AttributeFuncs::typeIncompatible
AttributeMask typeIncompatible(Type *Ty, AttributeSet AS, AttributeSafetyKind ASK=ASK_ALL)
Which attributes cannot be applied to a type.
Definition: Attributes.cpp:2349

llvm::BitmaskEnumDetail::Mask
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
Definition: BitmaskEnum.h:125

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::Intrinsic::getOrInsertDeclaration
Function * getOrInsertDeclaration(Module *M, ID id, ArrayRef< Type * > Tys={})
Look up the Function declaration of the intrinsic id in the Module M.
Definition: Intrinsics.cpp:731

llvm::M68k::MemAddrModeKind::U
@ U

llvm::M68k::MemAddrModeKind::V
@ V

llvm::M68k::MemAddrModeKind::L
@ L

llvm::MCID::Call
@ Call
Definition: MCInstrDesc.h:156

llvm::PatternMatch::m_AllOnes
cst_pred_ty< is_all_ones > m_AllOnes()
Match an integer or vector with all bits set.
Definition: PatternMatch.h:524

llvm::PatternMatch::m_And
BinaryOp_match< LHS, RHS, Instruction::And > m_And(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1216

llvm::PatternMatch::m_Add
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1102

llvm::PatternMatch::m_BinOp
class_match< BinaryOperator > m_BinOp()
Match an arbitrary binary operation and ignore it.
Definition: PatternMatch.h:100

llvm::PatternMatch::m_BitReverse
m_Intrinsic_Ty< Opnd0 >::Ty m_BitReverse(const Opnd0 &Op0)
Definition: PatternMatch.h:2692

llvm::PatternMatch::m_Constant
class_match< Constant > m_Constant()
Match an arbitrary Constant and ignore it.
Definition: PatternMatch.h:165

llvm::PatternMatch::m_c_And
BinaryOp_match< LHS, RHS, Instruction::And, true > m_c_And(const LHS &L, const RHS &R)
Matches an And with LHS and RHS in either order.
Definition: PatternMatch.h:2798

llvm::PatternMatch::m_Trunc
CastInst_match< OpTy, TruncInst > m_Trunc(const OpTy &Op)
Matches Trunc.
Definition: PatternMatch.h:2075

llvm::PatternMatch::m_Xor
BinaryOp_match< LHS, RHS, Instruction::Xor > m_Xor(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1228

llvm::PatternMatch::m_NSWSub
OverflowingBinaryOp_match< LHS, RHS, Instruction::Sub, OverflowingBinaryOperator::NoSignedWrap > m_NSWSub(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1289

llvm::PatternMatch::m_SpecificInt
specific_intval< false > m_SpecificInt(const APInt &V)
Match a specific integer value or vector with all elements equal to the value.
Definition: PatternMatch.h:982

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition: PatternMatch.h:49

llvm::PatternMatch::m_Instruction
bind_ty< Instruction > m_Instruction(Instruction *&I)
Match an instruction, capturing it if we match.
Definition: PatternMatch.h:826

llvm::PatternMatch::m_Specific
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
Definition: PatternMatch.h:885

llvm::PatternMatch::m_NSWNeg
OverflowingBinaryOp_match< cst_pred_ty< is_zero_int >, ValTy, Instruction::Sub, OverflowingBinaryOperator::NoSignedWrap > m_NSWNeg(const ValTy &V)
Matches a 'Neg' as 'sub nsw 0, V'.
Definition: PatternMatch.h:2829

llvm::PatternMatch::m_ConstantInt
class_match< ConstantInt > m_ConstantInt()
Match an arbitrary ConstantInt and ignore it.
Definition: PatternMatch.h:168

llvm::PatternMatch::m_One
cst_pred_ty< is_one > m_One()
Match an integer 1 or a vector with all elements equal to 1.
Definition: PatternMatch.h:592

llvm::PatternMatch::m_Select
ThreeOps_match< Cond, LHS, RHS, Instruction::Select > m_Select(const Cond &C, const LHS &L, const RHS &R)
Matches SelectInst.
Definition: PatternMatch.h:1799

llvm::PatternMatch::m_NegZeroFP
cstfp_pred_ty< is_neg_zero_fp > m_NegZeroFP()
Match a floating-point negative zero.
Definition: PatternMatch.h:782

llvm::PatternMatch::m_SpecificFP
specific_fpval m_SpecificFP(double V)
Match a specific floating point value or vector with all elements equal to the value.
Definition: PatternMatch.h:928

llvm::PatternMatch::m_LogicalShift
BinOpPred_match< LHS, RHS, is_logical_shift_op > m_LogicalShift(const LHS &L, const RHS &R)
Matches logical shift operations.
Definition: PatternMatch.h:1533

llvm::PatternMatch::m_CombineAnd
match_combine_and< LTy, RTy > m_CombineAnd(const LTy &L, const RTy &R)
Combine two pattern matchers matching L && R.
Definition: PatternMatch.h:245

llvm::PatternMatch::m_SMin
MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > m_SMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2348

llvm::PatternMatch::m_c_Xor
BinaryOp_match< LHS, RHS, Instruction::Xor, true > m_c_Xor(const LHS &L, const RHS &R)
Matches an Xor with LHS and RHS in either order.
Definition: PatternMatch.h:2812

llvm::PatternMatch::m_Deferred
deferredval_ty< Value > m_Deferred(Value *const &V)
Like m_Specific(), but works if the specific value to match is determined as part of the same match()...
Definition: PatternMatch.h:903

llvm::PatternMatch::m_ZeroInt
cst_pred_ty< is_zero_int > m_ZeroInt()
Match an integer 0 or a vector with all elements equal to 0.
Definition: PatternMatch.h:599

llvm::PatternMatch::m_APIntAllowPoison
apint_match m_APIntAllowPoison(const APInt *&Res)
Match APInt while allowing poison in splat vector constants.
Definition: PatternMatch.h:305

llvm::PatternMatch::m_ZExtOrSExtOrSelf
match_combine_or< match_combine_or< CastInst_match< OpTy, ZExtInst >, CastInst_match< OpTy, SExtInst > >, OpTy > m_ZExtOrSExtOrSelf(const OpTy &Op)
Definition: PatternMatch.h:2146

llvm::PatternMatch::m_OneUse
OneUse_match< T > m_OneUse(const T &SubPattern)
Definition: PatternMatch.h:67

llvm::PatternMatch::m_LogicalOr
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
Definition: PatternMatch.h:3099

llvm::PatternMatch::m_Neg
BinaryOp_match< cst_pred_ty< is_zero_int >, ValTy, Instruction::Sub > m_Neg(const ValTy &V)
Matches a 'Neg' as 'sub 0, V'.
Definition: PatternMatch.h:2820

llvm::PatternMatch::m_Shuffle
TwoOps_match< V1_t, V2_t, Instruction::ShuffleVector > m_Shuffle(const V1_t &v1, const V2_t &v2)
Matches ShuffleVectorInst independently of mask value.
Definition: PatternMatch.h:1911

llvm::PatternMatch::m_ImmConstant
match_combine_and< class_match< Constant >, match_unless< constantexpr_match > > m_ImmConstant()
Match an arbitrary immediate Constant and ignore it.
Definition: PatternMatch.h:864

llvm::PatternMatch::m_c_Select
ThreeOps_match< decltype(m_Value()), LHS, RHS, Instruction::Select, true > m_c_Select(const LHS &L, const RHS &R)
Match Select(C, LHS, RHS) or Select(C, RHS, LHS)
Definition: PatternMatch.h:1815

llvm::PatternMatch::m_FPExt
CastInst_match< OpTy, FPExtInst > m_FPExt(const OpTy &Op)
Definition: PatternMatch.h:2176

llvm::PatternMatch::m_SpecificICmp
SpecificCmpClass_match< LHS, RHS, ICmpInst > m_SpecificICmp(CmpPredicate MatchPred, const LHS &L, const RHS &R)
Definition: PatternMatch.h:1690

llvm::PatternMatch::m_ZExt
CastInst_match< OpTy, ZExtInst > m_ZExt(const OpTy &Op)
Matches ZExt.
Definition: PatternMatch.h:2107

llvm::PatternMatch::m_NUWShl
OverflowingBinaryOp_match< LHS, RHS, Instruction::Shl, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWShl(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1348

llvm::PatternMatch::m_NUWMul
OverflowingBinaryOp_match< LHS, RHS, Instruction::Mul, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWMul(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1340

llvm::PatternMatch::m_UMax
MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty > m_UMax(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2354

llvm::PatternMatch::m_NegatedPower2
cst_pred_ty< is_negated_power2 > m_NegatedPower2()
Match a integer or vector negated power-of-2.
Definition: PatternMatch.h:627

llvm::PatternMatch::m_CheckedInt
cst_pred_ty< custom_checkfn< APInt > > m_CheckedInt(function_ref< bool(const APInt &)> CheckFn)
Match an integer or vector where CheckFn(ele) for each element is true.
Definition: PatternMatch.h:481

llvm::PatternMatch::m_FShl
m_Intrinsic_Ty< Opnd0, Opnd1, Opnd2 >::Ty m_FShl(const Opnd0 &Op0, const Opnd1 &Op1, const Opnd2 &Op2)
Definition: PatternMatch.h:2725

llvm::PatternMatch::m_c_MaxOrMin
match_combine_or< match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty, true >, MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty, true > >, match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty, true >, MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty, true > > > m_c_MaxOrMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2864

llvm::PatternMatch::m_UnOp
class_match< UnaryOperator > m_UnOp()
Match an arbitrary unary operation and ignore it.
Definition: PatternMatch.h:95

llvm::PatternMatch::m_NUWSub
OverflowingBinaryOp_match< LHS, RHS, Instruction::Sub, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWSub(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1332

llvm::PatternMatch::m_SMax
MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty > m_SMax(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2342

llvm::PatternMatch::m_APInt
apint_match m_APInt(const APInt *&Res)
Match a ConstantInt or splatted ConstantVector, binding the specified pointer to the contained APInt.
Definition: PatternMatch.h:299

llvm::PatternMatch::m_NSWAddLike
match_combine_or< OverflowingBinaryOp_match< LHS, RHS, Instruction::Add, OverflowingBinaryOperator::NoSignedWrap >, DisjointOr_match< LHS, RHS > > m_NSWAddLike(const LHS &L, const RHS &R)
Match either "add nsw" or "or disjoint".
Definition: PatternMatch.h:1419

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition: PatternMatch.h:92

llvm::PatternMatch::m_LShr
BinaryOp_match< LHS, RHS, Instruction::LShr > m_LShr(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1240

llvm::PatternMatch::m_Exact
Exact_match< T > m_Exact(const T &SubPattern)
Definition: PatternMatch.h:1580

llvm::PatternMatch::m_FNeg
FNeg_match< OpTy > m_FNeg(const OpTy &X)
Match 'fneg X' as 'fsub -0.0, X'.
Definition: PatternMatch.h:1156

llvm::PatternMatch::m_Shift
BinOpPred_match< LHS, RHS, is_shift_op > m_Shift(const LHS &L, const RHS &R)
Matches shift operations.
Definition: PatternMatch.h:1518

llvm::PatternMatch::m_PosZeroFP
cstfp_pred_ty< is_pos_zero_fp > m_PosZeroFP()
Match a floating-point positive zero.
Definition: PatternMatch.h:773

llvm::PatternMatch::m_Shl
BinaryOp_match< LHS, RHS, Instruction::Shl > m_Shl(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1234

llvm::PatternMatch::m_VecReverse
m_Intrinsic_Ty< Opnd0 >::Ty m_VecReverse(const Opnd0 &Op0)
Definition: PatternMatch.h:2747

llvm::PatternMatch::m_APFloat
apfloat_match m_APFloat(const APFloat *&Res)
Match a ConstantFP or splatted ConstantVector, binding the specified pointer to the contained APFloat...
Definition: PatternMatch.h:316

llvm::PatternMatch::m_LogicalAnd
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
Definition: PatternMatch.h:3081

llvm::PatternMatch::m_MaxOrMin
match_combine_or< match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > >, match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > > > m_MaxOrMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2371

llvm::PatternMatch::m_FShr
m_Intrinsic_Ty< Opnd0, Opnd1, Opnd2 >::Ty m_FShr(const Opnd0 &Op0, const Opnd1 &Op1, const Opnd2 &Op2)
Definition: PatternMatch.h:2731

llvm::PatternMatch::m_SRem
BinaryOp_match< LHS, RHS, Instruction::SRem > m_SRem(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1204

llvm::PatternMatch::m_Undef
auto m_Undef()
Match an arbitrary undef constant.
Definition: PatternMatch.h:152

llvm::PatternMatch::m_Not
BinaryOp_match< cst_pred_ty< is_all_ones >, ValTy, Instruction::Xor, true > m_Not(const ValTy &V)
Matches a 'Not' as 'xor V, -1' or 'xor -1, V'.
Definition: PatternMatch.h:2467

llvm::PatternMatch::m_BSwap
m_Intrinsic_Ty< Opnd0 >::Ty m_BSwap(const Opnd0 &Op0)
Definition: PatternMatch.h:2697

llvm::PatternMatch::m_SExt
CastInst_match< OpTy, SExtInst > m_SExt(const OpTy &Op)
Matches SExt.
Definition: PatternMatch.h:2101

llvm::PatternMatch::m_Zero
is_zero m_Zero()
Match any null constant or a vector with all elements equal to 0.
Definition: PatternMatch.h:612

llvm::PatternMatch::m_c_Or
BinaryOp_match< LHS, RHS, Instruction::Or, true > m_c_Or(const LHS &L, const RHS &R)
Matches an Or with LHS and RHS in either order.
Definition: PatternMatch.h:2805

llvm::PatternMatch::m_NUWAddLike
match_combine_or< OverflowingBinaryOp_match< LHS, RHS, Instruction::Add, OverflowingBinaryOperator::NoUnsignedWrap >, DisjointOr_match< LHS, RHS > > m_NUWAddLike(const LHS &L, const RHS &R)
Match either "add nuw" or "or disjoint".
Definition: PatternMatch.h:1429

llvm::PatternMatch::m_BitwiseLogic
BinOpPred_match< LHS, RHS, is_bitwiselogic_op > m_BitwiseLogic(const LHS &L, const RHS &R)
Matches bitwise logic operations.
Definition: PatternMatch.h:1540

llvm::PatternMatch::m_FAbs
m_Intrinsic_Ty< Opnd0 >::Ty m_FAbs(const Opnd0 &Op0)
Definition: PatternMatch.h:2702

llvm::PatternMatch::m_c_Mul
BinaryOp_match< LHS, RHS, Instruction::Mul, true > m_c_Mul(const LHS &L, const RHS &R)
Matches a Mul with LHS and RHS in either order.
Definition: PatternMatch.h:2791

llvm::PatternMatch::m_CopySign
m_Intrinsic_Ty< Opnd0, Opnd1 >::Ty m_CopySign(const Opnd0 &Op0, const Opnd1 &Op1)
Definition: PatternMatch.h:2741

llvm::PatternMatch::m_PtrToInt
CastOperator_match< OpTy, Instruction::PtrToInt > m_PtrToInt(const OpTy &Op)
Matches PtrToInt.
Definition: PatternMatch.h:2056

llvm::PatternMatch::m_UMin
MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > m_UMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2360

llvm::PatternMatch::m_CombineOr
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
Definition: PatternMatch.h:239

llvm::SyncScope::SingleThread
@ SingleThread
Synchronized with respect to signal handlers executing in the same thread.
Definition: LLVMContext.h:54

llvm::SyncScope::System
@ System
Synchronized with respect to all concurrently executing threads.
Definition: LLVMContext.h:57

llvm::X86::FirstMacroFusionInstKind::AddSub
@ AddSub

llvm::at::getAssignmentMarkers
AssignmentMarkerRange getAssignmentMarkers(DIAssignID *ID)
Return a range of dbg.assign intrinsics which use \ID as an operand.
Definition: DebugInfo.cpp:1867

llvm::at::getDVRAssignmentMarkers
SmallVector< DbgVariableRecord * > getDVRAssignmentMarkers(const Instruction *Inst)
Definition: DebugInfo.h:240

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:443

llvm::codeview::EncodedFramePtrReg::BasePtr
@ BasePtr

llvm::logicalview::LVAttributeKind::Inserted
@ Inserted

llvm::logicalview::LVAttributeKind::Zero
@ Zero

llvm::ms_demangle::QualifierMangleMode::Result
@ Result

llvm::numbers::e
constexpr double e
Definition: MathExtras.h:48

llvm::ore::NV
DiagnosticInfoOptimizationBase::Argument NV
Definition: OptimizationRemarkEmitter.h:135

llvm::pdb::PDB_SymType::Caller
@ Caller

llvm::pdb::PDB_SymType::Callee
@ Callee

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::EnableKnowledgeRetention
cl::opt< bool > EnableKnowledgeRetention

llvm::getInverseMinMaxIntrinsic
Intrinsic::ID getInverseMinMaxIntrinsic(Intrinsic::ID MinMaxID)
Definition: ValueTracking.cpp:9140

llvm::Log2_32_Ceil
unsigned Log2_32_Ceil(uint32_t Value)
Return the ceil log base 2 of the specified value, 32 if the value is zero.
Definition: MathExtras.h:355

llvm::Offset
@ Offset
Definition: DWP.cpp:480

llvm::OverflowResult
OverflowResult
Definition: ValueTracking.h:899

llvm::OverflowResult::NeverOverflows
@ NeverOverflows
Never overflows.

llvm::OverflowResult::AlwaysOverflowsHigh
@ AlwaysOverflowsHigh
Always overflows in the direction of signed/unsigned max value.

llvm::OverflowResult::AlwaysOverflowsLow
@ AlwaysOverflowsLow
Always overflows in the direction of signed/unsigned min value.

llvm::OverflowResult::MayOverflow
@ MayOverflow
May or may not overflow.

llvm::for_each
UnaryFunction for_each(R &&Range, UnaryFunction F)
Provide wrappers to std::for_each which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1732

llvm::simplifyFMulInst
Value * simplifyFMulInst(Value *LHS, Value *RHS, FastMathFlags FMF, const SimplifyQuery &Q, fp::ExceptionBehavior ExBehavior=fp::ebIgnore, RoundingMode Rounding=RoundingMode::NearestTiesToEven)
Given operands for an FMul, fold the result or return null.
Definition: InstructionSimplify.cpp:5896

llvm::isValidAssumeForContext
bool isValidAssumeForContext(const Instruction *I, const Instruction *CxtI, const DominatorTree *DT=nullptr, bool AllowEphemerals=false)
Return true if it is valid to use the assumptions provided by an assume intrinsic,...
Definition: ValueTracking.cpp:509

llvm::isSafeToSpeculativelyExecuteWithVariableReplaced
bool isSafeToSpeculativelyExecuteWithVariableReplaced(const Instruction *I)
Don't use information from its non-constant operands.
Definition: ValueTracking.h:847

llvm::possiblyDemandedEltsInMask
APInt possiblyDemandedEltsInMask(Value *Mask)
Given a mask vector of the form <Y x i1>, return an APInt (of bitwidth Y) for each lane which may be ...
Definition: VectorUtils.cpp:1202

llvm::simplifyRetainedKnowledge
RetainedKnowledge simplifyRetainedKnowledge(AssumeInst *Assume, RetainedKnowledge RK, AssumptionCache *AC, DominatorTree *DT)
canonicalize the RetainedKnowledge RK.
Definition: AssumeBundleBuilder.cpp:319

llvm::isRemovableAlloc
bool isRemovableAlloc(const CallBase *V, const TargetLibraryInfo *TLI)
Return true if this is a call to an allocation function that does not have side effects that we are r...
Definition: MemoryBuiltins.cpp:330

llvm::lowerObjectSizeCall
Value * lowerObjectSizeCall(IntrinsicInst *ObjectSize, const DataLayout &DL, const TargetLibraryInfo *TLI, bool MustSucceed)
Try to turn a call to @llvm.objectsize into an integer value of the given Type.
Definition: MemoryBuiltins.cpp:589

llvm::getAllocAlignment
Value * getAllocAlignment(const CallBase *V, const TargetLibraryInfo *TLI)
Gets the alignment argument for an aligned_alloc-like function, using either built-in knowledge based...
Definition: MemoryBuiltins.cpp:341

llvm::maximum
LLVM_READONLY APFloat maximum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximum semantics.
Definition: APFloat.h:1604

llvm::getUnderlyingObject
const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=6)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
Definition: ValueTracking.cpp:6768

llvm::simplifyCall
Value * simplifyCall(CallBase *Call, Value *Callee, ArrayRef< Value * > Args, const SimplifyQuery &Q)
Given a callsite, callee, and arguments, fold the result or return null.
Definition: InstructionSimplify.cpp:7005

llvm::ConstantFoldCompareInstOperands
Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
Definition: ConstantFolding.cpp:1186

llvm::alignDown
constexpr T alignDown(U Value, V Align, W Skew=0)
Returns the largest unsigned integer less than or equal to Value and is Skew mod Align.
Definition: MathExtras.h:557

llvm::isPowerOf2_64
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
Definition: MathExtras.h:298

llvm::isAssumeWithEmptyBundle
bool isAssumeWithEmptyBundle(const AssumeInst &Assume)
Return true iff the operand bundles of the provided llvm.assume doesn't contain any valuable informat...
Definition: AssumeBundleQueries.cpp:128

llvm::getSplatValue
Value * getSplatValue(const Value *V)
Get splat value if the input is a splat vector or return nullptr.
Definition: VectorUtils.cpp:312

llvm::MinAlign
constexpr T MinAlign(U A, V B)
A and B are either alignments or offsets.
Definition: MathExtras.h:368

llvm::getKnowledgeFromBundle
RetainedKnowledge getKnowledgeFromBundle(AssumeInst &Assume, const CallBase::BundleOpInfo &BOI)
This extracts the Knowledge from an element of an operand bundle.
Definition: AssumeBundleQueries.cpp:99

llvm::getKnownAlignment
Align getKnownAlignment(Value *V, const DataLayout &DL, const Instruction *CxtI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr)
Try to infer an alignment for the specified pointer.
Definition: Local.h:242

llvm::isSplatValue
bool isSplatValue(const Value *V, int Index=-1, unsigned Depth=0)
Return true if each element of the vector value V is poisoned or equal to every other non-poisoned el...
Definition: VectorUtils.cpp:327

llvm::maxnum
LLVM_READONLY APFloat maxnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2019 maximumNumber semantics.
Definition: APFloat.h:1563

llvm::HexPrintStyle::Upper
@ Upper

llvm::HexPrintStyle::Lower
@ Lower

llvm::fneg
FPClassTest fneg(FPClassTest Mask)
Return the test mask which returns true if the value's sign bit is flipped.
Definition: FloatingPointMode.cpp:14

llvm::SelectPatternFlavor
SelectPatternFlavor
Specific patterns of select instructions we can match.
Definition: ValueTracking.h:1113

llvm::SPF_ABS
@ SPF_ABS
Floating point maxnum.
Definition: ValueTracking.h:1121

llvm::SPF_NABS
@ SPF_NABS
Absolute value.
Definition: ValueTracking.h:1122

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition: MathExtras.h:293

llvm::isModSet
bool isModSet(const ModRefInfo MRI)
Definition: ModRef.h:48

llvm::ComplexDeinterleavingOperation::Splat
@ Splat

llvm::FPClassTest
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
Definition: FloatingPointMode.h:239

llvm::fcInf
@ fcInf
Definition: FloatingPointMode.h:254

llvm::fcNegSubnormal
@ fcNegSubnormal
Definition: FloatingPointMode.h:246

llvm::fcPosNormal
@ fcPosNormal
Definition: FloatingPointMode.h:250

llvm::fcNegZero
@ fcNegZero
Definition: FloatingPointMode.h:247

llvm::fcNegInf
@ fcNegInf
Definition: FloatingPointMode.h:244

llvm::fcSubnormal
@ fcSubnormal
Definition: FloatingPointMode.h:256

llvm::fcNone
@ fcNone
Definition: FloatingPointMode.h:240

llvm::fcPositive
@ fcPositive
Definition: FloatingPointMode.h:261

llvm::fcPosZero
@ fcPosZero
Definition: FloatingPointMode.h:248

llvm::fcNegNormal
@ fcNegNormal
Definition: FloatingPointMode.h:245

llvm::fcZero
@ fcZero
Definition: FloatingPointMode.h:257

llvm::fcNegative
@ fcNegative
Definition: FloatingPointMode.h:262

llvm::fcAllFlags
@ fcAllFlags
Definition: FloatingPointMode.h:264

llvm::fcPosSubnormal
@ fcPosSubnormal
Definition: FloatingPointMode.h:249

llvm::fcPosInf
@ fcPosInf
Definition: FloatingPointMode.h:251

llvm::fcNan
@ fcNan
Definition: FloatingPointMode.h:253

llvm::None
@ None
Definition: CodeGenData.h:106

llvm::matchSelectPattern
SelectPatternResult matchSelectPattern(Value *V, Value *&LHS, Value *&RHS, Instruction::CastOps *CastOp=nullptr, unsigned Depth=0)
Pattern match integer [SU]MIN, [SU]MAX and ABS idioms, returning the kind and providing the out param...
Definition: ValueTracking.cpp:9047

llvm::NullPointerIsDefined
bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
Definition: Function.cpp:1187

llvm::dbgs
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163

llvm::none_of
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1753

llvm::isAtLeastOrStrongerThan
bool isAtLeastOrStrongerThan(AtomicOrdering AO, AtomicOrdering Other)
Definition: AtomicOrdering.h:106

llvm::buildAssumeFromKnowledge
AssumeInst * buildAssumeFromKnowledge(ArrayRef< RetainedKnowledge > Knowledge, Instruction *CtxI, AssumptionCache *AC=nullptr, DominatorTree *DT=nullptr)
Build and return a new assume created from the provided knowledge if the knowledge in the assume is f...
Definition: AssumeBundleBuilder.cpp:310

llvm::isSafeToSpeculativelyExecute
bool isSafeToSpeculativelyExecute(const Instruction *I, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr, bool UseVariableInfo=true)
Return true if the instruction does not have any effects besides calculating the result and does not ...
Definition: ValueTracking.cpp:7043

llvm::inverse_fabs
FPClassTest inverse_fabs(FPClassTest Mask)
Return the test mask which returns true after fabs is applied to the value.
Definition: FloatingPointMode.cpp:35

llvm::isNotCrossLaneOperation
bool isNotCrossLaneOperation(const Instruction *I)
Return true if the instruction doesn't potentially cross vector lanes.
Definition: ValueTracking.cpp:7035

llvm::maskIsAllOneOrUndef
bool maskIsAllOneOrUndef(Value *Mask)
Given a mask vector of i1, Return true if all of the elements of this predicate mask are known to be ...
Definition: VectorUtils.cpp:1149

llvm::ConstantFoldBinaryOpOperands
Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
Definition: ConstantFolding.cpp:1300

llvm::isKnownNonZero
bool isKnownNonZero(const Value *V, const SimplifyQuery &Q, unsigned Depth=0)
Return true if the given value is known to be non-zero when defined.
Definition: ValueTracking.cpp:3487

llvm::PoisonMaskElem
constexpr int PoisonMaskElem
Definition: Instructions.h:1889

llvm::AtomicOrdering::Unordered
@ Unordered

llvm::ModRefInfo::Mod
@ Mod
The access may modify the value stored in memory.

llvm::simplifyFMAFMul
Value * simplifyFMAFMul(Value *LHS, Value *RHS, FastMathFlags FMF, const SimplifyQuery &Q, fp::ExceptionBehavior ExBehavior=fp::ebIgnore, RoundingMode Rounding=RoundingMode::NearestTiesToEven)
Given operands for the multiplication of a FMA, fold the result or return null.
Definition: InstructionSimplify.cpp:5904

llvm::IRMemLocation::Other
@ Other
Any other memory.

llvm::simplifyConstrainedFPCall
Value * simplifyConstrainedFPCall(CallBase *Call, const SimplifyQuery &Q)
Given a constrained FP intrinsic call, tries to compute its simplified version.
Definition: InstructionSimplify.cpp:7031

llvm::minnum
LLVM_READONLY APFloat minnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2019 minimumNumber semantics.
Definition: APFloat.h:1549

llvm::RecurKind::And
@ And
Bitwise or logical AND of integers.

llvm::RecurKind::Add
@ Add
Sum of integers.

llvm::computeConstantRangeIncludingKnownBits
ConstantRange computeConstantRangeIncludingKnownBits(const WithCache< const Value * > &V, bool ForSigned, const SimplifyQuery &SQ)
Combine constant ranges from computeConstantRange() and computeKnownBits().
Definition: ValueTracking.cpp:7189

llvm::computeKnownBits
void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, unsigned Depth=0, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
Definition: ValueTracking.cpp:164

llvm::getFreedOperand
Value * getFreedOperand(const CallBase *CB, const TargetLibraryInfo *TLI)
If this if a call to a free function, return the freed operand.
Definition: MemoryBuiltins.cpp:545

llvm::BitWidth
constexpr unsigned BitWidth
Definition: BitmaskEnum.h:217

llvm::isDereferenceablePointer
bool isDereferenceablePointer(const Value *V, Type *Ty, const DataLayout &DL, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr)
Return true if this is always a dereferenceable pointer.
Definition: Loads.cpp:236

llvm::is_contained
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
Definition: STLExtras.h:1903

llvm::getAllocSize
std::optional< APInt > getAllocSize(const CallBase *CB, const TargetLibraryInfo *TLI, function_ref< const Value *(const Value *)> Mapper=[](const Value *V) { return V;})
Return the size of the requested allocation.
Definition: MemoryBuiltins.cpp:367

llvm::computeKnownFPSignBit
std::optional< bool > computeKnownFPSignBit(const Value *V, unsigned Depth, const SimplifyQuery &SQ)
Return false if we can prove that the specified FP value's sign bit is 0.
Definition: ValueTracking.h:610

llvm::Log2
unsigned Log2(Align A)
Returns the log2 of the alignment.
Definition: Alignment.h:208

llvm::maskContainsAllOneOrUndef
bool maskContainsAllOneOrUndef(Value *Mask)
Given a mask vector of i1, Return true if any of the elements of this predicate mask are known to be ...
Definition: VectorUtils.cpp:1175

llvm::isImpliedByDomCondition
std::optional< bool > isImpliedByDomCondition(const Value *Cond, const Instruction *ContextI, const DataLayout &DL)
Return the boolean condition value in the context of the given instruction if it is known based on do...
Definition: ValueTracking.cpp:9680

llvm::minimum
LLVM_READONLY APFloat minimum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimum semantics.
Definition: APFloat.h:1577

llvm::isKnownNegation
bool isKnownNegation(const Value *X, const Value *Y, bool NeedNSW=false, bool AllowPoison=true)
Return true if the two given values are negation.
Definition: ValueTracking.cpp:8571

llvm::Data
@ Data
Definition: SIMachineScheduler.h:55

llvm::isKnownNonNegative
bool isKnownNonNegative(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Returns true if the give value is known to be non-negative.
Definition: ValueTracking.cpp:292

std::swap
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition: BitVector.h:860

raw_ostream.h

NC
#define NC
Definition: regutils.h:42

llvm::AAMDNodes
A collection of metadata nodes that might be associated with a memory access used by the alias-analys...
Definition: Metadata.h:764

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::BitTracker
Definition: BitTracker.h:35

llvm::DenormalMode::IEEE
@ IEEE
IEEE-754 denormal numbers preserved.
Definition: FloatingPointMode.h:77

llvm::KnownBits
Definition: KnownBits.h:23

llvm::KnownBits::isNonNegative
bool isNonNegative() const
Returns true if this value is known to be non-negative.
Definition: KnownBits.h:100

llvm::KnownBits::countMinTrailingZeros
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
Definition: KnownBits.h:234

llvm::KnownBits::countMaxTrailingZeros
unsigned countMaxTrailingZeros() const
Returns the maximum number of trailing zero bits possible.
Definition: KnownBits.h:266

llvm::KnownBits::countMaxPopulation
unsigned countMaxPopulation() const
Returns the maximum number of bits that could be one.
Definition: KnownBits.h:281

llvm::KnownBits::getBitWidth
unsigned getBitWidth() const
Get the bit width of this value.
Definition: KnownBits.h:43

llvm::KnownBits::isNonZero
bool isNonZero() const
Returns true if this value is known to be non-zero.
Definition: KnownBits.h:103

llvm::KnownBits::countMinLeadingZeros
unsigned countMinLeadingZeros() const
Returns the minimum number of leading zero bits.
Definition: KnownBits.h:240

llvm::KnownBits::isNegative
bool isNegative() const
Returns true if this value is known to be negative.
Definition: KnownBits.h:97

llvm::KnownBits::countMaxLeadingZeros
unsigned countMaxLeadingZeros() const
Returns the maximum number of leading zero bits possible.
Definition: KnownBits.h:272

llvm::KnownBits::One
APInt One
Definition: KnownBits.h:25

llvm::KnownBits::Zero
APInt Zero
Definition: KnownBits.h:24

llvm::KnownBits::countMinPopulation
unsigned countMinPopulation() const
Returns the number of bits known to be one.
Definition: KnownBits.h:278

llvm::KnownBits::isAllOnes
bool isAllOnes() const
Returns true if value is all one bits.
Definition: KnownBits.h:82

llvm::KnownFPClass
Definition: ValueTracking.h:261

llvm::KnownFPClass::KnownFPClasses
FPClassTest KnownFPClasses
Floating-point classes the value could be one of.
Definition: ValueTracking.h:263

llvm::MaybeAlign
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Definition: Alignment.h:117

llvm::MaybeAlign::valueOrOne
Align valueOrOne() const
For convenience, returns a valid alignment or 1 if undefined.
Definition: Alignment.h:141

llvm::MinMax
Definition: AssumeBundleQueries.h:70

llvm::OperandBundleUse
A lightweight accessor for an operand bundle meant to be passed around by value.
Definition: InstrTypes.h:1007

llvm::OperandBundleUse::getTagName
StringRef getTagName() const
Return the tag of this operand bundle as a string.
Definition: InstrTypes.h:1026

llvm::OperandBundleUse::Inputs
ArrayRef< Use > Inputs
Definition: InstrTypes.h:1008

llvm::PatternMatch::m_Mask
Definition: PatternMatch.h:1859

llvm::PatternMatch::m_SpecificMask
Definition: PatternMatch.h:1874

llvm::RetainedKnowledge
Represent one information held inside an operand bundle of an llvm.assume.
Definition: AssumeBundleQueries.h:99

llvm::RetainedKnowledge::AttrKind
Attribute::AttrKind AttrKind
Definition: AssumeBundleQueries.h:100

llvm::RetainedKnowledge::ArgValue
uint64_t ArgValue
Definition: AssumeBundleQueries.h:101

llvm::RetainedKnowledge::WasOn
Value * WasOn
Definition: AssumeBundleQueries.h:102

llvm::SelectPatternResult::Flavor
SelectPatternFlavor Flavor
Definition: ValueTracking.h:1137

llvm::SimplifyQuery
Definition: SimplifyQuery.h:70

llvm::SimplifyQuery::DL
const DataLayout & DL
Definition: SimplifyQuery.h:71

llvm::SimplifyQuery::CxtI
const Instruction * CxtI
Definition: SimplifyQuery.h:75

llvm::SimplifyQuery::getWithInstruction
SimplifyQuery getWithInstruction(const Instruction *I) const
Definition: SimplifyQuery.h:107

llvm::UnderlyingObject
Definition: ScheduleDAGInstrs.h:104

llvm::cl::desc
Definition: CommandLine.h:409