doxygen/TargetTransformInfo%5F8h%5Fsource.html

//===- TargetTransformInfo.h ------------------------------------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

/// \file

/// This pass exposes codegen information to IR-level passes. Every

/// transformation that uses codegen information is broken into three parts:

/// 1. The IR-level analysis pass.

/// 2. The IR-level transformation interface which provides the needed

///    information.

/// 3. Codegen-level implementation which uses target-specific hooks.

///

/// This file defines #2, which is the interface that IR-level transformations

/// use for querying the codegen.

///

//===----------------------------------------------------------------------===//


#ifndef LLVM_ANALYSIS_TARGETTRANSFORMINFO_H

#define LLVM_ANALYSIS_TARGETTRANSFORMINFO_H


#include "llvm/ADT/APInt.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/ADT/BitmaskEnum.h"

#include "llvm/ADT/Uniformity.h"

#include "llvm/Analysis/IVDescriptors.h"

#include "llvm/Analysis/InterestingMemoryOperand.h"

#include "llvm/IR/FMF.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/PassManager.h"

#include "llvm/Pass.h"

#include "llvm/Support/AtomicOrdering.h"

#include "llvm/Support/BranchProbability.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/InstructionCost.h"

#include <functional>

#include <optional>

#include <utility>


namespace llvm {


namespace Intrinsic {
/// Identifier type for intrinsics; an alias of plain `unsigned`.
/// NOTE(review): presumably mirrors the declaration in the intrinsics header
/// so that header need not be included here - confirm they stay in sync.
using ID = unsigned;
} // namespace Intrinsic


// Forward declarations. Classes are listed alphabetically, followed by the
// one struct.
class AllocaInst;
class AssumptionCache;
class BlockFrequencyInfo;
class BranchInst;
class DominatorTree;
class Function;
class GlobalValue;
class InstCombiner;
class InterleavedAccessInfo;
class IntrinsicInst;
class LoadInst;
class Loop;
class LoopInfo;
class LoopVectorizationLegality;
class OptimizationRemarkEmitter;
class ProfileSummaryInfo;
class RecurrenceDescriptor;
class SCEV;
class ScalarEvolution;
class SmallBitVector;
class StoreInst;
class SwitchInst;
class TargetLibraryInfo;
class Type;
class VPIntrinsic;
struct KnownBits;


/// Information about a load/store intrinsic defined by the target.


struct MemIntrinsicInfo {
  /// Pointer the intrinsic reads from or writes to. When non-null, analysis
  /// and optimization passes may treat the intrinsic as functionally
  /// equivalent to a load/store through this pointer.
  Value *PtrVal = nullptr;

  /// Ordering for atomic operations; NotAtomic unless overridden.
  AtomicOrdering Ordering = AtomicOrdering::NotAtomic;

  /// The target sets the same id on load and store intrinsics that
  /// correspond to each other.
  unsigned short MatchingId = 0;

  bool ReadMem = false;
  bool WriteMem = false;
  bool IsVolatile = false;

  SmallVector<InterestingMemoryOperand, 1> InterestingOperands;

  /// \returns true when the access is not volatile and its ordering is either
  /// NotAtomic or Unordered.
  bool isUnordered() const {
    if (IsVolatile)
      return false;
    return Ordering == AtomicOrdering::NotAtomic ||
           Ordering == AtomicOrdering::Unordered;
  }
};


/// Attributes of a target dependent hardware loop.


struct HardwareLoopInfo {
  /// There is no default state: an instance is always constructed from a loop.
  HardwareLoopInfo() = delete;
  /// Declared here; the definition lives out of line.
  LLVM_ABI HardwareLoopInfo(Loop *L);
  /// NOTE(review): presumably the loop handed to the constructor - confirm
  /// against the out-of-line definition.
  Loop *L = nullptr;
  // The four members below start out null; this header does not show where
  // they are filled in.
  BasicBlock *ExitBlock = nullptr;
  BranchInst *ExitBranch = nullptr;
  const SCEV *ExitCount = nullptr;
  IntegerType *CountType = nullptr;
  /// Decrement the loop counter by this value in every iteration.
  Value *LoopDecrement = nullptr;
  /// Can a hardware loop be a parent to another hardware loop?
  bool IsNestingLegal = false;
  /// Should the loop counter be updated in the loop via a phi?
  bool CounterInReg = false;
  /// Generate the intrinsic which also performs icmp ne zero on the loop
  /// counter value and produces an i1 to guard the loop entry.
  bool PerformEntryTest = false;
  /// Declared here; the definition lives out of line. Both Force* flags
  /// default to false.
  LLVM_ABI bool isHardwareLoopCandidate(ScalarEvolution &SE, LoopInfo &LI,
                                        DominatorTree &DT,
                                        bool ForceNestedLoop = false,
                                        bool ForceHardwareLoopPHI = false);
  /// Declared here; the definition lives out of line.
  LLVM_ABI bool canAnalyze(LoopInfo &LI);
};


/// Information for memory intrinsic cost model.


class MemIntrinsicCostAttributes {
  /// Context instruction (e.g. the load/store that would be transformed into
  /// the intrinsic); null when there is none.
  const Instruction *I = nullptr;

  /// Memory address being accessed.
  const Value *Ptr = nullptr;

  /// Vector type of the data that is loaded or stored.
  Type *DataTy = nullptr;

  /// Which memory intrinsic is being costed.
  Intrinsic::ID IID;

  /// Whether the access is predicated by a mask that is not a compile-time
  /// constant.
  bool VariableMask = true;

  /// Address space of the pointer.
  unsigned AddressSpace = 0;

  /// Alignment of a single element.
  Align Alignment;

public:
  /// Describes an access through the explicit pointer \p Ptr. The address
  /// space keeps its default of 0.
  LLVM_ABI MemIntrinsicCostAttributes(Intrinsic::ID Id, Type *DataTy,
                                      const Value *Ptr, bool VariableMask,
                                      Align Alignment,
                                      const Instruction *I = nullptr)
      : I(I), Ptr(Ptr), DataTy(DataTy), IID(Id), VariableMask(VariableMask),
        Alignment(Alignment) {}

  /// Describes an access by data type, alignment and address space only. The
  /// pointer and context instruction stay null and VariableMask keeps its
  /// default of true.
  LLVM_ABI MemIntrinsicCostAttributes(Intrinsic::ID Id, Type *DataTy,
                                      Align Alignment,
                                      unsigned AddressSpace = 0)
      : DataTy(DataTy), IID(Id), AddressSpace(AddressSpace),
        Alignment(Alignment) {}

  /// Same as the pointer-taking constructor with a null pointer, hence the
  /// delegation.
  LLVM_ABI MemIntrinsicCostAttributes(Intrinsic::ID Id, Type *DataTy,
                                      bool VariableMask, Align Alignment,
                                      const Instruction *I = nullptr)
      : MemIntrinsicCostAttributes(Id, DataTy, /*Ptr=*/nullptr, VariableMask,
                                   Alignment, I) {}

  // Read-only accessors; each returns the stored member unchanged.
  Intrinsic::ID getID() const { return IID; }
  const Instruction *getInst() const { return I; }
  const Value *getPointer() const { return Ptr; }
  Type *getDataType() const { return DataTy; }
  bool getVariableMask() const { return VariableMask; }
  unsigned getAddressSpace() const { return AddressSpace; }
  Align getAlignment() const { return Alignment; }
};


/// Bundles the inputs of an intrinsic cost query: the intrinsic id, return
/// and parameter types, argument values, fast-math flags, an optional
/// precomputed scalarization cost and an optional TargetLibraryInfo.
class IntrinsicCostAttributes {
  const IntrinsicInst *II = nullptr;
  Type *RetTy = nullptr;
  Intrinsic::ID IID;
  SmallVector<Type *, 4> ParamTys;
  SmallVector<const Value *, 4> Arguments;
  FastMathFlags FMF;
  // If ScalarizationCost is invalid (the default, see
  // InstructionCost::getInvalid()), the cost of scalarizing the arguments and
  // the return value will be computed based on types.
  // NOTE(review): this comment used to say "UINT_MAX", which no longer
  // matches the InstructionCost-typed default below.
  InstructionCost ScalarizationCost = InstructionCost::getInvalid();
  TargetLibraryInfo const *LibInfo = nullptr;

public:
  // All four constructors are declared here and defined out of line.
  LLVM_ABI IntrinsicCostAttributes(
      Intrinsic::ID Id, const CallBase &CI,
      InstructionCost ScalarCost = InstructionCost::getInvalid(),
      bool TypeBasedOnly = false, TargetLibraryInfo const *LibInfo = nullptr);

  LLVM_ABI IntrinsicCostAttributes(
      Intrinsic::ID Id, Type *RTy, ArrayRef<Type *> Tys,
      FastMathFlags Flags = FastMathFlags(), const IntrinsicInst *I = nullptr,
      InstructionCost ScalarCost = InstructionCost::getInvalid());

  LLVM_ABI IntrinsicCostAttributes(Intrinsic::ID Id, Type *RTy,
                                   ArrayRef<const Value *> Args);

  LLVM_ABI IntrinsicCostAttributes(
      Intrinsic::ID Id, Type *RTy, ArrayRef<const Value *> Args,
      ArrayRef<Type *> Tys, FastMathFlags Flags = FastMathFlags(),
      const IntrinsicInst *I = nullptr,
      InstructionCost ScalarCost = InstructionCost::getInvalid(),
      TargetLibraryInfo const *LibInfo = nullptr);

  // Read-only accessors; each returns the stored member unchanged.
  Intrinsic::ID getID() const { return IID; }
  const IntrinsicInst *getInst() const { return II; }
  Type *getReturnType() const { return RetTy; }
  FastMathFlags getFlags() const { return FMF; }
  InstructionCost getScalarizationCost() const { return ScalarizationCost; }
  const SmallVectorImpl<const Value *> &getArgs() const { return Arguments; }
  const SmallVectorImpl<Type *> &getArgTypes() const { return ParamTys; }
  const TargetLibraryInfo *getLibInfo() const { return LibInfo; }

  /// \returns true when no argument values were recorded.
  bool isTypeBasedOnly() const {
    return Arguments.empty();
  }

  /// \returns true when a valid scalarization cost has been stored.
  bool skipScalarizationCost() const { return ScalarizationCost.isValid(); }
};


/// The available styles of tail folding.
enum class TailFoldingStyle {
  /// Don't use tail folding
  None,
  /// Use predicate only to mask operations on data in the loop.
  /// When the VL is not known to be a power-of-2, this method requires a
  /// runtime overflow check for the i + VL in the loop because it compares the
  /// scalar induction variable against the tripcount rounded up by VL which may
  /// overflow. When the VL is a power-of-2, both the increment and uprounded
  /// tripcount will overflow to 0, which does not require a runtime check
  /// since the loop is exited when the loop induction variable equals the
  /// uprounded trip-count, which are both 0.
  Data,
  /// Same as Data, but avoids using the get.active.lane.mask intrinsic to
  /// calculate the mask and instead implements this with a
  /// splat/stepvector/cmp.
  /// FIXME: Can this kind be removed now that SelectionDAGBuilder expands the
  /// active.lane.mask intrinsic when it is not natively supported?
  DataWithoutLaneMask,
  /// Use predicate to control both data and control flow.
  /// This method always requires a runtime overflow check for the i + VL
  /// increment inside the loop, because it uses the result directly in the
  /// active.lane.mask to calculate the mask for the next iteration. If the
  /// increment overflows, the mask is no longer correct.
  DataAndControlFlow,
  /// Use predicate to control both data and control flow, but modify
  /// the trip count so that a runtime overflow check can be avoided
  /// and such that the scalar epilogue loop can always be removed.
  DataAndControlFlowWithoutRuntimeCheck,
  /// Use predicated EVL instructions for tail-folding.
  /// Indicates that VP intrinsics should be used.
  DataWithEVL,
};


/// Bundle of three analysis pointers; this is the argument type of
/// TargetTransformInfo::preferPredicateOverEpilogue().
/// The pointers are stored exactly as given and never deleted by this struct.
struct TailFoldingInfo {
  TargetLibraryInfo *TLI;
  LoopVectorizationLegality *LVL;
  InterleavedAccessInfo *IAI;

  /// Stores the three pointers unchanged; no null checks are performed.
  TailFoldingInfo(TargetLibraryInfo *TLI, LoopVectorizationLegality *LVL,
                  InterleavedAccessInfo *IAI)
      : TLI(TLI), LVL(LVL), IAI(IAI) {}
};


class TargetTransformInfo;
class TargetTransformInfoImplBase;

/// Short spelling of TargetTransformInfo.
using TTI = TargetTransformInfo;


/// This pass provides access to the codegen interfaces that are needed

/// for IR-level transformations.


class TargetTransformInfo {

public:

  /// Result type of the getPartialReductionExtendKind() overloads.
  /// NOTE(review): going by the names, PR_None means "not an extension" and
  /// the other two mean sign and zero extension - confirm in the definitions.
  enum PartialReductionExtendKind { PR_None, PR_SignExtend, PR_ZeroExtend };


  /// Get the kind of extension that an instruction represents.

  LLVM_ABI static PartialReductionExtendKind

  getPartialReductionExtendKind(Instruction *I);

  /// Get the kind of extension that a cast opcode represents.

  LLVM_ABI static PartialReductionExtendKind

  getPartialReductionExtendKind(Instruction::CastOps CastOpc);


  /// Construct a TTI object using a type implementing the \c Concept

  /// API below.

  ///

  /// This is used by targets to construct a TTI wrapping their target-specific

  /// implementation that encodes appropriate costs for their target.

  LLVM_ABI explicit TargetTransformInfo(

      std::unique_ptr<const TargetTransformInfoImplBase> Impl);


  /// Construct a baseline TTI object using a minimal implementation of

  /// the \c Concept API below.

  ///

  /// The TTI implementation will reflect the information in the DataLayout

  /// provided if non-null.

  LLVM_ABI explicit TargetTransformInfo(const DataLayout &DL);


  // Provide move semantics.

  LLVM_ABI TargetTransformInfo(TargetTransformInfo &&Arg);

  LLVM_ABI TargetTransformInfo &operator=(TargetTransformInfo &&RHS);


  // We need to define the destructor out-of-line to define our sub-classes

  // out-of-line.

  LLVM_ABI ~TargetTransformInfo();


  /// Handle the invalidation of this information.

  ///

  /// When used as a result of \c TargetIRAnalysis this method will be called

  /// when the function this was computed for changes. When it returns false,

  /// the information is preserved across those changes.


  bool invalidate(Function &, const PreservedAnalyses &,
                  FunctionAnalysisManager::Invalidator &) {
    // All three arguments are intentionally unnamed and unused: the answer is
    // unconditionally "not invalidated".
    // FIXME: We should probably in some way ensure that the subtarget
    // information for a function hasn't changed.
    return false;
  }


  /// \name Generic Target Information

  /// @{


  /// The kind of cost model.

  ///

  /// There are several different cost models that can be customized by the

  /// target. The normalization of each cost model may be target specific.

  /// e.g. TCK_SizeAndLatency should be comparable to target thresholds such as

  /// those derived from MCSchedModel::LoopMicroOpBufferSize etc.


  enum TargetCostKind {
    // No explicit values are given, so the enumerators are numbered 0..3 in
    // declaration order.
    TCK_RecipThroughput, ///< Reciprocal throughput.
    TCK_Latency,         ///< The latency of instruction.
    TCK_CodeSize,        ///< Instruction code size.
    TCK_SizeAndLatency   ///< The weighted sum of size and latency.
  };


  /// Underlying constants for 'cost' values in this interface.

  ///

  /// Many APIs in this interface return a cost. This enum defines the

  /// fundamental values that should be used to interpret (and produce) those

  /// costs. The costs are returned as an int rather than a member of this

  /// enumeration because it is expected that the cost of one IR instruction

  /// may have a multiplicative factor to it or otherwise won't fit directly

  /// into the enum. Moreover, it is common to sum or average costs which works

  /// better as simple integral values. Thus this enum only provides constants.

  /// Also note that the returned costs are signed integers to make it natural

  /// to add, subtract, and test with zero (a common boundary condition). It is

  /// not expected that 2^32 is a realistic cost to be modeling at any point.

  ///

  /// Note that these costs should usually reflect the intersection of code-size

  /// cost and execution cost. A free instruction is typically one that folds

  /// into another instruction. For example, reg-to-reg moves can often be

  /// skipped by renaming the registers in the CPU, but they still are encoded

  /// and thus wouldn't be considered 'free' here.


  enum TargetCostConstants {
    // Values are spelled out explicitly because they are used as numeric
    // cost constants, not merely as distinct tags.
    TCC_Free = 0,     ///< Expected to fold away in lowering.
    TCC_Basic = 1,    ///< The cost of a typical 'add' instruction.
    TCC_Expensive = 4 ///< The cost of a 'div' instruction on x86.
  };


  /// Estimate the cost of a GEP operation when lowered.

  ///

  /// \p PointeeType is the source element type of the GEP.

  /// \p Ptr is the base pointer operand.

  /// \p Operands is the list of indices following the base pointer.

  ///

  /// \p AccessType is a hint as to what type of memory might be accessed by

  /// users of the GEP. getGEPCost will use it to determine if the GEP can be

  /// folded into the addressing mode of a load/store. If AccessType is null,

  /// then the resulting target type based off of PointeeType will be used as an

  /// approximation.

  LLVM_ABI InstructionCost

  getGEPCost(Type *PointeeType, const Value *Ptr,

             ArrayRef<const Value *> Operands, Type *AccessType = nullptr,

             TargetCostKind CostKind = TCK_SizeAndLatency) const;


  /// Describe known properties for a set of pointers.


  struct PointersChainInfo {
    /// Set when all the GEPs in the set share the same base address.
    unsigned IsSameBaseAddress : 1;
    /// The two stride flags are only meaningful when IsSameBaseAddress is set.
    /// Set when all pointers are separated by a unit stride.
    unsigned IsUnitStride : 1;
    /// Set when the distance between any two neighbouring pointers is a known
    /// value.
    unsigned IsKnownStride : 1;
    /// Remaining bits of the 32-bit word; the factories below zero them.
    unsigned Reserved : 29;

    bool isSameBase() const { return IsSameBaseAddress != 0; }
    bool isUnitStride() const { return isSameBase() && IsUnitStride != 0; }
    bool isKnownStride() const { return isSameBase() && IsKnownStride != 0; }

    /// Same base address, unit stride (which is also a known stride).
    static PointersChainInfo getUnitStride() {
      PointersChainInfo Info = {/*IsSameBaseAddress=*/1, /*IsUnitStride=*/1,
                                /*IsKnownStride=*/1, /*Reserved=*/0};
      return Info;
    }

    /// Same base address, known but non-unit stride.
    static PointersChainInfo getKnownStride() {
      PointersChainInfo Info = {/*IsSameBaseAddress=*/1, /*IsUnitStride=*/0,
                                /*IsKnownStride=*/1, /*Reserved=*/0};
      return Info;
    }

    /// Same base address, nothing known about the stride.
    static PointersChainInfo getUnknownStride() {
      PointersChainInfo Info = {/*IsSameBaseAddress=*/1, /*IsUnitStride=*/0,
                                /*IsKnownStride=*/0, /*Reserved=*/0};
      return Info;
    }
  };

  // The bit-fields are sized to fill exactly one 32-bit word.
  static_assert(sizeof(PointersChainInfo) == 4, "Was size increase justified?");


  /// Estimate the cost of a chain of pointers (typically pointer operands of a

  /// chain of loads or stores within same block) operations set when lowered.

  /// \p AccessTy is the type of the loads/stores that will ultimately use the

  /// \p Ptrs.

  LLVM_ABI InstructionCost getPointersChainCost(

      ArrayRef<const Value *> Ptrs, const Value *Base,

      const PointersChainInfo &Info, Type *AccessTy,

      TargetCostKind CostKind = TTI::TCK_RecipThroughput) const;


  /// \returns A value by which our inlining threshold should be multiplied.

  /// This is primarily used to bump up the inlining threshold wholesale on

  /// targets where calls are unusually expensive.

  ///

  /// TODO: This is a rather blunt instrument.  Perhaps altering the costs of

  /// individual classes of instructions would be better.

  LLVM_ABI unsigned getInliningThresholdMultiplier() const;


  LLVM_ABI unsigned getInliningCostBenefitAnalysisSavingsMultiplier() const;

  LLVM_ABI unsigned getInliningCostBenefitAnalysisProfitableMultiplier() const;


  /// \returns The bonus of inlining the last call to a static function.

  LLVM_ABI int getInliningLastCallToStaticBonus() const;


  /// \returns A value to be added to the inlining threshold.

  LLVM_ABI unsigned adjustInliningThreshold(const CallBase *CB) const;


  /// \returns The cost of having an Alloca in the caller if not inlined, to be

  /// added to the threshold

  LLVM_ABI unsigned getCallerAllocaCost(const CallBase *CB,

                                        const AllocaInst *AI) const;


  /// \returns Vector bonus in percent.

  ///

  /// Vector bonuses: We want to more aggressively inline vector-dense kernels

  /// and apply this bonus based on the percentage of vector instructions. A

  /// bonus is applied if the vector instructions exceed 50% and half that

  /// amount is applied if it exceeds 10%. Note that these bonuses are somewhat

  /// arbitrary and evolved over time by accident as much as because they are

  /// principled bonuses.

  /// FIXME: It would be nice to base the bonus values on something more

  /// scientific. A target may have no bonus on vector instructions.

  LLVM_ABI int getInlinerVectorBonusPercent() const;


  /// \return the expected cost of a memcpy, which could e.g. depend on the

  /// source/destination type and alignment and the number of bytes copied.

  LLVM_ABI InstructionCost getMemcpyCost(const Instruction *I) const;


  /// Returns the maximum memset / memcpy size in bytes that still makes it

  /// profitable to inline the call.

  LLVM_ABI uint64_t getMaxMemIntrinsicInlineSizeThreshold() const;


  /// \return The estimated number of case clusters when lowering \p SI.

  /// \p JTSize Set a jump table size only when \p SI is suitable for a jump

  /// table.

  LLVM_ABI unsigned

  getEstimatedNumberOfCaseClusters(const SwitchInst &SI, unsigned &JTSize,

                                   ProfileSummaryInfo *PSI,

                                   BlockFrequencyInfo *BFI) const;


  /// Estimate the cost of a given IR user when lowered.

  ///

  /// This can estimate the cost of either a ConstantExpr or Instruction when

  /// lowered.

  ///

  /// \p Operands is a list of operands which can be a result of transformations

  /// of the current operands. The number of the operands on the list must equal

  /// the number of the current operands the IR user has. Their order on the

  /// list must be the same as the order of the current operands the IR user

  /// has.

  ///

  /// The returned cost is defined in terms of \c TargetCostConstants, see its

  /// comments for a detailed explanation of the cost values.

  LLVM_ABI InstructionCost getInstructionCost(const User *U,

                                              ArrayRef<const Value *> Operands,

                                              TargetCostKind CostKind) const;


  /// This is a helper function which calls the three-argument

  /// getInstructionCost with \p Operands which are the current operands U has.


  InstructionCost getInstructionCost(const User *U,
                                     TargetCostKind CostKind) const {
    // Copy U's present operands and defer to the three-argument overload.
    SmallVector<const Value *, 4> CurrentOperands(U->operand_values());
    return getInstructionCost(U, CurrentOperands, CostKind);
  }


  /// If a branch or a select condition is skewed in one direction by more than

  /// this factor, it is very likely to be predicted correctly.

  LLVM_ABI BranchProbability getPredictableBranchThreshold() const;


  /// Returns estimated penalty of a branch misprediction in latency. Indicates

  /// how aggressive the target wants for eliminating unpredictable branches. A

  /// zero return value means extra optimization applied to them should be

  /// minimal.

  LLVM_ABI InstructionCost getBranchMispredictPenalty() const;


  /// Return true if branch divergence exists.

  ///

  /// Branch divergence has a significantly negative impact on GPU performance

  /// when threads in the same wavefront take different paths due to conditional

  /// branches.

  ///

  /// If \p F is passed, provides a context function. If \p F is known to only

  /// execute in a single threaded environment, the target may choose to skip

  /// uniformity analysis and assume all values are uniform.

  LLVM_ABI bool hasBranchDivergence(const Function *F = nullptr) const;


  /// Get target-specific uniformity information for an instruction.

  /// This allows targets to provide more fine-grained control over

  /// uniformity analysis by specifying whether specific instructions

  /// should always or never be considered uniform, or require custom

  /// operand-based analysis.

  /// \param V The value to query for uniformity information.

  /// \return InstructionUniformity.

  LLVM_ABI InstructionUniformity getInstructionUniformity(const Value *V) const;


  /// Query the target whether the specified address space cast from FromAS to

  /// ToAS is valid.

  LLVM_ABI bool isValidAddrSpaceCast(unsigned FromAS, unsigned ToAS) const;


  /// Return false if a \p AS0 address cannot possibly alias a \p AS1 address.

  LLVM_ABI bool addrspacesMayAlias(unsigned AS0, unsigned AS1) const;


  /// Returns the address space ID for a target's 'flat' address space. Note
  /// this is not necessarily the same as addrspace(0), which LLVM sometimes
  /// refers to as the generic address space. The flat address space is a
  /// generic address space that can be used to access multiple segments of
  /// memory with different address spaces. Access of a memory location
  /// through a pointer with this address space is expected to be legal but
  /// slower compared to the same memory location accessed through a pointer
  /// with a different address space.
  ///

  /// This is for targets with different pointer representations which can

  /// be converted with the addrspacecast instruction. If a pointer is converted

  /// to this address space, optimizations should attempt to replace the access

  /// with the source address space.

  ///

  /// \returns ~0u if the target does not have such a flat address space to

  /// optimize away.

  LLVM_ABI unsigned getFlatAddressSpace() const;


  /// Return any intrinsic address operand indexes which may be rewritten if

  /// they use a flat address space pointer.

  ///

  /// \returns true if the intrinsic was handled.

  LLVM_ABI bool collectFlatAddressOperands(SmallVectorImpl<int> &OpIndexes,

                                           Intrinsic::ID IID) const;


  LLVM_ABI bool isNoopAddrSpaceCast(unsigned FromAS, unsigned ToAS) const;


  /// Return true if globals in this address space can have initializers other

  /// than `undef`.

  LLVM_ABI bool

  canHaveNonUndefGlobalInitializerInAddressSpace(unsigned AS) const;


  LLVM_ABI unsigned getAssumedAddrSpace(const Value *V) const;


  LLVM_ABI bool isSingleThreaded() const;


  LLVM_ABI std::pair<const Value *, unsigned>

  getPredicatedAddrSpace(const Value *V) const;


  /// Rewrite intrinsic call \p II such that \p OldV will be replaced with \p

  /// NewV, which has a different address space. This should happen for every

  /// operand index that collectFlatAddressOperands returned for the intrinsic.

  /// \returns nullptr if the intrinsic was not handled. Otherwise, returns the

  /// new value (which may be the original \p II with modified operands).

  LLVM_ABI Value *rewriteIntrinsicWithAddressSpace(IntrinsicInst *II,

                                                   Value *OldV,

                                                   Value *NewV) const;


  /// Test whether calls to a function lower to actual program function

  /// calls.

  ///

  /// The idea is to test whether the program is likely to require a 'call'

  /// instruction or equivalent in order to call the given function.

  ///

  /// FIXME: It's not clear that this is a good or useful query API. Clients

  /// should probably move to simpler cost metrics using the above.

  /// Alternatively, we could split the cost interface into distinct code-size

  /// and execution-speed costs. This would allow modelling the core of this

  /// query more accurately as a call is a single small instruction, but

  /// incurs significant execution cost.

  LLVM_ABI bool isLoweredToCall(const Function *F) const;


  /// Plain aggregate of eight unsigned cost components; none of them has a
  /// default initializer.
  /// NOTE(review): presumably the cost tuple used by loop strength reduction,
  /// compared in member order - confirm against the users of this struct.
  struct LSRCost {
    /// TODO: Some of these could be merged. Also, a lexical ordering
    /// isn't always optimal.
    unsigned Insns;
    unsigned NumRegs;
    unsigned AddRecCost;
    unsigned NumIVMuls;
    unsigned NumBaseAdds;
    unsigned ImmCost;
    unsigned SetupCost;
    unsigned ScaleCost;
  };


  /// Parameters that control the generic loop unrolling transformation.


  struct UnrollingPreferences {
    /// The cost threshold for the unrolled loop. Should be relative to the
    /// getInstructionCost values returned by this API, and the expectation is
    /// that the unrolled loop's instructions when run through that interface
    /// should not exceed this cost. However, this is only an estimate. Also,
    /// specific loops may be unrolled even with a cost above this threshold if
    /// deemed profitable. Set this to UINT_MAX to disable the loop body cost
    /// restriction.
    unsigned Threshold;
    /// If complete unrolling will reduce the cost of the loop, we will boost
    /// the Threshold by a certain percent to allow more aggressive complete
    /// unrolling. This value provides the maximum boost percentage that we
    /// can apply to Threshold (The value should be no less than 100).
    /// BoostedThreshold = Threshold * min(RolledCost / UnrolledCost,
    ///                                    MaxPercentThresholdBoost / 100)
    /// E.g. if complete unrolling reduces the loop execution time by 50%
    /// then we boost the threshold by the factor of 2x. If unrolling is not
    /// expected to reduce the running time, then we do not increase the
    /// threshold.
    unsigned MaxPercentThresholdBoost;
    /// The cost threshold for the unrolled loop when optimizing for size (set
    /// to UINT_MAX to disable).
    unsigned OptSizeThreshold;
    /// The cost threshold for the unrolled loop, like Threshold, but used
    /// for partial/runtime unrolling (set to UINT_MAX to disable).
    unsigned PartialThreshold;
    /// The cost threshold for the unrolled loop when optimizing for size, like
    /// OptSizeThreshold, but used for partial/runtime unrolling (set to
    /// UINT_MAX to disable).
    unsigned PartialOptSizeThreshold;
    /// A forced unrolling factor (the number of concatenated bodies of the
    /// original loop in the unrolled loop body). When set to 0, the unrolling
    /// transformation will select an unrolling factor based on the current cost
    /// threshold and other factors.
    unsigned Count;
    /// Default unroll count for loops with run-time trip count.
    unsigned DefaultUnrollRuntimeCount;
    /// Set the maximum unrolling factor. The unrolling factor may be selected
    /// using the appropriate cost threshold, but may not exceed this number
    /// (set to UINT_MAX to disable). This does not apply in cases where the
    /// loop is being fully unrolled.
    unsigned MaxCount;
    /// Set the maximum upper bound of trip count. Allowing the MaxUpperBound
    /// to be overridden by a target gives more flexibility in certain cases.
    /// By default, MaxUpperBound uses UnrollMaxUpperBound, whose value is 8.
    unsigned MaxUpperBound;
    /// Set the maximum unrolling factor for full unrolling. Like MaxCount, but
    /// applies even if full unrolling is selected. This allows a target to fall
    /// back to Partial unrolling if full unrolling is above FullUnrollMaxCount.
    unsigned FullUnrollMaxCount;
    /// Represents number of instructions optimized when "back edge"
    /// becomes "fall through" in unrolled loop.
    /// For now we count a conditional branch on a backedge and a comparison
    /// feeding it.
    unsigned BEInsns;
    /// Allow partial unrolling (unrolling of loops to expand the size of the
    /// loop body, not only to eliminate small constant-trip-count loops).
    bool Partial;
    /// Allow runtime unrolling (unrolling of loops to expand the size of the
    /// loop body even when the number of loop iterations is not known at
    /// compile time).
    bool Runtime;
    /// Allow generation of a loop remainder (extra iterations after unroll).
    bool AllowRemainder;
    /// Allow emitting expensive instructions (such as divisions) when computing
    /// the trip count of a loop for runtime unrolling.
    bool AllowExpensiveTripCount;
    /// Apply loop unroll on any kind of loop
    /// (mainly to loops that fail runtime unrolling).
    bool Force;
    /// Allow using trip count upper bound to unroll loops.
    bool UpperBound;
    /// Allow unrolling of all the iterations of the runtime loop remainder.
    bool UnrollRemainder;
    /// Allow unroll and jam. Used to enable unroll and jam for the target.
    bool UnrollAndJam;
    /// Threshold for unroll and jam, for inner loop size. The 'Threshold'
    /// value above is used during unroll and jam for the outer loop size.
    /// This value is used in the same manner to limit the size of the inner
    /// loop.
    unsigned UnrollAndJamInnerLoopThreshold;
    /// Don't allow loop unrolling to simulate more than this number of
    /// iterations when checking full unroll profitability
    unsigned MaxIterationsCountToAnalyze;
    /// Don't disable runtime unroll for the loops which were vectorized.
    /// This is the only member with an in-class default (false).
    bool UnrollVectorizedLoop = false;
    /// Don't allow runtime unrolling if expanding the trip count takes more
    /// than SCEVExpansionBudget.
    unsigned SCEVExpansionBudget;
    /// Allow runtime unrolling multi-exit loops. Should only be set if the
    /// target determined that multi-exit unrolling is profitable for the loop.
    /// Fall back to the generic logic to determine whether multi-exit unrolling
    /// is profitable if set to false.
    bool RuntimeUnrollMultiExit;
    /// Allow unrolling to add parallel reduction phis.
    bool AddAdditionalAccumulators;
  };


  /// Get target-customized preferences for the generic loop unrolling

  /// transformation. The caller will initialize UP with the current

  /// target-independent defaults.

  LLVM_ABI void getUnrollingPreferences(Loop *L, ScalarEvolution &,

                                        UnrollingPreferences &UP,

                                        OptimizationRemarkEmitter *ORE) const;


  /// Query the target whether it would be profitable to convert the given loop

  /// into a hardware loop.

  LLVM_ABI bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE,

                                         AssumptionCache &AC,

                                         TargetLibraryInfo *LibInfo,

                                         HardwareLoopInfo &HWLoopInfo) const;


  /// Query the target for the minimum vectorization factor at which epilogue

  /// vectorization should be considered.

  LLVM_ABI unsigned getEpilogueVectorizationMinVF() const;


  /// Query the target whether it would be preferred to create a predicated

  /// vector loop, which can avoid the need to emit a scalar epilogue loop.

  LLVM_ABI bool preferPredicateOverEpilogue(TailFoldingInfo *TFI) const;


  /// Query the target what the preferred style of tail folding is.

  /// \param IVUpdateMayOverflow Tells whether it is known if the IV update

  /// may (or will never) overflow for the suggested VF/UF in the given loop.

  /// Targets can use this information to select a more optimal tail folding

  /// style. The value conservatively defaults to true, such that no assumptions

  /// are made on overflow.

  LLVM_ABI TailFoldingStyle

  getPreferredTailFoldingStyle(bool IVUpdateMayOverflow = true) const;


  /// Parameters that control the loop peeling transformation. Targets adjust

  /// these through getPeelingPreferences().


  struct PeelingPreferences {

    /// A forced peeling factor (the number of bodies of the original loop

    /// that should be peeled off before the loop body). When set to 0, a

    /// peeling factor is chosen based on profile information and other

    /// factors.

    unsigned PeelCount;

    /// Allow peeling off loop iterations.

    bool AllowPeeling;

    /// Allow peeling off loop iterations for loop nests.

    bool AllowLoopNestsPeeling;

    /// Allow peeling based on profile. Used to enable peeling off all

    /// iterations based on the provided profile.

    /// If the value is true, the peeling cost model can decide to peel only

    /// some iterations, and in that case it will set this to false.

    bool PeelProfiledIterations;


    /// Peel off the last PeelCount loop iterations.

    bool PeelLast;

  };


  /// Get target-customized preferences for the generic loop peeling

  /// transformation. The caller will initialize \p PP with the current

  /// target-independent defaults with information from \p L and \p SE.

  LLVM_ABI void getPeelingPreferences(Loop *L, ScalarEvolution &SE,

                                      PeelingPreferences &PP) const;


  /// Targets can implement their own combinations for target-specific

  /// intrinsics. This function will be called from the InstCombine pass every

  /// time a target-specific intrinsic is encountered.

  ///

  /// \returns std::nullopt to not do anything target specific or a value that

  /// will be returned from the InstCombiner. It is possible to return null and

  /// stop further processing of the intrinsic by returning nullptr.

  LLVM_ABI std::optional<Instruction *>

  instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const;

  /// Can be used to implement target-specific instruction combining.

  /// \see instCombineIntrinsic

  LLVM_ABI std::optional<Value *>

  simplifyDemandedUseBitsIntrinsic(InstCombiner &IC, IntrinsicInst &II,

                                   APInt DemandedMask, KnownBits &Known,

                                   bool &KnownBitsComputed) const;

  /// Can be used to implement target-specific instruction combining.

  /// \see instCombineIntrinsic

  LLVM_ABI std::optional<Value *> simplifyDemandedVectorEltsIntrinsic(

      InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts,

      APInt &UndefElts2, APInt &UndefElts3,

      std::function<void(Instruction *, unsigned, APInt, APInt &)>

          SimplifyAndSetOp) const;

  /// @}


  /// \name Scalar Target Information

  /// @{


  /// Flags indicating the kind of support for population count.

  ///

  /// Compared to the SW implementation, HW support is supposed to

  /// significantly boost the performance when the population is dense, and it

  /// may or may not degrade performance if the population is sparse. HW

  /// support is considered "Fast" if it can outperform, or is on a par

  /// with, the SW implementation when the population is sparse; otherwise, it

  /// is considered "Slow".

  enum PopcntSupportKind { PSK_Software, PSK_SlowHardware, PSK_FastHardware };


  /// Return true if the specified immediate is legal add immediate, that

  /// is the target has add instructions which can add a register with the

  /// immediate without having to materialize the immediate into a register.

  LLVM_ABI bool isLegalAddImmediate(int64_t Imm) const;


  /// Return true if adding the specified scalable immediate is legal, that is

  /// the target has add instructions which can add a register with the

  /// immediate (multiplied by vscale) without having to materialize the

  /// immediate into a register.

  LLVM_ABI bool isLegalAddScalableImmediate(int64_t Imm) const;


  /// Return true if the specified immediate is legal icmp immediate,

  /// that is the target has icmp instructions which can compare a register

  /// against the immediate without having to materialize the immediate into a

  /// register.

  LLVM_ABI bool isLegalICmpImmediate(int64_t Imm) const;


  /// Return true if the addressing mode represented by AM is legal for

  /// this target, for a load/store of the specified type.

  /// The type may be VoidTy, in which case only return true if the addressing

  /// mode is legal for a load/store of any legal type.

  /// If target returns true in LSRWithInstrQueries(), I may be valid.

  /// \param ScalableOffset represents a quantity of bytes multiplied by vscale,

  /// an invariant value known only at runtime. Most targets should not accept

  /// a scalable offset.

  ///

  /// TODO: Handle pre/postinc as well.

  LLVM_ABI bool isLegalAddressingMode(Type *Ty, GlobalValue *BaseGV,

                                      int64_t BaseOffset, bool HasBaseReg,

                                      int64_t Scale, unsigned AddrSpace = 0,

                                      Instruction *I = nullptr,

                                      int64_t ScalableOffset = 0) const;


  /// Return true if LSR cost of C1 is lower than C2.

  LLVM_ABI bool isLSRCostLess(const TargetTransformInfo::LSRCost &C1,

                              const TargetTransformInfo::LSRCost &C2) const;


  /// Return true if LSR major cost is number of registers. Targets which

  /// implement their own isLSRCostLess and unset number of registers as major

  /// cost should return false, otherwise return true.

  LLVM_ABI bool isNumRegsMajorCostOfLSR() const;


  /// Return true if LSR should drop a found solution if it's calculated to be

  /// less profitable than the baseline.

  LLVM_ABI bool shouldDropLSRSolutionIfLessProfitable() const;


  /// \returns true if LSR should not optimize a chain that includes \p I.

  LLVM_ABI bool isProfitableLSRChainElement(Instruction *I) const;


  /// Return true if the target can fuse a compare and branch.

  /// Loop-strength-reduction (LSR) uses that knowledge to adjust its cost

  /// calculation for the instructions in a loop.

  LLVM_ABI bool canMacroFuseCmp() const;


  /// Return true if the target can save a compare for loop count, for example

  /// hardware loop saves a compare.

  LLVM_ABI bool canSaveCmp(Loop *L, BranchInst **BI, ScalarEvolution *SE,

                           LoopInfo *LI, DominatorTree *DT, AssumptionCache *AC,

                           TargetLibraryInfo *LibInfo) const;


  /// Which addressing mode Loop Strength Reduction will try to generate.

  /// The enumerators are bit flags: AMK_All (0x3) equals

  /// AMK_PreIndexed | AMK_PostIndexed.


  enum AddressingModeKind {

    AMK_None = 0x0,        ///< Don't prefer any addressing mode

    AMK_PreIndexed = 0x1,  ///< Prefer pre-indexed addressing mode

    AMK_PostIndexed = 0x2, ///< Prefer post-indexed addressing mode

    AMK_All = 0x3,         ///< Consider all addressing modes

    // Declares AMK_All as the largest value of this bitmask enum.

    LLVM_MARK_AS_BITMASK_ENUM(/*LargestValue=*/AMK_All)

  };


  /// Return the preferred addressing mode LSR should make efforts to generate.

  LLVM_ABI AddressingModeKind

  getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const;


  /// Some targets only support masked load/store with a constant mask.

  /// Taken as a parameter by isLegalMaskedStore() and isLegalMaskedLoad().


  enum MaskKind {

    /// Default value of the MaskKind parameter of the masked load/store

    /// legality queries.

    VariableOrConstantMask,

    ConstantMask,

  };


  /// Return true if the target supports masked store.

  LLVM_ABI bool

  isLegalMaskedStore(Type *DataType, Align Alignment, unsigned AddressSpace,

                     MaskKind MaskKind = VariableOrConstantMask) const;

  /// Return true if the target supports masked load.

  LLVM_ABI bool

  isLegalMaskedLoad(Type *DataType, Align Alignment, unsigned AddressSpace,

                    MaskKind MaskKind = VariableOrConstantMask) const;


  /// Return true if the target supports nontemporal store.

  LLVM_ABI bool isLegalNTStore(Type *DataType, Align Alignment) const;

  /// Return true if the target supports nontemporal load.

  LLVM_ABI bool isLegalNTLoad(Type *DataType, Align Alignment) const;


  /// \returns true if the target supports broadcasting a load to a vector of

  /// type <NumElements x ElementTy>.

  LLVM_ABI bool isLegalBroadcastLoad(Type *ElementTy,

                                     ElementCount NumElements) const;


  /// Return true if the target supports masked scatter.

  LLVM_ABI bool isLegalMaskedScatter(Type *DataType, Align Alignment) const;

  /// Return true if the target supports masked gather.

  LLVM_ABI bool isLegalMaskedGather(Type *DataType, Align Alignment) const;

  /// Return true if the target forces scalarizing of llvm.masked.gather

  /// intrinsics.

  LLVM_ABI bool forceScalarizeMaskedGather(VectorType *Type,

                                           Align Alignment) const;

  /// Return true if the target forces scalarizing of llvm.masked.scatter

  /// intrinsics.

  LLVM_ABI bool forceScalarizeMaskedScatter(VectorType *Type,

                                            Align Alignment) const;


  /// Return true if the target supports masked compress store.

  LLVM_ABI bool isLegalMaskedCompressStore(Type *DataType,

                                           Align Alignment) const;

  /// Return true if the target supports masked expand load.

  LLVM_ABI bool isLegalMaskedExpandLoad(Type *DataType, Align Alignment) const;


  /// Return true if the target supports strided load/store.

  LLVM_ABI bool isLegalStridedLoadStore(Type *DataType, Align Alignment) const;


  /// Return true if the target supports interleaved access for the given vector

  /// type \p VTy, interleave factor \p Factor, alignment \p Alignment and

  /// address space \p AddrSpace.

  LLVM_ABI bool isLegalInterleavedAccessType(VectorType *VTy, unsigned Factor,

                                             Align Alignment,

                                             unsigned AddrSpace) const;


  /// Return true if the target supports masked vector histograms.

  LLVM_ABI bool isLegalMaskedVectorHistogram(Type *AddrType,

                                             Type *DataType) const;


  /// Return true if this is an alternating opcode pattern that can be lowered

  /// to a single instruction on the target. In X86 this is for the addsub

  /// instruction which corresponds to a Shuffle + Fadd + FSub pattern in IR.

  /// This function expects two opcodes: \p Opcode0 and \p Opcode1 being

  /// selected by \p OpcodeMask. The mask contains one bit per lane and is a `0`

  /// when \p Opcode0 is selected and `1` when \p Opcode1 is selected.

  /// \p VecTy is the vector type of the instruction to be generated.

  LLVM_ABI bool isLegalAltInstr(VectorType *VecTy, unsigned Opcode0,

                                unsigned Opcode1,

                                const SmallBitVector &OpcodeMask) const;


  /// Return true if we should be enabling ordered reductions for the target.

  LLVM_ABI bool enableOrderedReductions() const;


  /// Return true if the target has a unified operation to calculate division

  /// and remainder. If so, the additional implicit multiplication and

  /// subtraction required to calculate a remainder from division are free. This

  /// can enable more aggressive transformations for division and remainder than

  /// would typically be allowed using throughput or size cost models.

  LLVM_ABI bool hasDivRemOp(Type *DataType, bool IsSigned) const;


  /// Return true if the given instruction (assumed to be a memory access

  /// instruction) has a volatile variant. If that's the case then we can avoid

  /// addrspacecast to generic AS for volatile loads/stores. Default

  /// implementation returns false, which prevents address space inference for

  /// volatile loads/stores.

  LLVM_ABI bool hasVolatileVariant(Instruction *I, unsigned AddrSpace) const;


  /// Return true if target doesn't mind addresses in vectors.

  LLVM_ABI bool prefersVectorizedAddressing() const;


  /// Return the cost of the scaling factor used in the addressing

  /// mode represented by AM for this target, for a load/store

  /// of the specified type.

  /// If the AM is supported, the return value must be >= 0.

  /// If the AM is not supported, it returns a negative value.

  /// TODO: Handle pre/postinc as well.

  LLVM_ABI InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV,

                                                StackOffset BaseOffset,

                                                bool HasBaseReg, int64_t Scale,

                                                unsigned AddrSpace = 0) const;


  /// Return true if the loop strength reduce pass should make

  /// Instruction* based TTI queries to isLegalAddressingMode(). This is

  /// needed on SystemZ, where e.g. a memcpy can only have a 12 bit unsigned

  /// immediate offset and no index register.

  LLVM_ABI bool LSRWithInstrQueries() const;


  /// Return true if it's free to truncate a value of type Ty1 to type

  /// Ty2. e.g. On x86 it's free to truncate a i32 value in register EAX to i16

  /// by referencing its sub-register AX.

  LLVM_ABI bool isTruncateFree(Type *Ty1, Type *Ty2) const;


  /// Return true if it is profitable to hoist instruction in the

  /// then/else to before if.

  LLVM_ABI bool isProfitableToHoist(Instruction *I) const;


  LLVM_ABI bool useAA() const;


  /// Return true if this type is legal.

  LLVM_ABI bool isTypeLegal(Type *Ty) const;


  /// Returns the estimated number of registers required to represent \p Ty.

  LLVM_ABI unsigned getRegUsageForType(Type *Ty) const;


  /// Return true if switches should be turned into lookup tables for the

  /// target.

  LLVM_ABI bool shouldBuildLookupTables() const;


  /// Return true if switches should be turned into lookup tables

  /// containing this constant value for the target.

  LLVM_ABI bool shouldBuildLookupTablesForConstant(Constant *C) const;


  /// Return true if lookup tables should be turned into relative lookup tables.

  LLVM_ABI bool shouldBuildRelLookupTables() const;


  /// Return true if the input function, which is cold at all call sites,

  /// should use the coldcc calling convention.

  LLVM_ABI bool useColdCCForColdCall(Function &F) const;


  /// Return true if the input function, which is internal, should use the

  /// fastcc calling convention.

  LLVM_ABI bool useFastCCForInternalCall(Function &F) const;


  LLVM_ABI bool isTargetIntrinsicTriviallyScalarizable(Intrinsic::ID ID) const;


  /// Identifies if the vector form of the intrinsic has a scalar operand.

  LLVM_ABI bool isTargetIntrinsicWithScalarOpAtArg(Intrinsic::ID ID,

                                                   unsigned ScalarOpdIdx) const;


  /// Identifies if the vector form of the intrinsic is overloaded on the type

  /// of the operand at index \p OpdIdx, or on the return type if \p OpdIdx is

  /// -1.

  LLVM_ABI bool isTargetIntrinsicWithOverloadTypeAtArg(Intrinsic::ID ID,

                                                       int OpdIdx) const;


  /// Identifies if the vector form of the intrinsic that returns a struct is

  /// overloaded at the struct element index \p RetIdx.

  LLVM_ABI bool

  isTargetIntrinsicWithStructReturnOverloadAtField(Intrinsic::ID ID,

                                                   int RetIdx) const;


  /// Estimate the overhead of scalarizing an instruction. Insert and Extract

  /// are set if the demanded result elements need to be inserted and/or

  /// extracted from vectors.  The involved values may be passed in VL if

  /// Insert is true.

  LLVM_ABI InstructionCost getScalarizationOverhead(

      VectorType *Ty, const APInt &DemandedElts, bool Insert, bool Extract,

      TTI::TargetCostKind CostKind, bool ForPoisonSrc = true,

      ArrayRef<Value *> VL = {}) const;


  /// Estimate the overhead of scalarizing operands with the given types. The

  /// (potentially vector) types to use for each argument are passed via Tys.

  LLVM_ABI InstructionCost getOperandsScalarizationOverhead(

      ArrayRef<Type *> Tys, TTI::TargetCostKind CostKind) const;


  /// If target has efficient vector element load/store instructions, it can

  /// return true here so that insertion/extraction costs are not added to

  /// the scalarization cost of a load/store.

  LLVM_ABI bool supportsEfficientVectorElementLoadStore() const;


  /// If the target supports tail calls.

  LLVM_ABI bool supportsTailCalls() const;


  /// If target supports tail call on \p CB

  LLVM_ABI bool supportsTailCallFor(const CallBase *CB) const;


  /// Don't restrict interleaved unrolling to small loops.

  LLVM_ABI bool enableAggressiveInterleaving(bool LoopHasReductions) const;


  /// Returns options for expansion of memcmp. IsZeroCmp is

  /// true if this is the expansion of memcmp(p1, p2, s) == 0.


  struct MemCmpExpansionOptions {
    /// Converts to true exactly when memcmp expansion is enabled, i.e. when
    /// at least one load is permitted.
    operator bool() const { return MaxNumLoads != 0; }

    /// Upper bound on the number of load operations.
    unsigned MaxNumLoads = 0;

    /// Load sizes (in bytes) that may be used, sorted in decreasing order.
    SmallVector<unsigned, 8> LoadSizes;

    /// Number of load pairs allowed per block when the memcmp result is only
    /// compared equal or not-equal to 0. For instance, a value of 2 may allow
    /// 'memcmp(a, b, 3) == 0' to be expanded in a single block:
    ///   a0 = load2bytes &a[0]
    ///   b0 = load2bytes &b[0]
    ///   a2 = load1byte  &a[2]
    ///   b2 = load1byte  &b[2]
    ///   r  = cmp eq (a0 ^ b0 | a2 ^ b2), 0
    unsigned NumLoadsPerBlock = 1;

    /// When true, loads are allowed to overlap. A 7-byte compare can then be
    /// done with two 4-byte compares rather than 4+2+1-byte compares. This
    /// requires every size in LoadSizes to be loadable in an unaligned way.
    bool AllowOverlappingLoads = false;

    /// Sizes of memcmp tails that may be merged into one block.
    ///
    /// Sometimes the amount of data to compare is smaller than the standard
    /// register size yet cannot be loaded with a single load instruction. For
    /// a 6-byte comparison, for example, it is more efficient to load all 6
    /// bytes in a single block and generate an 8-byte number than to generate
    /// two separate blocks with conditional jumps for the 4 and 2 byte loads.
    /// This simplifies the process and produces the comparison result as
    /// normal.
    SmallVector<unsigned, 4> AllowedTailExpansions;
  };


  LLVM_ABI MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize,

                                                        bool IsZeroCmp) const;


  /// Should the Select Optimization pass be enabled and run.

  LLVM_ABI bool enableSelectOptimize() const;


  /// Should the Select Optimization pass treat the given instruction like a

  /// select, potentially converting it to a conditional branch. This can

  /// include select-like instructions like or(zext(c), x) that can be converted

  /// to selects.

  LLVM_ABI bool shouldTreatInstructionLikeSelect(const Instruction *I) const;


  /// Enable matching of interleaved access groups.

  LLVM_ABI bool enableInterleavedAccessVectorization() const;


  /// Enable matching of interleaved access groups that contain predicated

  /// accesses or gaps and therefore vectorized using masked

  /// vector loads/stores.

  LLVM_ABI bool enableMaskedInterleavedAccessVectorization() const;


  /// Indicate that it is potentially unsafe to automatically vectorize

  /// floating-point operations because the semantics of vector and scalar

  /// floating-point operations may differ. For example, ARM NEON v7 SIMD math

  /// does not support IEEE-754 denormal numbers, while depending on the

  /// platform, scalar floating-point math does.

  /// This applies to floating-point math operations and calls, not memory

  /// operations, shuffles, or casts.

  LLVM_ABI bool isFPVectorizationPotentiallyUnsafe() const;


  /// Determine if the target supports unaligned memory accesses.

  LLVM_ABI bool allowsMisalignedMemoryAccesses(LLVMContext &Context,

                                               unsigned BitWidth,

                                               unsigned AddressSpace = 0,

                                               Align Alignment = Align(1),

                                               unsigned *Fast = nullptr) const;


  /// Return hardware support for population count.

  LLVM_ABI PopcntSupportKind getPopcntSupport(unsigned IntTyWidthInBit) const;


  /// Return true if the hardware has a fast square-root instruction.

  LLVM_ABI bool haveFastSqrt(Type *Ty) const;


  /// Return true if the cost of the instruction is too high to speculatively

  /// execute and should be kept behind a branch.

  /// This normally just wraps around a getInstructionCost() call, but some

  /// targets might report a low TCK_SizeAndLatency value that is incompatible

  /// with the fixed TCC_Expensive value.

  /// NOTE: This assumes the instruction passes isSafeToSpeculativelyExecute().

  LLVM_ABI bool isExpensiveToSpeculativelyExecute(const Instruction *I) const;


  /// Return true if it is faster to check if a floating-point value is NaN

  /// (or not-NaN) versus a comparison against a constant FP zero value.

  /// Targets should override this if materializing a 0.0 for comparison is

  /// generally as cheap as checking for ordered/unordered.

  LLVM_ABI bool isFCmpOrdCheaperThanFCmpZero(Type *Ty) const;


  /// Return the expected cost of supporting the floating point operation

  /// of the specified type.

  LLVM_ABI InstructionCost getFPOpCost(Type *Ty) const;


  /// Return the expected cost of materialization for the given integer

  /// immediate of the specified type.

  LLVM_ABI InstructionCost getIntImmCost(const APInt &Imm, Type *Ty,

                                         TargetCostKind CostKind) const;


  /// Return the expected cost of materialization for the given integer

  /// immediate of the specified type for a given instruction. The cost can be

  /// zero if the immediate can be folded into the specified instruction.

  LLVM_ABI InstructionCost getIntImmCostInst(unsigned Opc, unsigned Idx,

                                             const APInt &Imm, Type *Ty,

                                             TargetCostKind CostKind,

                                             Instruction *Inst = nullptr) const;

  LLVM_ABI InstructionCost getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx,

                                               const APInt &Imm, Type *Ty,

                                               TargetCostKind CostKind) const;


  /// Return the expected cost for the given integer when optimising

  /// for size. This is different than the other integer immediate cost

  /// functions in that it is subtarget agnostic. This is useful when you e.g.

  /// target one ISA such as Aarch32 but smaller encodings could be possible

  /// with another such as Thumb. This return value is used as a penalty when

  /// the total costs for a constant is calculated (the bigger the cost, the

  /// more beneficial constant hoisting is).

  LLVM_ABI InstructionCost getIntImmCodeSizeCost(unsigned Opc, unsigned Idx,

                                                 const APInt &Imm,

                                                 Type *Ty) const;


  /// It can be advantageous to detach complex constants from their uses to make

  /// their generation cheaper. This hook allows targets to report when such

  /// transformations might negatively affect the code generation of the

  /// underlying operation. The motivating example is divides whereby hoisting

  /// constants prevents the code generator's ability to transform them into

  /// combinations of simpler operations.

  LLVM_ABI bool preferToKeepConstantsAttached(const Instruction &Inst,

                                              const Function &Fn) const;


  /// @}


  /// \name Vector Target Information

  /// @{


  /// The various kinds of shuffle patterns for vector queries.


  enum ShuffleKind {

    SK_Broadcast,        ///< Broadcast element 0 to all other elements.

    SK_Reverse,          ///< Reverse the order of the vector.

    SK_Select,           ///< Selects elements from the corresponding lane of

                         ///< either source operand. This is equivalent to a

                         ///< vector select with a constant condition operand.

    SK_Transpose,        ///< Transpose two vectors.

    SK_InsertSubvector,  ///< InsertSubvector. Index indicates start offset.

    SK_ExtractSubvector, ///< ExtractSubvector. Index indicates start offset.

    SK_PermuteTwoSrc,    ///< Merge elements from two source vectors into one

                         ///< with any shuffle mask.

    SK_PermuteSingleSrc, ///< Shuffle elements of single source vector with any

                         ///< shuffle mask.

    SK_Splice            ///< Concatenates elements from the first input vector

                         ///< with elements of the second input vector, returning

                         ///< a vector of the same type as the input vectors.

                         ///< Index indicates start offset in first input vector.

  };


  /// Additional information about an operand's possible values.
  enum OperandValueKind {
    OK_AnyValue,               ///< Operand can have any value.
    OK_UniformValue,           ///< Operand is uniform (splat of a value).
    OK_UniformConstantValue,   ///< Operand is uniform constant.
    OK_NonUniformConstantValue ///< Operand is a non uniform constant value.
  };

  /// Additional properties of an operand's values.
  enum OperandValueProperties {
    OP_None = 0,
    OP_PowerOf2 = 1,
    OP_NegatedPowerOf2 = 2,
  };

  /// Describes the values an operand can take. Uses of OperandValueKind and
  /// OperandValueProperties are being migrated to this class, after which the
  /// internal representation will change.
  struct OperandValueInfo {
    OperandValueKind Kind = OK_AnyValue;
    OperandValueProperties Properties = OP_None;

    /// True for both the uniform and the non-uniform constant kinds.
    bool isConstant() const {
      switch (Kind) {
      case OK_UniformConstantValue:
      case OK_NonUniformConstantValue:
        return true;
      case OK_AnyValue:
      case OK_UniformValue:
        break;
      }
      return false;
    }

    /// True for a uniform value, whether or not it is constant.
    bool isUniform() const {
      return Kind == OK_UniformValue || Kind == OK_UniformConstantValue;
    }

    /// True when the recorded property is exactly OP_PowerOf2.
    bool isPowerOf2() const { return Properties == OP_PowerOf2; }

    /// True when the recorded property is exactly OP_NegatedPowerOf2.
    bool isNegatedPowerOf2() const { return Properties == OP_NegatedPowerOf2; }

    /// Returns a copy with the same Kind and Properties reset to OP_None.
    OperandValueInfo getNoProps() const {
      OperandValueInfo Stripped = *this;
      Stripped.Properties = OP_None;
      return Stripped;
    }
  };


  /// \return the number of registers in the target-provided register class.

  LLVM_ABI unsigned getNumberOfRegisters(unsigned ClassID) const;


  /// \return true if the target supports load/store that enables fault

  /// suppression of memory operands when the source condition is false.

  LLVM_ABI bool hasConditionalLoadStoreForType(Type *Ty, bool IsStore) const;


  /// \return the target-provided register class ID for the provided type,

  /// accounting for type promotion and other type-legalization techniques that

  /// the target might apply. However, it specifically does not account for the

  /// scalarization or splitting of vector types. Should a vector type require

  /// scalarization or splitting into multiple underlying vector registers, that

  /// type should be mapped to a register class containing no registers.

  /// Specifically, this is designed to provide a simple, high-level view of the

  /// register allocation later performed by the backend. These register classes

  /// don't necessarily map onto the register classes used by the backend.

  /// FIXME: It's not currently possible to determine how many registers

  /// are used by the provided type.

  LLVM_ABI unsigned getRegisterClassForType(bool Vector,

                                            Type *Ty = nullptr) const;


  /// \return the target-provided register class name

  LLVM_ABI const char *getRegisterClassName(unsigned ClassID) const;


  /// Kind of register passed to getRegisterBitWidth() and

  /// shouldMaximizeVectorBandwidth().

  enum RegisterKind { RGK_Scalar, RGK_FixedWidthVector, RGK_ScalableVector };


  /// \return The width of the largest scalar or vector register type.

  LLVM_ABI TypeSize getRegisterBitWidth(RegisterKind K) const;


  /// \return The width of the smallest vector register type.

  LLVM_ABI unsigned getMinVectorRegisterBitWidth() const;


  /// \return The maximum value of vscale if the target specifies an

  ///  architectural maximum vector length, and std::nullopt otherwise.

  LLVM_ABI std::optional<unsigned> getMaxVScale() const;


  /// \return the value of vscale to tune the cost model for.

  LLVM_ABI std::optional<unsigned> getVScaleForTuning() const;


  /// \return true if vscale is known to be a power of 2

  LLVM_ABI bool isVScaleKnownToBeAPowerOfTwo() const;


  /// \return True if the vectorization factor should be chosen to

  /// make the vector of the smallest element type match the size of a

  /// vector register. For wider element types, this could result in

  /// creating vectors that span multiple vector registers.

  /// If false, the vectorization factor will be chosen based on the

  /// size of the widest element type.

  /// \p K Register Kind for vectorization.

  LLVM_ABI bool

  shouldMaximizeVectorBandwidth(TargetTransformInfo::RegisterKind K) const;


  /// \return The minimum vectorization factor for types of given element

  /// bit width, or 0 if there is no minimum VF. The returned value only

  /// applies when shouldMaximizeVectorBandwidth returns true.

  /// If IsScalable is true, the returned ElementCount must be a scalable VF.

  LLVM_ABI ElementCount getMinimumVF(unsigned ElemWidth, bool IsScalable) const;


  /// \return The maximum vectorization factor for types of given element

  /// bit width and opcode, or 0 if there is no maximum VF.

  /// Currently only used by the SLP vectorizer.

  LLVM_ABI unsigned getMaximumVF(unsigned ElemWidth, unsigned Opcode) const;


  /// \return The minimum vectorization factor for the store instruction. Given

  /// the initial estimation of the minimum vector factor and store value type,

  /// it tries to find possible lowest VF, which still might be profitable for

  /// the vectorization.

  /// \param VF Initial estimation of the minimum vector factor.

  /// \param ScalarMemTy Scalar memory type of the store operation.

  /// \param ScalarValTy Scalar type of the stored value.

  /// Currently only used by the SLP vectorizer.

  LLVM_ABI unsigned getStoreMinimumVF(unsigned VF, Type *ScalarMemTy,

                                      Type *ScalarValTy) const;


  /// \return True if it should be considered for address type promotion.

  /// \p AllowPromotionWithoutCommonHeader Set true if promoting \p I is

  /// profitable without finding other extensions fed by the same input.

  LLVM_ABI bool shouldConsiderAddressTypePromotion(

      const Instruction &I, bool &AllowPromotionWithoutCommonHeader) const;


  /// \return The size of a cache line in bytes.

  LLVM_ABI unsigned getCacheLineSize() const;


  /// The cache levels that can be queried.
  ///
  /// L3 caches are currently not modeled, as their sizes differ widely between
  /// microarchitectures. Also, there is currently no use for L3 cache size
  /// modeling.
  enum class CacheLevel {
    L1D, ///< The L1 data cache.
    L2D, ///< The L2 data cache.
  };


  /// \return The size of the cache level in bytes, if available.

  LLVM_ABI std::optional<unsigned> getCacheSize(CacheLevel Level) const;


  /// \return The associativity of the cache level, if available.

  LLVM_ABI std::optional<unsigned>

  getCacheAssociativity(CacheLevel Level) const;


  /// \return The minimum architectural page size for the target.

  LLVM_ABI std::optional<unsigned> getMinPageSize() const;


  /// \return How much before a load we should place the prefetch

  /// instruction.  This is currently measured in number of

  /// instructions.

  LLVM_ABI unsigned getPrefetchDistance() const;


  /// Some HW prefetchers can handle accesses up to a certain constant stride.

  /// Sometimes prefetching is beneficial even below the HW prefetcher limit,

  /// and the arguments provided are meant to serve as a basis for deciding this

  /// for a particular loop.

  ///

  /// \param NumMemAccesses        Number of memory accesses in the loop.

  /// \param NumStridedMemAccesses Number of the memory accesses that

  ///                              ScalarEvolution could find a known stride

  ///                              for.

  /// \param NumPrefetches         Number of software prefetches that will be

  ///                              emitted as determined by the addresses

  ///                              involved and the cache line size.

  /// \param HasCall               True if the loop contains a call.

  ///

  /// \return This is the minimum stride in bytes where it makes sense to start

  ///         adding SW prefetches. The default is 1, i.e. prefetch with any

  ///         stride.

  LLVM_ABI unsigned getMinPrefetchStride(unsigned NumMemAccesses,

                                         unsigned NumStridedMemAccesses,

                                         unsigned NumPrefetches,

                                         bool HasCall) const;


  /// \return The maximum number of iterations to prefetch ahead.  If

  /// the required number of iterations is more than this number, no

  /// prefetching is performed.

  LLVM_ABI unsigned getMaxPrefetchIterationsAhead() const;


  /// \return True if prefetching should also be done for writes.

  LLVM_ABI bool enableWritePrefetching() const;


  /// \return True if the target wants prefetches issued in address space \p AS.

  LLVM_ABI bool shouldPrefetchAddressSpace(unsigned AS) const;


  /// \return The cost of a partial reduction, which is a reduction from a

  /// vector to another vector with fewer elements of larger size. They are

  /// represented by the llvm.vector.partial.reduce.add intrinsic, which

  /// takes an accumulator of type \p AccumType and a second vector operand to

  /// be accumulated, whose element count is specified by \p VF. The type of

  /// reduction is specified by \p Opcode. The second operand passed to the

  /// intrinsic could be the result of an extend, such as sext or zext. In

  /// this case \p BinOp is nullopt, \p InputTypeA represents the type being

  /// extended and \p OpAExtend the operation, i.e. sign- or zero-extend.

  /// Also, \p InputTypeB should be nullptr and OpBExtend should be None.

  /// Alternatively, the second operand could be the result of a binary

  /// operation performed on two extends, i.e.

  ///   mul(zext i8 %a -> i32, zext i8 %b -> i32).

  /// In this case \p BinOp may specify the opcode of the binary operation,

  /// \p InputTypeA and \p InputTypeB the types being extended, and

  /// \p OpAExtend, \p OpBExtend the form of extensions. An example of an

  /// operation that uses a partial reduction is a dot product, which reduces

  /// two vectors in binary mul operation to another of 4 times fewer and 4

  /// times larger elements.

  LLVM_ABI InstructionCost getPartialReductionCost(

      unsigned Opcode, Type *InputTypeA, Type *InputTypeB, Type *AccumType,

      ElementCount VF, PartialReductionExtendKind OpAExtend,

      PartialReductionExtendKind OpBExtend, std::optional<unsigned> BinOp,

      TTI::TargetCostKind CostKind) const;


  /// \return The maximum interleave factor that any transform should try to

  /// perform for this target. This number depends on the level of parallelism

  /// and the number of execution units in the CPU.

  LLVM_ABI unsigned getMaxInterleaveFactor(ElementCount VF) const;


  /// Collect properties of V used in cost analysis, e.g. OP_PowerOf2.

  LLVM_ABI static OperandValueInfo getOperandInfo(const Value *V);


  /// This is an approximation of reciprocal throughput of a math/logic op.

  /// A higher cost indicates less expected throughput.

  /// From Agner Fog's guides, reciprocal throughput is "the average number of

  /// clock cycles per instruction when the instructions are not part of a

  /// limiting dependency chain."

  /// Therefore, costs should be scaled to account for multiple execution units

  /// on the target that can process this type of instruction. For example, if

  /// there are 5 scalar integer units and 2 vector integer units that can

  /// calculate an 'add' in a single cycle, this model should indicate that the

  /// cost of the vector add instruction is 2.5 times the cost of the scalar

  /// add instruction.

  /// \p Args is an optional argument which holds the instruction operands

  /// values so the TTI can analyze those values searching for special

  /// cases or optimizations based on those values.

  /// \p CxtI is the optional original context instruction, if one exists, to

  /// provide even more information.

  /// \p TLibInfo is used to search for platform specific vector library

  /// functions for instructions that might be converted to calls (e.g. frem).

  LLVM_ABI InstructionCost getArithmeticInstrCost(

      unsigned Opcode, Type *Ty,

      TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput,

      TTI::OperandValueInfo Opd1Info = {TTI::OK_AnyValue, TTI::OP_None},

      TTI::OperandValueInfo Opd2Info = {TTI::OK_AnyValue, TTI::OP_None},

      ArrayRef<const Value *> Args = {}, const Instruction *CxtI = nullptr,

      const TargetLibraryInfo *TLibInfo = nullptr) const;


  /// Returns the cost estimation for alternating opcode pattern that can be

  /// lowered to a single instruction on the target. In X86 this is for the

  /// addsub instruction which corresponds to a Shuffle + Fadd + FSub pattern in

  /// IR. This function expects two opcodes: \p Opcode0 and \p Opcode1 being

  /// selected by \p OpcodeMask. The mask contains one bit per lane and is a `0`

  /// when \p Opcode0 is selected and `1` when \p Opcode1 is selected.

  /// \p VecTy is the vector type of the instruction to be generated.

  LLVM_ABI InstructionCost getAltInstrCost(

      VectorType *VecTy, unsigned Opcode0, unsigned Opcode1,

      const SmallBitVector &OpcodeMask,

      TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput) const;


  /// \return The cost of a shuffle instruction of kind Kind with inputs of type

  /// SrcTy, producing a vector of type DstTy. The exact mask may be passed as

  /// Mask, or else the array will be empty. The Index and SubTp parameters

  /// are used by the subvector insertions shuffle kinds to show the insert

  /// point and the type of the subvector being inserted. The operands of the

  /// shuffle can be passed through \p Args, which helps improve the cost

  /// estimation in some cases, like in broadcast loads.

  LLVM_ABI InstructionCost getShuffleCost(

      ShuffleKind Kind, VectorType *DstTy, VectorType *SrcTy,

      ArrayRef<int> Mask = {},

      TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput, int Index = 0,

      VectorType *SubTp = nullptr, ArrayRef<const Value *> Args = {},

      const Instruction *CxtI = nullptr) const;


  /// Represents a hint about the context in which a cast is used.

  ///

  /// For zext/sext, the context of the cast is the operand, which must be a

  /// load of some kind. For trunc, the context of the cast is the single

  /// user of the instruction, which must be a store of some kind.

  ///

  /// This enum allows the vectorizer to give getCastInstrCost an idea of the

  /// type of cast it's dealing with, as not every cast is equal. For instance,

  /// the zext of a load may be free, but the zext of an interleaving load can

  /// be (very) expensive!

  ///

  /// See \c getCastContextHint to compute a CastContextHint from a cast

  /// Instruction*. Callers can use it if they don't need to override the

  /// context and just want it to be calculated from the instruction.

  ///

  /// FIXME: This handles the types of load/store that the vectorizer can

  /// produce, which are the cases where the context instruction is most

  /// likely to be incorrect. There are other situations where that can happen

  /// too, which might be handled here but in the long run a more general

  /// solution of costing multiple instructions at the same time may be better.


  enum class CastContextHint : uint8_t {
    /// The cast is not used with a load/store of any kind.
    None,
    /// The cast is used with a normal load/store.
    Normal,
    /// The cast is used with a masked load/store.
    Masked,
    /// The cast is used with a gather/scatter.
    GatherScatter,
    /// The cast is used with an interleaved load/store.
    Interleave,
    /// The cast is used with a reversed load/store.
    Reversed,
  };


  /// Calculates a CastContextHint from \p I.

  /// This should be used by callers of getCastInstrCost if they wish to

  /// determine the context from some instruction.

  /// \returns the CastContextHint for ZExt/SExt/Trunc, None if \p I is nullptr,

  /// or if it's another type of cast.

  LLVM_ABI static CastContextHint getCastContextHint(const Instruction *I);


  /// \return The expected cost of cast instructions, such as bitcast, trunc,

  /// zext, etc. If there is an existing instruction that holds Opcode, it

  /// may be passed in the 'I' parameter.

  LLVM_ABI InstructionCost getCastInstrCost(

      unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH,

      TTI::TargetCostKind CostKind = TTI::TCK_SizeAndLatency,

      const Instruction *I = nullptr) const;


  /// \return The expected cost of a sign- or zero-extended vector extract. Use

  /// Index = -1 to indicate that there is no information about the index value.

  LLVM_ABI InstructionCost

  getExtractWithExtendCost(unsigned Opcode, Type *Dst, VectorType *VecTy,

                           unsigned Index, TTI::TargetCostKind CostKind) const;


  /// \return The expected cost of control-flow related instructions such as

  /// Phi, Ret, Br, Switch.

  LLVM_ABI InstructionCost getCFInstrCost(

      unsigned Opcode, TTI::TargetCostKind CostKind = TTI::TCK_SizeAndLatency,

      const Instruction *I = nullptr) const;


  /// \returns The expected cost of compare and select instructions. If there

  /// is an existing instruction that holds Opcode, it may be passed in the

  /// 'I' parameter. The \p VecPred parameter can be used to indicate the select

  /// is using a compare with the specified predicate as condition. When vector

  /// types are passed, \p VecPred must be used for all lanes.  For a

  /// comparison, the two operands are the natural values.  For a select, the

  /// two operands are the *value* operands, not the condition operand.

  LLVM_ABI InstructionCost getCmpSelInstrCost(

      unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred,

      TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput,

      OperandValueInfo Op1Info = {OK_AnyValue, OP_None},

      OperandValueInfo Op2Info = {OK_AnyValue, OP_None},

      const Instruction *I = nullptr) const;


  /// \return The expected cost of vector Insert and Extract.

  /// Use -1 to indicate that there is no information on the index value.

  /// This is used when the instruction is not available; a typical use

  /// case is to provision the cost of vectorization/scalarization in

  /// vectorizer passes.

  LLVM_ABI InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val,

                                              TTI::TargetCostKind CostKind,

                                              unsigned Index = -1,

                                              const Value *Op0 = nullptr,

                                              const Value *Op1 = nullptr) const;


  /// \return The expected cost of vector Insert and Extract.

  /// Use -1 to indicate that there is no information on the index value.

  /// This is used when the instruction is not available; a typical use

  /// case is to provision the cost of vectorization/scalarization in

  /// vectorizer passes.

  /// \param ScalarUserAndIdx encodes the information about extracts from a

  /// vector with 'Scalar' being the value being extracted,'User' being the user

  /// of the extract(nullptr if user is not known before vectorization) and

  /// 'Idx' being the extract lane.

  LLVM_ABI InstructionCost getVectorInstrCost(

      unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index,

      Value *Scalar,

      ArrayRef<std::tuple<Value *, User *, int>> ScalarUserAndIdx) const;


  /// \return The expected cost of vector Insert and Extract.

  /// This is used when instruction is available, and implementation

  /// asserts 'I' is not nullptr.

  ///

  /// A typical suitable use case is cost estimation when vector instruction

  /// exists (e.g., from basic blocks during transformation).

  LLVM_ABI InstructionCost getVectorInstrCost(const Instruction &I, Type *Val,

                                              TTI::TargetCostKind CostKind,

                                              unsigned Index = -1) const;


  /// \return The expected cost of inserting or extracting a lane that is \p

  /// Index elements from the end of a vector, i.e. the mathematical expression

  /// for the lane is (VF - 1 - Index). This is required for scalable vectors

  /// where the exact lane index is unknown at compile time.

  LLVM_ABI InstructionCost getIndexedVectorInstrCostFromEnd(

      unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind,

      unsigned Index) const;


  /// \return The expected cost of aggregate inserts and extracts. This is

  /// used when the instruction is not available; a typical use case is to

  /// provision the cost of vectorization/scalarization in vectorizer passes.

  LLVM_ABI InstructionCost getInsertExtractValueCost(

      unsigned Opcode, TTI::TargetCostKind CostKind) const;


  /// \return The cost of replication shuffle of \p VF elements typed \p EltTy

  /// \p ReplicationFactor times.

  ///

  /// For example, the mask for \p ReplicationFactor=3 and \p VF=4 is:

  ///   <0,0,0,1,1,1,2,2,2,3,3,3>

  LLVM_ABI InstructionCost getReplicationShuffleCost(

      Type *EltTy, int ReplicationFactor, int VF, const APInt &DemandedDstElts,

      TTI::TargetCostKind CostKind) const;


  /// \return The cost of Load and Store instructions. The operand info

  /// \p OpdInfo should refer to the stored value for stores and the address

  /// for loads.

  LLVM_ABI InstructionCost getMemoryOpCost(

      unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace,

      TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput,

      OperandValueInfo OpdInfo = {OK_AnyValue, OP_None},

      const Instruction *I = nullptr) const;


  /// \return The cost of the interleaved memory operation.

  /// \p Opcode is the memory operation code

  /// \p VecTy is the vector type of the interleaved access.

  /// \p Factor is the interleave factor

  /// \p Indices is the indices for interleaved load members (as interleaved

  ///    load allows gaps)

  /// \p Alignment is the alignment of the memory operation

  /// \p AddressSpace is address space of the pointer.

  /// \p UseMaskForCond indicates if the memory access is predicated.

  /// \p UseMaskForGaps indicates if gaps should be masked.

  LLVM_ABI InstructionCost getInterleavedMemoryOpCost(

      unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,

      Align Alignment, unsigned AddressSpace,

      TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput,

      bool UseMaskForCond = false, bool UseMaskForGaps = false) const;


  /// A helper function to determine the type of reduction algorithm used

  /// for a given \p Opcode and set of FastMathFlags \p FMF.


  static bool requiresOrderedReduction(std::optional<FastMathFlags> FMF) {

    return FMF && !(*FMF).allowReassoc();

  }


  /// Calculate the cost of vector reduction intrinsics.

  ///

  /// This is the cost of reducing the vector value of type \p Ty to a scalar

  /// value using the operation denoted by \p Opcode. The FastMathFlags

  /// parameter \p FMF indicates what type of reduction we are performing:

  ///   1. Tree-wise. This is the typical 'fast' reduction performed that

  ///   involves successively splitting a vector into half and doing the

  ///   operation on the pair of halves until you have a scalar value. For

  ///   example:

  ///     (v0, v1, v2, v3)

  ///     ((v0+v2), (v1+v3), undef, undef)

  ///     ((v0+v2+v1+v3), undef, undef, undef)

  ///   This is the default behaviour for integer operations, whereas for

  ///   floating point we only do this if \p FMF indicates that

  ///   reassociation is allowed.

  ///   2. Ordered. For a vector with N elements this involves performing N

  ///   operations in lane order, starting with an initial scalar value, i.e.

  ///     result = InitVal + v0

  ///     result = result + v1

  ///     result = result + v2

  ///     result = result + v3

  ///   This is only the case for FP operations and when reassociation is not

  ///   allowed.

  ///

  LLVM_ABI InstructionCost getArithmeticReductionCost(

      unsigned Opcode, VectorType *Ty, std::optional<FastMathFlags> FMF,

      TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput) const;


  /// Calculate the cost of a min/max vector reduction.
  ///
  /// NOTE(review): presumably \p IID identifies the min/max intrinsic being
  /// costed and \p Ty is the vector type being reduced, mirroring
  /// getArithmeticReductionCost -- confirm against the implementation.
  LLVM_ABI InstructionCost getMinMaxReductionCost(

      Intrinsic::ID IID, VectorType *Ty, FastMathFlags FMF = FastMathFlags(),

      TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput) const;


  /// Calculate the cost of an extended reduction pattern, similar to

  /// getArithmeticReductionCost of an Add/Sub reduction with multiply and

  /// optional extensions. This is the cost of:

  /// * ResTy vecreduce.add/sub(mul (A, B)) or,

  /// * ResTy vecreduce.add/sub(mul(ext(Ty A), ext(Ty B))).

  LLVM_ABI InstructionCost getMulAccReductionCost(

      bool IsUnsigned, unsigned RedOpcode, Type *ResTy, VectorType *Ty,

      TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput) const;


  /// Calculate the cost of an extended reduction pattern, similar to

  /// getArithmeticReductionCost of a reduction with an extension.

  /// This is the cost of:

  /// ResTy vecreduce.opcode(ext(Ty A)).

  LLVM_ABI InstructionCost getExtendedReductionCost(

      unsigned Opcode, bool IsUnsigned, Type *ResTy, VectorType *Ty,

      std::optional<FastMathFlags> FMF,

      TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput) const;


  /// \returns The cost of Intrinsic instructions. Analyses the real arguments.

  /// Three cases are handled: 1. scalar instruction 2. vector instruction

  /// 3. scalar instruction which is to be vectorized.

  LLVM_ABI InstructionCost getIntrinsicInstrCost(

      const IntrinsicCostAttributes &ICA, TTI::TargetCostKind CostKind) const;


  /// \returns The cost of memory intrinsic instructions.

  /// Used when IntrinsicInst is not materialized.

  LLVM_ABI InstructionCost

  getMemIntrinsicInstrCost(const MemIntrinsicCostAttributes &MICA,

                           TTI::TargetCostKind CostKind) const;


  /// \returns The cost of Call instructions.

  LLVM_ABI InstructionCost getCallInstrCost(

      Function *F, Type *RetTy, ArrayRef<Type *> Tys,

      TTI::TargetCostKind CostKind = TTI::TCK_SizeAndLatency) const;


  /// \returns The number of pieces into which the provided type must be

  /// split during legalization. Zero is returned when the answer is unknown.

  LLVM_ABI unsigned getNumberOfParts(Type *Tp) const;


  /// \returns The cost of the address computation. For most targets this can be

  /// merged into the instruction indexing mode. Some targets might want to

  /// distinguish between address computation for memory operations with vector

  /// pointer types and scalar pointer types. Such targets should override this

  /// function. \p SE holds the pointer for the scalar evolution object which

  /// was used in order to get the Ptr step value. \p Ptr holds the SCEV of the

  /// access pointer.

  LLVM_ABI InstructionCost

  getAddressComputationCost(Type *PtrTy, ScalarEvolution *SE, const SCEV *Ptr,

                            TTI::TargetCostKind CostKind) const;


  /// \returns The cost, if any, of keeping values of the given types alive

  /// over a callsite.

  ///

  /// Some types may require the use of register classes that do not have

  /// any callee-saved registers, so would require a spill and fill.

  LLVM_ABI InstructionCost

  getCostOfKeepingLiveOverCall(ArrayRef<Type *> Tys) const;


  /// \returns True if the intrinsic is a supported memory intrinsic.  Info

  /// will contain additional information - whether the intrinsic may write

  /// or read to memory, volatility and the pointer.  Info is undefined

  /// if false is returned.

  LLVM_ABI bool getTgtMemIntrinsic(IntrinsicInst *Inst,

                                   MemIntrinsicInfo &Info) const;


  /// \returns The maximum element size, in bytes, for an element

  /// unordered-atomic memory intrinsic.

  LLVM_ABI unsigned getAtomicMemIntrinsicMaxElementSize() const;


  /// \returns A value which is the result of the given memory intrinsic. If \p

  /// CanCreate is true, new instructions may be created to extract the result

  /// from the given intrinsic memory operation. Returns nullptr if the target

  /// cannot create a result from the given intrinsic.

  LLVM_ABI Value *

  getOrCreateResultFromMemIntrinsic(IntrinsicInst *Inst, Type *ExpectedType,

                                    bool CanCreate = true) const;


  /// \returns The type to use in a loop expansion of a memcpy call.

  LLVM_ABI Type *getMemcpyLoopLoweringType(

      LLVMContext &Context, Value *Length, unsigned SrcAddrSpace,

      unsigned DestAddrSpace, Align SrcAlign, Align DestAlign,

      std::optional<uint32_t> AtomicElementSize = std::nullopt) const;


  /// \param[out] OpsOut The operand types to copy RemainingBytes of memory.

  /// \param RemainingBytes The number of bytes to copy.

  ///

  /// Calculates the operand types to use when copying \p RemainingBytes of

  /// memory, where source and destination alignments are \p SrcAlign and

  /// \p DestAlign respectively.

  LLVM_ABI void getMemcpyLoopResidualLoweringType(

      SmallVectorImpl<Type *> &OpsOut, LLVMContext &Context,

      unsigned RemainingBytes, unsigned SrcAddrSpace, unsigned DestAddrSpace,

      Align SrcAlign, Align DestAlign,

      std::optional<uint32_t> AtomicCpySize = std::nullopt) const;


  /// \returns True if the two functions have compatible attributes for inlining

  /// purposes.

  LLVM_ABI bool areInlineCompatible(const Function *Caller,

                                    const Function *Callee) const;


  /// Returns a penalty for invoking call \p Call in \p F.

  /// For example, if a function F calls a function G, which in turn calls

  /// function H, then getInlineCallPenalty(F, H()) would return the

  /// penalty of calling H from F, e.g. after inlining G into F.

  /// \p DefaultCallPenalty is passed to give a default penalty that

  /// the target can amend or override.

  LLVM_ABI unsigned getInlineCallPenalty(const Function *F,

                                         const CallBase &Call,

                                         unsigned DefaultCallPenalty) const;


  /// \returns True if the caller and callee agree on how \p Types will be

  /// passed to or returned from the callee.

  /// \param Types List of types to check.

  LLVM_ABI bool areTypesABICompatible(const Function *Caller,

                                      const Function *Callee,

                                      ArrayRef<Type *> Types) const;


  /// The kinds of load/store indexing.
  enum MemIndexedMode {
    /// No indexing.
    MIM_Unindexed,
    /// Pre-incrementing.
    MIM_PreInc,
    /// Pre-decrementing.
    MIM_PreDec,
    /// Post-incrementing.
    MIM_PostInc,
    /// Post-decrementing.
    MIM_PostDec
  };


  /// \returns True if the specified indexed load for the given type is legal.

  LLVM_ABI bool isIndexedLoadLegal(enum MemIndexedMode Mode, Type *Ty) const;


  /// \returns True if the specified indexed store for the given type is legal.

  LLVM_ABI bool isIndexedStoreLegal(enum MemIndexedMode Mode, Type *Ty) const;


  /// \returns The bitwidth of the largest vector type that should be used to

  /// load/store in the given address space.

  LLVM_ABI unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const;


  /// \returns True if the load instruction is legal to vectorize.

  LLVM_ABI bool isLegalToVectorizeLoad(LoadInst *LI) const;


  /// \returns True if the store instruction is legal to vectorize.

  LLVM_ABI bool isLegalToVectorizeStore(StoreInst *SI) const;


  /// \returns True if it is legal to vectorize the given load chain.

  LLVM_ABI bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes,

                                            Align Alignment,

                                            unsigned AddrSpace) const;


  /// \returns True if it is legal to vectorize the given store chain.

  LLVM_ABI bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes,

                                             Align Alignment,

                                             unsigned AddrSpace) const;


  /// \returns True if it is legal to vectorize the given reduction kind.

  LLVM_ABI bool isLegalToVectorizeReduction(const RecurrenceDescriptor &RdxDesc,

                                            ElementCount VF) const;


  /// \returns True if the given type is supported for scalable vectors

  LLVM_ABI bool isElementTypeLegalForScalableVector(Type *Ty) const;


  /// \returns The new vector factor value if the target doesn't support \p

  /// SizeInBytes loads or has a better vector factor.

  LLVM_ABI unsigned getLoadVectorFactor(unsigned VF, unsigned LoadSize,

                                        unsigned ChainSizeInBytes,

                                        VectorType *VecTy) const;


  /// \returns The new vector factor value if the target doesn't support \p

  /// SizeInBytes stores or has a better vector factor.

  LLVM_ABI unsigned getStoreVectorFactor(unsigned VF, unsigned StoreSize,

                                         unsigned ChainSizeInBytes,

                                         VectorType *VecTy) const;


  /// \returns True if the target prefers fixed width vectorization if the

  /// loop vectorizer's cost-model assigns an equal cost to the fixed and

  /// scalable version of the vectorized loop.

  /// \p IsEpilogue is true if the decision is for the epilogue loop.

  LLVM_ABI bool preferFixedOverScalableIfEqualCost(bool IsEpilogue) const;


  /// \returns True if target prefers SLP vectorizer with alternate opcode

  /// vectorization, false - otherwise.

  LLVM_ABI bool preferAlternateOpcodeVectorization() const;


  /// \returns True if the target prefers reductions of \p Kind to be performed

  /// in the loop.

  LLVM_ABI bool preferInLoopReduction(RecurKind Kind, Type *Ty) const;


  /// \returns True if the target prefers the reduction select kept in the loop

  /// when tail folding. i.e.

  /// loop:

  ///   p = phi (0, s)

  ///   a = add (p, x)

  ///   s = select (mask, a, p)

  /// vecreduce.add(s)

  ///

  /// As opposed to the normal scheme of p = phi (0, a) which allows the select

  /// to be pulled out of the loop. If the select(.., add, ..) can be predicated

  /// by the target, this can lead to cleaner code generation.

  LLVM_ABI bool preferPredicatedReductionSelect() const;


  /// Return true if the loop vectorizer should consider vectorizing an

  /// otherwise scalar epilogue loop.

  LLVM_ABI bool preferEpilogueVectorization() const;


  /// \returns True if the loop vectorizer should discard any VFs where the

  /// maximum register pressure exceeds getNumberOfRegisters.

  LLVM_ABI bool shouldConsiderVectorizationRegPressure() const;


  /// \returns True if the target wants to expand the given reduction intrinsic

  /// into a shuffle sequence.

  LLVM_ABI bool shouldExpandReduction(const IntrinsicInst *II) const;


  /// The shuffle sequence patterns that can be used to expand a reduction
  /// intrinsic.
  enum class ReductionShuffle {
    SplitHalf,
    Pairwise
  };


  /// \returns The shuffle sequence pattern used to expand the given reduction

  /// intrinsic.

  LLVM_ABI ReductionShuffle

  getPreferredExpandedReductionShuffle(const IntrinsicInst *II) const;


  /// \returns the size cost of rematerializing a GlobalValue address relative

  /// to a stack reload.

  LLVM_ABI unsigned getGISelRematGlobalCost() const;


  /// \returns the lower bound of a trip count to decide on vectorization

  /// while tail-folding.

  LLVM_ABI unsigned getMinTripCountTailFoldingThreshold() const;


  /// \returns True if the target supports scalable vectors.

  LLVM_ABI bool supportsScalableVectors() const;


  /// \return true when scalable vectorization is preferred.

  LLVM_ABI bool enableScalableVectorization() const;


  /// \name Vector Predication Information

  /// @{

  /// Whether the target supports the %evl parameter of VP intrinsic efficiently

  /// in hardware. (see LLVM Language Reference - "Vector Predication

  /// Intrinsics"). Use of %evl is discouraged when that is not the case.

  LLVM_ABI bool hasActiveVectorLength() const;


  /// Return true if sinking I's operands to the same basic block as I is

  /// profitable, e.g. because the operands can be folded into a target

  /// instruction during instruction selection. After calling the function

  /// \p Ops contains the Uses to sink ordered by dominance (dominating users

  /// come first).

  LLVM_ABI bool isProfitableToSinkOperands(Instruction *I,

                                           SmallVectorImpl<Use *> &Ops) const;


  /// Return true if it's significantly cheaper to shift a vector by a uniform

  /// scalar than by an amount which will vary across each lane. On x86 before

  /// AVX2 for example, there is a "psllw" instruction for the former case, but

  /// no simple instruction for a general "a << b" operation on vectors.

  /// This should also apply to lowering for vector funnel shifts (rotates).

  LLVM_ABI bool isVectorShiftByScalarCheap(Type *Ty) const;


  /// Describes how a vector-predicated operation should be transformed: one
  /// strategy for its EVL parameter and one for the operator itself.
  struct VPLegalization {
    /// The available transformation strategies.
    enum VPTransform {
      Legal = 0,   ///< Keep the predicating parameter.
      Discard = 1, ///< Where legal, discard the predicate parameter.
      Convert = 2  ///< Transform into something else that is also predicating.
    };

    /// How to transform the EVL parameter.
    ///   - Legal:   keep the EVL parameter as it is.
    ///   - Discard: ignore the EVL parameter where it is safe to do so.
    ///   - Convert: fold the EVL into the mask parameter.
    VPTransform EVLParamStrategy;

    /// How to transform the operator.
    ///   - Legal:   the target supports this operator.
    ///   - Convert: convert this to a non-VP operation.
    /// The 'Discard' strategy is invalid here.
    VPTransform OpStrategy;

    /// Build a legalization description from the two per-aspect strategies.
    VPLegalization(VPTransform EVLParamStrategy, VPTransform OpStrategy)
        : EVLParamStrategy(EVLParamStrategy), OpStrategy(OpStrategy) {}

    /// \returns True if both the EVL parameter and the operator are already
    /// legal, i.e. no transformation is required.
    bool shouldDoNothing() const {
      const bool EVLIsLegal = EVLParamStrategy == Legal;
      const bool OpIsLegal = OpStrategy == Legal;
      return EVLIsLegal && OpIsLegal;
    }
  };


  /// \returns How the target needs this vector-predicated operation to be

  /// transformed.

  LLVM_ABI VPLegalization

  getVPLegalizationStrategy(const VPIntrinsic &PI) const;

  /// @}


  /// \returns Whether a 32-bit branch instruction is available in Arm or Thumb

  /// state.

  ///

  /// Used by the LowerTypeTests pass, which constructs an IR inline assembler

  /// node containing a jump table in a format suitable for the target, so it

  /// needs to know what format of jump table it can legally use.

  ///

  /// For non-Arm targets, this function isn't used. It defaults to returning

  /// false, but it shouldn't matter what it returns anyway.

  LLVM_ABI bool hasArmWideBranch(bool Thumb) const;


  /// Returns a bitmask constructed from the target-features or fmv-features

  /// metadata of a function corresponding to its Arch Extensions.

  LLVM_ABI APInt getFeatureMask(const Function &F) const;


  /// Returns a bitmask constructed from the target-features or fmv-features

  /// metadata of a function corresponding to its FMV priority.

  LLVM_ABI APInt getPriorityMask(const Function &F) const;


  /// Returns true if this is an instance of a function with multiple versions.

  LLVM_ABI bool isMultiversionedFunction(const Function &F) const;


  /// \return The maximum number of function arguments the target supports.

  LLVM_ABI unsigned getMaxNumArgs() const;


  /// \return For an array of given Size, return alignment boundary to

  /// pad to. Default is no padding.

  LLVM_ABI unsigned getNumBytesToPadGlobalArray(unsigned Size,

                                                Type *ArrayType) const;


  /// @}


  /// Collect kernel launch bounds for \p F into \p LB.

  LLVM_ABI void collectKernelLaunchBounds(

      const Function &F,

      SmallVectorImpl<std::pair<StringRef, int64_t>> &LB) const;


  /// Returns true if GEP may be used to index into vectors for this

  /// target.

  LLVM_ABI bool allowVectorElementIndexingUsingGEP() const;


private:

  std::unique_ptr<const TargetTransformInfoImplBase> TTIImpl;

};


/// Analysis pass providing the \c TargetTransformInfo.

///

/// The core idea of the TargetIRAnalysis is to expose an interface through

/// which LLVM targets can analyze and provide information about the middle

/// end's target-independent IR. This supports use cases such as target-aware

/// cost modeling of IR constructs.

///

/// This is a function analysis because much of the cost modeling for targets

/// is done in a subtarget specific way and LLVM supports compiling different

/// functions targeting different subtargets in order to support runtime

/// dispatch according to the observed subtarget.


class TargetIRAnalysis : public AnalysisInfoMixin<TargetIRAnalysis> {
public:
  /// The result type produced by run().
  using Result = TargetTransformInfo;

  /// Default construct a target IR analysis.
  ///
  /// This will use the module's datalayout to construct a baseline
  /// conservative TTI result.
  LLVM_ABI TargetIRAnalysis();

  /// Construct an IR analysis pass around a target-provided callback.
  ///
  /// The callback will be called with a particular function for which the TTI
  /// is needed and must return a TTI object for that function.
  LLVM_ABI
  TargetIRAnalysis(std::function<Result(const Function &)> TTICallback);

  // Value semantics. TTICallback is the only non-static data member declared
  // in this class, so the defaulted member-wise operations copy/move it
  // exactly as the previous hand-written versions did. Defaulting also lets
  // the compiler deduce noexcept for the move operations.
  TargetIRAnalysis(const TargetIRAnalysis &Arg) = default;
  TargetIRAnalysis(TargetIRAnalysis &&Arg) = default;
  TargetIRAnalysis &operator=(const TargetIRAnalysis &RHS) = default;
  TargetIRAnalysis &operator=(TargetIRAnalysis &&RHS) = default;

  /// Produce the analysis result (a TargetTransformInfo) for \p F.
  ///
  /// The FunctionAnalysisManager parameter is unnamed in this declaration.
  LLVM_ABI Result run(const Function &F, FunctionAnalysisManager &);

private:
  // The mixin is a friend so that it can reach the private Key below.
  friend AnalysisInfoMixin<TargetIRAnalysis>;
  LLVM_ABI static AnalysisKey Key;

  /// The callback used to produce a result.
  ///
  /// We use a completely opaque callback so that targets can provide whatever
  /// mechanism they desire for constructing the TTI for a given function.
  ///
  /// FIXME: Should we really use std::function? It's relatively inefficient.
  /// It might be possible to arrange for even stateful callbacks to outlive
  /// the analysis and thus use a function_ref which would be lighter weight.
  /// This may also be less error prone as the callback is likely to reference
  /// the external TargetMachine, and that reference needs to never dangle.
  std::function<Result(const Function &)> TTICallback;

  /// Helper function used as the callback in the default constructor.
  static Result getDefaultTTI(const Function &F);
};


/// Wrapper pass for TargetTransformInfo.

///

/// This pass can be constructed from a TTI object which it stores internally

/// and is queried by passes.


class LLVM_ABI TargetTransformInfoWrapperPass : public ImmutablePass {
private:
  // Members keep their original declaration order.
  TargetIRAnalysis TIRA;
  // NOTE(review): presumably holds the TTI handed out by getTTI(); confirm
  // against the definition in the .cpp file.
  std::optional<TargetTransformInfo> TTI;

  virtual void anchor();

public:
  static char ID;

  /// A default constructor has to exist for the pass, but it is not meant to
  /// be used.
  ///
  /// Prefer the TargetIRAnalysis constructor below, or one of the creation
  /// routines.
  TargetTransformInfoWrapperPass();

  /// Construct the wrapper pass from a TargetIRAnalysis taken by value.
  explicit TargetTransformInfoWrapperPass(TargetIRAnalysis TIRA);

  /// Return a reference to the TargetTransformInfo for \p F.
  TargetTransformInfo &getTTI(const Function &F);
};


/// Create an analysis pass wrapper around a TTI object.

///

/// This analysis pass just holds the TTI instance and makes it available to

/// clients.

///

/// \param TIRA The TargetIRAnalysis to wrap, taken by value. Presumably it is

///        forwarded to the TargetTransformInfoWrapperPass constructor;

///        confirm against the definition.

/// \returns A pointer to the created pass, typed as ImmutablePass.

///

/// NOTE(review): ownership of the returned pointer is not visible from this

/// declaration; confirm against callers.

LLVM_ABI ImmutablePass *

createTargetTransformInfoWrapperPass(TargetIRAnalysis TIRA);


} // namespace llvm


#endif

APInt.h
This file implements a class to represent arbitrary precision integral constant values and operations...

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition ARMSLSHardening.cpp:73

ArrayRef.h

AtomicOrdering.h
Atomic ordering constants.

BitmaskEnum.h

BranchProbability.h

Info
Analysis containing CSE Info
Definition CSEInfo.cpp:27

Compiler.h

LLVM_ABI
#define LLVM_ABI
Definition Compiler.h:213

CostKind
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))

IntrinsicCostStrategy::InstructionCost
@ InstructionCost
Definition CostModel.cpp:52

VPLegalization
TargetTransformInfo::VPLegalization VPLegalization
Definition ExpandVectorPredication.cpp:33

FMF.h

ForceNestedLoop
static cl::opt< bool > ForceNestedLoop("force-nested-hardware-loop", cl::Hidden, cl::init(false), cl::desc("Force allowance of nested hardware loops"))

ForceHardwareLoopPHI
static cl::opt< bool > ForceHardwareLoopPHI("force-hardware-loop-phi", cl::Hidden, cl::init(false), cl::desc("Force hardware loop counter to be updated through a phi"))

PassManager.h
This header defines various interfaces for pass management in LLVM.

IVDescriptors.h

InlinePriorityMode::Size
@ Size
Definition InlineOrder.cpp:25

InstrTypes.h

InstructionCost.h
This file defines an InstructionCost class that is used when calculating the cost of an instruction,...

InterestingMemoryOperand.h

TemplateParamKind::Type
@ Type
Definition ItaniumDemangle.h:1243

Ops
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
Definition ItaniumDemangle.h:3370

F
#define F(x, y, z)
Definition MD5.cpp:54

I
#define I(x, y, z)
Definition MD5.cpp:57

II
uint64_t IntrinsicInst * II
Definition NVVMIntrRange.cpp:46

Pass.h

Opc
auto Opc
Definition RISCVRedundantCopyElimination.cpp:75

Mode
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))

Uniformity.h

RHS
Value * RHS
Definition X86PartialReduction.cpp:81

bool

llvm::APInt
Class for arbitrary precision integers.
Definition APInt.h:78

llvm::AllocaInst
an instruction to allocate memory on the stack
Definition Instructions.h:65

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40

llvm::ArrayType
Class to represent array types.
Definition DerivedTypes.h:398

llvm::AssumptionCache
A cache of @llvm.assume calls within a function.
Definition AssumptionCache.h:44

llvm::BasicBlock
LLVM Basic Block Representation.
Definition BasicBlock.h:62

llvm::BlockFrequencyInfo
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Definition BlockFrequencyInfo.h:38

llvm::BranchInst
Conditional or Unconditional Branch instruction.
Definition Instructions.h:3058

llvm::BranchProbability
Definition BranchProbability.h:32

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition InstrTypes.h:1114

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:676

llvm::Constant
This is an important base class in LLVM.
Definition Constant.h:43

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:164

llvm::ElementCount
Definition TypeSize.h:298

llvm::FastMathFlags
Convenience struct for specifying and reasoning about fast-math flags.
Definition FMF.h:22

llvm::Function
Definition Function.h:64

llvm::GlobalValue
Definition GlobalValue.h:49

llvm::ImmutablePass
ImmutablePass class - This class is used to provide information that does not need to be run.
Definition Pass.h:285

llvm::ImmutablePass::ImmutablePass
ImmutablePass(char &pid)
Definition Pass.h:287

llvm::InstCombiner
The core instruction combiner logic.
Definition InstCombiner.h:48

llvm::InstructionCost
Definition InstructionCost.h:30

llvm::InstructionCost::getInvalid
static InstructionCost getInvalid(CostType Val=0)
Definition InstructionCost.h:74

llvm::Instruction
Definition Instruction.h:69

llvm::Instruction::CastOps
CastOps
Definition Instruction.h:1012

llvm::IntegerType
Class to represent integer types.
Definition DerivedTypes.h:42

llvm::InterleavedAccessInfo
Drive the analysis of interleaved memory accesses in the loop.
Definition VectorUtils.h:669

llvm::IntrinsicCostAttributes
Definition TargetTransformInfo.h:181

llvm::IntrinsicCostAttributes::getFlags
FastMathFlags getFlags() const
Definition TargetTransformInfo.h:217

llvm::IntrinsicCostAttributes::getLibInfo
const TargetLibraryInfo * getLibInfo() const
Definition TargetTransformInfo.h:221

llvm::IntrinsicCostAttributes::getArgTypes
const SmallVectorImpl< Type * > & getArgTypes() const
Definition TargetTransformInfo.h:220

llvm::IntrinsicCostAttributes::getReturnType
Type * getReturnType() const
Definition TargetTransformInfo.h:216

llvm::IntrinsicCostAttributes::skipScalarizationCost
bool skipScalarizationCost() const
Definition TargetTransformInfo.h:227

llvm::IntrinsicCostAttributes::getArgs
const SmallVectorImpl< const Value * > & getArgs() const
Definition TargetTransformInfo.h:219

llvm::IntrinsicCostAttributes::IntrinsicCostAttributes
LLVM_ABI IntrinsicCostAttributes(Intrinsic::ID Id, const CallBase &CI, InstructionCost ScalarCost=InstructionCost::getInvalid(), bool TypeBasedOnly=false, TargetLibraryInfo const *LibInfo=nullptr)
Definition TargetTransformInfo.cpp:75

llvm::IntrinsicCostAttributes::getScalarizationCost
InstructionCost getScalarizationCost() const
Definition TargetTransformInfo.h:218

llvm::IntrinsicCostAttributes::getInst
const IntrinsicInst * getInst() const
Definition TargetTransformInfo.h:215

llvm::IntrinsicCostAttributes::getID
Intrinsic::ID getID() const
Definition TargetTransformInfo.h:214

llvm::IntrinsicCostAttributes::isTypeBasedOnly
bool isTypeBasedOnly() const
Definition TargetTransformInfo.h:223

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition IntrinsicInst.h:49

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68

llvm::LoadInst
An instruction for reading from memory.
Definition Instructions.h:181

llvm::LoopInfo
Definition LoopInfo.h:408

llvm::LoopVectorizationLegality
LoopVectorizationLegality checks if it is legal to vectorize a loop, and to what vectorization factor...
Definition LoopVectorizationLegality.h:261

llvm::Loop
Represents a single loop in the control flow graph.
Definition LoopInfo.h:40

llvm::MemIntrinsicCostAttributes
Information for memory intrinsic cost model.
Definition TargetTransformInfo.h:128

llvm::MemIntrinsicCostAttributes::getAlignment
Align getAlignment() const
Definition TargetTransformInfo.h:178

llvm::MemIntrinsicCostAttributes::getAddressSpace
unsigned getAddressSpace() const
Definition TargetTransformInfo.h:177

llvm::MemIntrinsicCostAttributes::getDataType
Type * getDataType() const
Definition TargetTransformInfo.h:175

llvm::MemIntrinsicCostAttributes::getPointer
const Value * getPointer() const
Definition TargetTransformInfo.h:174

llvm::MemIntrinsicCostAttributes::MemIntrinsicCostAttributes
LLVM_ABI MemIntrinsicCostAttributes(Intrinsic::ID Id, Type *DataTy, bool VariableMask, Align Alignment, const Instruction *I=nullptr)
Definition TargetTransformInfo.h:166

llvm::MemIntrinsicCostAttributes::getVariableMask
bool getVariableMask() const
Definition TargetTransformInfo.h:176

llvm::MemIntrinsicCostAttributes::MemIntrinsicCostAttributes
LLVM_ABI MemIntrinsicCostAttributes(Intrinsic::ID Id, Type *DataTy, Align Alignment, unsigned AddressSpace=0)
Definition TargetTransformInfo.h:160

llvm::MemIntrinsicCostAttributes::getID
Intrinsic::ID getID() const
Definition TargetTransformInfo.h:172

llvm::MemIntrinsicCostAttributes::getInst
const Instruction * getInst() const
Definition TargetTransformInfo.h:173

llvm::MemIntrinsicCostAttributes::MemIntrinsicCostAttributes
LLVM_ABI MemIntrinsicCostAttributes(Intrinsic::ID Id, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, const Instruction *I=nullptr)
Definition TargetTransformInfo.h:153

llvm::OptimizationRemarkEmitter
The optimization diagnostic interface.
Definition OptimizationRemarkEmitter.h:33

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition Analysis.h:112

llvm::ProfileSummaryInfo
Analysis providing profile information.
Definition ProfileSummaryInfo.h:42

llvm::RecurrenceDescriptor
The RecurrenceDescriptor is used to identify recurrences variables in a loop.
Definition IVDescriptors.h:90

llvm::SCEV
This class represents an analyzed expression in the program.
Definition ScalarEvolution.h:72

llvm::ScalarEvolution
The main scalar evolution driver.
Definition ScalarEvolution.h:457

llvm::SmallBitVector
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
Definition SmallBitVector.h:35

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition SmallVector.h:574

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1203

llvm::StackOffset
StackOffset holds a fixed and a scalable offset in bytes.
Definition TypeSize.h:30

llvm::StoreInst
An instruction for storing to memory.
Definition Instructions.h:297

llvm::SwitchInst
Multiway switch.
Definition Instructions.h:3196

llvm::TargetIRAnalysis
Analysis pass providing the TargetTransformInfo.
Definition TargetTransformInfo.h:2021

llvm::TargetIRAnalysis::TargetIRAnalysis
TargetIRAnalysis(const TargetIRAnalysis &Arg)
Definition TargetTransformInfo.h:2039

llvm::TargetIRAnalysis::operator=
TargetIRAnalysis & operator=(const TargetIRAnalysis &RHS)
Definition TargetTransformInfo.h:2043

llvm::TargetIRAnalysis::run
LLVM_ABI Result run(const Function &F, FunctionAnalysisManager &)
Definition TargetTransformInfo.cpp:1510

llvm::TargetIRAnalysis::Result
TargetTransformInfo Result
Definition TargetTransformInfo.h:2023

llvm::TargetIRAnalysis::TargetIRAnalysis
LLVM_ABI TargetIRAnalysis()
Default construct a target IR analysis.
Definition TargetTransformInfo.cpp:1504

llvm::TargetIRAnalysis::operator=
TargetIRAnalysis & operator=(TargetIRAnalysis &&RHS)
Definition TargetTransformInfo.h:2047

llvm::TargetIRAnalysis::TargetIRAnalysis
TargetIRAnalysis(TargetIRAnalysis &&Arg)
Definition TargetTransformInfo.h:2041

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition TargetLibraryInfo.h:266

llvm::TargetTransformInfoImplBase
Base class for use as a mix-in that aids implementing a TargetTransformInfo-compatible class.
Definition TargetTransformInfoImpl.h:34

llvm::TargetTransformInfoWrapperPass::TargetTransformInfoWrapperPass
TargetTransformInfoWrapperPass()
We must provide a default constructor for the pass but it should never be used.
Definition TargetTransformInfo.cpp:1529

llvm::TargetTransformInfoWrapperPass::getTTI
TargetTransformInfo & getTTI(const Function &F)
Definition TargetTransformInfo.cpp:1536

llvm::TargetTransformInfoWrapperPass::ID
static char ID
Definition TargetTransformInfo.h:2085

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition TargetTransformInfo.h:278

llvm::TargetTransformInfo::getTgtMemIntrinsic
LLVM_ABI bool getTgtMemIntrinsic(IntrinsicInst *Inst, MemIntrinsicInfo &Info) const
Definition TargetTransformInfo.cpp:1287

llvm::TargetTransformInfo::getOrCreateResultFromMemIntrinsic
LLVM_ABI Value * getOrCreateResultFromMemIntrinsic(IntrinsicInst *Inst, Type *ExpectedType, bool CanCreate=true) const
Definition TargetTransformInfo.cpp:1296

llvm::TargetTransformInfo::isLegalToVectorizeLoad
LLVM_ABI bool isLegalToVectorizeLoad(LoadInst *LI) const
Definition TargetTransformInfo.cpp:1353

llvm::TargetTransformInfo::getVScaleForTuning
LLVM_ABI std::optional< unsigned > getVScaleForTuning() const
Definition TargetTransformInfo.cpp:800

llvm::TargetTransformInfo::ReductionShuffle
ReductionShuffle
Definition TargetTransformInfo.h:1887

llvm::TargetTransformInfo::ReductionShuffle::Pairwise
@ Pairwise
Definition TargetTransformInfo.h:1887

llvm::TargetTransformInfo::ReductionShuffle::SplitHalf
@ SplitHalf
Definition TargetTransformInfo.h:1887

llvm::TargetTransformInfo::getCastContextHint
static LLVM_ABI CastContextHint getCastContextHint(const Instruction *I)
Calculates a CastContextHint from I.
Definition TargetTransformInfo.cpp:1030

llvm::TargetTransformInfo::getMaxNumArgs
LLVM_ABI unsigned getMaxNumArgs() const
Definition TargetTransformInfo.cpp:1443

llvm::TargetTransformInfo::addrspacesMayAlias
LLVM_ABI bool addrspacesMayAlias(unsigned AS0, unsigned AS1) const
Return false if an AS0 address cannot possibly alias an AS1 address.
Definition TargetTransformInfo.cpp:312

llvm::TargetTransformInfo::isLegalMaskedScatter
LLVM_ABI bool isLegalMaskedScatter(Type *DataType, Align Alignment) const
Return true if the target supports masked scatter.
Definition TargetTransformInfo.cpp:507

llvm::TargetTransformInfo::shouldBuildLookupTables
LLVM_ABI bool shouldBuildLookupTables() const
Return true if switches should be turned into lookup tables for the target.
Definition TargetTransformInfo.cpp:597

llvm::TargetTransformInfo::isLegalToVectorizeStore
LLVM_ABI bool isLegalToVectorizeStore(StoreInst *SI) const
Definition TargetTransformInfo.cpp:1357

llvm::TargetTransformInfo::getVectorInstrCost
LLVM_ABI InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index=-1, const Value *Op0=nullptr, const Value *Op1=nullptr) const
Definition TargetTransformInfo.cpp:1114

llvm::TargetTransformInfo::getMulAccReductionCost
LLVM_ABI InstructionCost getMulAccReductionCost(bool IsUnsigned, unsigned RedOpcode, Type *ResTy, VectorType *Ty, TTI::TargetCostKind CostKind=TTI::TCK_RecipThroughput) const
Calculate the cost of an extended reduction pattern, similar to getArithmeticReductionCost of an Add/...
Definition TargetTransformInfo.cpp:1275

llvm::TargetTransformInfo::areTypesABICompatible
LLVM_ABI bool areTypesABICompatible(const Function *Caller, const Function *Callee, ArrayRef< Type * > Types) const
Definition TargetTransformInfo.cpp:1333

llvm::TargetTransformInfo::enableAggressiveInterleaving
LLVM_ABI bool enableAggressiveInterleaving(bool LoopHasReductions) const
Don't restrict interleaved unrolling to small loops.
Definition TargetTransformInfo.cpp:663

llvm::TargetTransformInfo::getScalarizationOverhead
LLVM_ABI InstructionCost getScalarizationOverhead(VectorType *Ty, const APInt &DemandedElts, bool Insert, bool Extract, TTI::TargetCostKind CostKind, bool ForPoisonSrc=true, ArrayRef< Value * > VL={}) const
Estimate the overhead of scalarizing an instruction.
Definition TargetTransformInfo.cpp:638

llvm::TargetTransformInfo::isMultiversionedFunction
LLVM_ABI bool isMultiversionedFunction(const Function &F) const
Returns true if this is an instance of a function with multiple versions.
Definition TargetTransformInfo.cpp:1439

llvm::TargetTransformInfo::getInstructionUniformity
LLVM_ABI InstructionUniformity getInstructionUniformity(const Value *V) const
Get target-specific uniformity information for an instruction.
Definition TargetTransformInfo.cpp:298

llvm::TargetTransformInfo::isFCmpOrdCheaperThanFCmpZero
LLVM_ABI bool isFCmpOrdCheaperThanFCmpZero(Type *Ty) const
Return true if it is faster to check if a floating-point value is NaN (or not-NaN) versus a compariso...
Definition TargetTransformInfo.cpp:718

llvm::TargetTransformInfo::isLegalMaskedStore
LLVM_ABI bool isLegalMaskedStore(Type *DataType, Align Alignment, unsigned AddressSpace, MaskKind MaskKind=VariableOrConstantMask) const
Return true if the target supports masked store.
Definition TargetTransformInfo.cpp:468

llvm::TargetTransformInfo::supportsEfficientVectorElementLoadStore
LLVM_ABI bool supportsEfficientVectorElementLoadStore() const
If target has efficient vector element load/store instructions, it can return true here so that inser...
Definition TargetTransformInfo.cpp:651

llvm::TargetTransformInfo::getAssumedAddrSpace
LLVM_ABI unsigned getAssumedAddrSpace(const Value *V) const
Definition TargetTransformInfo.cpp:336

llvm::TargetTransformInfo::preferAlternateOpcodeVectorization
LLVM_ABI bool preferAlternateOpcodeVectorization() const
Definition TargetTransformInfo.cpp:1406

llvm::TargetTransformInfo::shouldDropLSRSolutionIfLessProfitable
LLVM_ABI bool shouldDropLSRSolutionIfLessProfitable() const
Return true if LSR should drop a found solution if it's calculated to be less profitable than the bas...
Definition TargetTransformInfo.cpp:443

llvm::TargetTransformInfo::isLSRCostLess
LLVM_ABI bool isLSRCostLess(const TargetTransformInfo::LSRCost &C1, const TargetTransformInfo::LSRCost &C2) const
Return true if LSR cost of C1 is lower than C2.
Definition TargetTransformInfo.cpp:434

llvm::TargetTransformInfo::getPrefetchDistance
LLVM_ABI unsigned getPrefetchDistance() const
Definition TargetTransformInfo.cpp:854

llvm::TargetTransformInfo::getMemcpyLoopLoweringType
LLVM_ABI Type * getMemcpyLoopLoweringType(LLVMContext &Context, Value *Length, unsigned SrcAddrSpace, unsigned DestAddrSpace, Align SrcAlign, Align DestAlign, std::optional< uint32_t > AtomicElementSize=std::nullopt) const
Definition TargetTransformInfo.cpp:1302

llvm::TargetTransformInfo::isLegalMaskedExpandLoad
LLVM_ABI bool isLegalMaskedExpandLoad(Type *DataType, Align Alignment) const
Return true if the target supports masked expand load.
Definition TargetTransformInfo.cpp:527

llvm::TargetTransformInfo::prefersVectorizedAddressing
LLVM_ABI bool prefersVectorizedAddressing() const
Return true if target doesn't mind addresses in vectors.
Definition TargetTransformInfo.cpp:562

llvm::TargetTransformInfo::getCmpSelInstrCost
LLVM_ABI InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred, TTI::TargetCostKind CostKind=TTI::TCK_RecipThroughput, OperandValueInfo Op1Info={OK_AnyValue, OP_None}, OperandValueInfo Op2Info={OK_AnyValue, OP_None}, const Instruction *I=nullptr) const
Definition TargetTransformInfo.cpp:1102

llvm::TargetTransformInfo::hasBranchDivergence
LLVM_ABI bool hasBranchDivergence(const Function *F=nullptr) const
Return true if branch divergence exists.
Definition TargetTransformInfo.cpp:293

llvm::TargetTransformInfo::enableMemCmpExpansion
LLVM_ABI MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const
Definition TargetTransformInfo.cpp:669

llvm::TargetTransformInfo::invalidate
bool invalidate(Function &, const PreservedAnalyses &, FunctionAnalysisManager::Invalidator &)
Handle the invalidation of this information.
Definition TargetTransformInfo.h:317

llvm::TargetTransformInfo::getUnrollingPreferences
LLVM_ABI void getUnrollingPreferences(Loop *L, ScalarEvolution &, UnrollingPreferences &UP, OptimizationRemarkEmitter *ORE) const
Get target-customized preferences for the generic loop unrolling transformation.
Definition TargetTransformInfo.cpp:401

llvm::TargetTransformInfo::shouldBuildLookupTablesForConstant
LLVM_ABI bool shouldBuildLookupTablesForConstant(Constant *C) const
Return true if switches should be turned into lookup tables containing this constant value for the ta...
Definition TargetTransformInfo.cpp:601

llvm::TargetTransformInfo::supportsTailCallFor
LLVM_ABI bool supportsTailCallFor(const CallBase *CB) const
If target supports tail call on CB.
Definition TargetTransformInfo.cpp:659

llvm::TargetTransformInfo::instCombineIntrinsic
LLVM_ABI std::optional< Instruction * > instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const
Targets can implement their own combinations for target-specific intrinsics.
Definition TargetTransformInfo.cpp:379

llvm::TargetTransformInfo::isProfitableLSRChainElement
LLVM_ABI bool isProfitableLSRChainElement(Instruction *I) const
Definition TargetTransformInfo.cpp:447

llvm::TargetTransformInfo::getRegisterBitWidth
LLVM_ABI TypeSize getRegisterBitWidth(RegisterKind K) const
Definition TargetTransformInfo.cpp:787

llvm::TargetTransformInfo::MaskKind
MaskKind
Some targets only support masked load/store with a constant mask.
Definition TargetTransformInfo.h:873

llvm::TargetTransformInfo::VariableOrConstantMask
@ VariableOrConstantMask
Definition TargetTransformInfo.h:874

llvm::TargetTransformInfo::ConstantMask
@ ConstantMask
Definition TargetTransformInfo.h:875

llvm::TargetTransformInfo::getInlineCallPenalty
LLVM_ABI unsigned getInlineCallPenalty(const Function *F, const CallBase &Call, unsigned DefaultCallPenalty) const
Returns a penalty for invoking call Call in F.
Definition TargetTransformInfo.cpp:1327

llvm::TargetTransformInfo::hasActiveVectorLength
LLVM_ABI bool hasActiveVectorLength() const
Definition TargetTransformInfo.cpp:1473

llvm::TargetTransformInfo::isExpensiveToSpeculativelyExecute
LLVM_ABI bool isExpensiveToSpeculativelyExecute(const Instruction *I) const
Return true if the cost of the instruction is too high to speculatively execute and should be kept be...
Definition TargetTransformInfo.cpp:713

llvm::TargetTransformInfo::preferFixedOverScalableIfEqualCost
LLVM_ABI bool preferFixedOverScalableIfEqualCost(bool IsEpilogue) const
Definition TargetTransformInfo.cpp:1396

llvm::TargetTransformInfo::isLegalMaskedGather
LLVM_ABI bool isLegalMaskedGather(Type *DataType, Align Alignment) const
Return true if the target supports masked gather.
Definition TargetTransformInfo.cpp:496

llvm::TargetTransformInfo::getMemoryOpCost
LLVM_ABI InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind=TTI::TCK_RecipThroughput, OperandValueInfo OpdInfo={OK_AnyValue, OP_None}, const Instruction *I=nullptr) const
Definition TargetTransformInfo.cpp:1179

llvm::TargetTransformInfo::getMaxVScale
LLVM_ABI std::optional< unsigned > getMaxVScale() const
Definition TargetTransformInfo.cpp:796

llvm::TargetTransformInfo::getReplicationShuffleCost
LLVM_ABI InstructionCost getReplicationShuffleCost(Type *EltTy, int ReplicationFactor, int VF, const APInt &DemandedDstElts, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfo.cpp:1170

llvm::TargetTransformInfo::allowVectorElementIndexingUsingGEP
LLVM_ABI bool allowVectorElementIndexingUsingGEP() const
Returns true if GEP should not be used to index into vectors for this target.
Definition TargetTransformInfo.cpp:1498

llvm::TargetTransformInfo::getInterleavedMemoryOpCost
LLVM_ABI InstructionCost getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind=TTI::TCK_RecipThroughput, bool UseMaskForCond=false, bool UseMaskForGaps=false) const
Definition TargetTransformInfo.cpp:1191

llvm::TargetTransformInfo::isSingleThreaded
LLVM_ABI bool isSingleThreaded() const
Definition TargetTransformInfo.cpp:340

llvm::TargetTransformInfo::simplifyDemandedVectorEltsIntrinsic
LLVM_ABI std::optional< Value * > simplifyDemandedVectorEltsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts, APInt &UndefElts2, APInt &UndefElts3, std::function< void(Instruction *, unsigned, APInt, APInt &)> SimplifyAndSetOp) const
Can be used to implement target-specific instruction combining.
Definition TargetTransformInfo.cpp:391

llvm::TargetTransformInfo::enableOrderedReductions
LLVM_ABI bool enableOrderedReductions() const
Return true if we should be enabling ordered reductions for the target.
Definition TargetTransformInfo.cpp:549

llvm::TargetTransformInfo::getInstructionCost
InstructionCost getInstructionCost(const User *U, TargetCostKind CostKind) const
This is a helper function which calls the three-argument getInstructionCost with Operands which are t...
Definition TargetTransformInfo.h:488

llvm::TargetTransformInfo::getInliningCostBenefitAnalysisProfitableMultiplier
LLVM_ABI unsigned getInliningCostBenefitAnalysisProfitableMultiplier() const
Definition TargetTransformInfo.cpp:229

llvm::TargetTransformInfo::getShuffleCost
LLVM_ABI InstructionCost getShuffleCost(ShuffleKind Kind, VectorType *DstTy, VectorType *SrcTy, ArrayRef< int > Mask={}, TTI::TargetCostKind CostKind=TTI::TCK_RecipThroughput, int Index=0, VectorType *SubTp=nullptr, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr) const
Definition TargetTransformInfo.cpp:993

llvm::TargetTransformInfo::getIntrinsicInstrCost
LLVM_ABI InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfo.cpp:1203

llvm::TargetTransformInfo::getArithmeticReductionCost
LLVM_ABI InstructionCost getArithmeticReductionCost(unsigned Opcode, VectorType *Ty, std::optional< FastMathFlags > FMF, TTI::TargetCostKind CostKind=TTI::TCK_RecipThroughput) const
Calculate the cost of vector reduction intrinsics.
Definition TargetTransformInfo.cpp:1250

llvm::TargetTransformInfo::getAtomicMemIntrinsicMaxElementSize
LLVM_ABI unsigned getAtomicMemIntrinsicMaxElementSize() const
Definition TargetTransformInfo.cpp:1292

llvm::TargetTransformInfo::getCastInstrCost
LLVM_ABI InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH, TTI::TargetCostKind CostKind=TTI::TCK_SizeAndLatency, const Instruction *I=nullptr) const
Definition TargetTransformInfo.cpp:1073

llvm::TargetTransformInfo::LSRWithInstrQueries
LLVM_ABI bool LSRWithInstrQueries() const
Return true if the loop strength reduce pass should make Instruction* based TTI queries to isLegalAdd...
Definition TargetTransformInfo.cpp:575

llvm::TargetTransformInfo::getStoreVectorFactor
LLVM_ABI unsigned getStoreVectorFactor(unsigned VF, unsigned StoreSize, unsigned ChainSizeInBytes, VectorType *VecTy) const
Definition TargetTransformInfo.cpp:1389

llvm::TargetTransformInfo::getVPLegalizationStrategy
LLVM_ABI VPLegalization getVPLegalizationStrategy(const VPIntrinsic &PI) const
Definition TargetTransformInfo.cpp:1423

llvm::TargetTransformInfo::getPartialReductionExtendKind
static LLVM_ABI PartialReductionExtendKind getPartialReductionExtendKind(Instruction *I)
Get the kind of extension that an instruction represents.
Definition TargetTransformInfo.cpp:1009

llvm::TargetTransformInfo::shouldConsiderVectorizationRegPressure
LLVM_ABI bool shouldConsiderVectorizationRegPressure() const
Definition TargetTransformInfo.cpp:1418

llvm::TargetTransformInfo::enableWritePrefetching
LLVM_ABI bool enableWritePrefetching() const
Definition TargetTransformInfo.cpp:869

llvm::TargetTransformInfo::shouldTreatInstructionLikeSelect
LLVM_ABI bool shouldTreatInstructionLikeSelect(const Instruction *I) const
Should the Select Optimization pass treat the given instruction like a select, potentially converting...
Definition TargetTransformInfo.cpp:677

llvm::TargetTransformInfo::isNoopAddrSpaceCast
LLVM_ABI bool isNoopAddrSpaceCast(unsigned FromAS, unsigned ToAS) const
Definition TargetTransformInfo.cpp:326

llvm::TargetTransformInfo::shouldMaximizeVectorBandwidth
LLVM_ABI bool shouldMaximizeVectorBandwidth(TargetTransformInfo::RegisterKind K) const
Definition TargetTransformInfo.cpp:808

llvm::TargetTransformInfo::getPreferredTailFoldingStyle
LLVM_ABI TailFoldingStyle getPreferredTailFoldingStyle(bool IVUpdateMayOverflow=true) const
Query the target what the preferred style of tail folding is.
Definition TargetTransformInfo.cpp:373

llvm::TargetTransformInfo::getGEPCost
LLVM_ABI InstructionCost getGEPCost(Type *PointeeType, const Value *Ptr, ArrayRef< const Value * > Operands, Type *AccessType=nullptr, TargetCostKind CostKind=TCK_SizeAndLatency) const
Estimate the cost of a GEP operation when lowered.
Definition TargetTransformInfo.cpp:252

llvm::TargetTransformInfo::isLegalToVectorizeStoreChain
LLVM_ABI bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes, Align Alignment, unsigned AddrSpace) const
Definition TargetTransformInfo.cpp:1367

llvm::TargetTransformInfo::isLegalInterleavedAccessType
LLVM_ABI bool isLegalInterleavedAccessType(VectorType *VTy, unsigned Factor, Align Alignment, unsigned AddrSpace) const
Return true if the target supports interleaved access for the given vector type VTy,...
Definition TargetTransformInfo.cpp:537

llvm::TargetTransformInfo::getRegUsageForType
LLVM_ABI unsigned getRegUsageForType(Type *Ty) const
Returns the estimated number of registers required to represent Ty.
Definition TargetTransformInfo.cpp:593

llvm::TargetTransformInfo::isLegalBroadcastLoad
LLVM_ABI bool isLegalBroadcastLoad(Type *ElementTy, ElementCount NumElements) const
Returns true if the target supports broadcasting a load to a vector of type <NumElements x ElementTy...
Definition TargetTransformInfo.cpp:491

llvm::TargetTransformInfo::isIndexedStoreLegal
LLVM_ABI bool isIndexedStoreLegal(enum MemIndexedMode Mode, Type *Ty) const
Definition TargetTransformInfo.cpp:1344

llvm::TargetTransformInfo::getPredicatedAddrSpace
LLVM_ABI std::pair< const Value *, unsigned > getPredicatedAddrSpace(const Value *V) const
Definition TargetTransformInfo.cpp:345

llvm::TargetTransformInfo::getExtendedReductionCost
LLVM_ABI InstructionCost getExtendedReductionCost(unsigned Opcode, bool IsUnsigned, Type *ResTy, VectorType *Ty, std::optional< FastMathFlags > FMF, TTI::TargetCostKind CostKind=TTI::TCK_RecipThroughput) const
Calculate the cost of an extended reduction pattern, similar to getArithmeticReductionCost of a reduc...
Definition TargetTransformInfo.cpp:1268

llvm::TargetTransformInfo::getLoadStoreVecRegBitWidth
LLVM_ABI unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const
Definition TargetTransformInfo.cpp:1349

llvm::TargetTransformInfo::getPreferredExpandedReductionShuffle
LLVM_ABI ReductionShuffle getPreferredExpandedReductionShuffle(const IntrinsicInst *II) const
Definition TargetTransformInfo.cpp:1452

llvm::TargetTransformInfo::getOperandInfo
static LLVM_ABI OperandValueInfo getOperandInfo(const Value *V)
Collect properties of V used in cost analysis, e.g. OP_PowerOf2.
Definition TargetTransformInfo.cpp:892

llvm::TargetTransformInfo::getRegisterClassForType
LLVM_ABI unsigned getRegisterClassForType(bool Vector, Type *Ty=nullptr) const
Definition TargetTransformInfo.cpp:778

llvm::TargetTransformInfo::isLegalAddressingMode
LLVM_ABI bool isLegalAddressingMode(Type *Ty, GlobalValue *BaseGV, int64_t BaseOffset, bool HasBaseReg, int64_t Scale, unsigned AddrSpace=0, Instruction *I=nullptr, int64_t ScalableOffset=0) const
Return true if the addressing mode represented by AM is legal for this target, for a load/store of th...
Definition TargetTransformInfo.cpp:424

llvm::TargetTransformInfo::getPopcntSupport
LLVM_ABI PopcntSupportKind getPopcntSupport(unsigned IntTyWidthInBit) const
Return hardware support for population count.
Definition TargetTransformInfo.cpp:705

llvm::TargetTransformInfo::getEstimatedNumberOfCaseClusters
LLVM_ABI unsigned getEstimatedNumberOfCaseClusters(const SwitchInst &SI, unsigned &JTSize, ProfileSummaryInfo *PSI, BlockFrequencyInfo *BFI) const
Definition TargetTransformInfo.cpp:267

llvm::TargetTransformInfo::isElementTypeLegalForScalableVector
LLVM_ABI bool isElementTypeLegalForScalableVector(Type *Ty) const
Definition TargetTransformInfo.cpp:1378

llvm::TargetTransformInfo::forceScalarizeMaskedGather
LLVM_ABI bool forceScalarizeMaskedGather(VectorType *Type, Align Alignment) const
Return true if the target forces scalarizing of llvm.masked.gather intrinsics.
Definition TargetTransformInfo.cpp:512

llvm::TargetTransformInfo::getMaxPrefetchIterationsAhead
LLVM_ABI unsigned getMaxPrefetchIterationsAhead() const
Definition TargetTransformInfo.cpp:865

llvm::TargetTransformInfo::canHaveNonUndefGlobalInitializerInAddressSpace
LLVM_ABI bool canHaveNonUndefGlobalInitializerInAddressSpace(unsigned AS) const
Return true if globals in this address space can have initializers other than undef.
Definition TargetTransformInfo.cpp:331

llvm::TargetTransformInfo::getMinimumVF
LLVM_ABI ElementCount getMinimumVF(unsigned ElemWidth, bool IsScalable) const
Definition TargetTransformInfo.cpp:813

llvm::TargetTransformInfo::getIntImmCostIntrin
LLVM_ABI InstructionCost getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx, const APInt &Imm, Type *Ty, TargetCostKind CostKind) const
Definition TargetTransformInfo.cpp:755

llvm::TargetTransformInfo::enableMaskedInterleavedAccessVectorization
LLVM_ABI bool enableMaskedInterleavedAccessVectorization() const
Enable matching of interleaved access groups that contain predicated accesses or gaps and therefore v...
Definition TargetTransformInfo.cpp:686

llvm::TargetTransformInfo::getIntImmCostInst
LLVM_ABI InstructionCost getIntImmCostInst(unsigned Opc, unsigned Idx, const APInt &Imm, Type *Ty, TargetCostKind CostKind, Instruction *Inst=nullptr) const
Return the expected cost of materialization for the given integer immediate of the specified type for...
Definition TargetTransformInfo.cpp:745

llvm::TargetTransformInfo::isLegalStridedLoadStore
LLVM_ABI bool isLegalStridedLoadStore(Type *DataType, Align Alignment) const
Return true if the target supports strided load.
Definition TargetTransformInfo.cpp:532

llvm::TargetTransformInfo::operator=
LLVM_ABI TargetTransformInfo & operator=(TargetTransformInfo &&RHS)
Definition TargetTransformInfo.cpp:214

llvm::TargetTransformInfo::getMinMaxReductionCost
LLVM_ABI InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *Ty, FastMathFlags FMF=FastMathFlags(), TTI::TargetCostKind CostKind=TTI::TCK_RecipThroughput) const
Definition TargetTransformInfo.cpp:1259

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition TargetTransformInfo.h:333

llvm::TargetTransformInfo::TCK_RecipThroughput
@ TCK_RecipThroughput
Reciprocal throughput.
Definition TargetTransformInfo.h:334

llvm::TargetTransformInfo::TCK_CodeSize
@ TCK_CodeSize
Instruction code size.
Definition TargetTransformInfo.h:336

llvm::TargetTransformInfo::TCK_SizeAndLatency
@ TCK_SizeAndLatency
The weighted sum of size and latency.
Definition TargetTransformInfo.h:337

llvm::TargetTransformInfo::TCK_Latency
@ TCK_Latency
The latency of instruction.
Definition TargetTransformInfo.h:335

llvm::TargetTransformInfo::getArithmeticInstrCost
LLVM_ABI InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind=TTI::TCK_RecipThroughput, TTI::OperandValueInfo Opd1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Opd2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr, const TargetLibraryInfo *TLibInfo=nullptr) const
This is an approximation of reciprocal throughput of a math/logic op.
Definition TargetTransformInfo.cpp:957

llvm::TargetTransformInfo::enableSelectOptimize
LLVM_ABI bool enableSelectOptimize() const
Should the Select Optimization pass be enabled and run.
Definition TargetTransformInfo.cpp:673

llvm::TargetTransformInfo::collectFlatAddressOperands
LLVM_ABI bool collectFlatAddressOperands(SmallVectorImpl< int > &OpIndexes, Intrinsic::ID IID) const
Return any intrinsic address operand indexes which may be rewritten if they use a flat address space ...
Definition TargetTransformInfo.cpp:321

llvm::TargetTransformInfo::OperandValueProperties
OperandValueProperties
Additional properties of an operand's values.
Definition TargetTransformInfo.h:1228

llvm::TargetTransformInfo::OP_NegatedPowerOf2
@ OP_NegatedPowerOf2
Definition TargetTransformInfo.h:1231

llvm::TargetTransformInfo::OP_None
@ OP_None
Definition TargetTransformInfo.h:1229

llvm::TargetTransformInfo::OP_PowerOf2
@ OP_PowerOf2
Definition TargetTransformInfo.h:1230

llvm::TargetTransformInfo::getInliningLastCallToStaticBonus
LLVM_ABI int getInliningLastCallToStaticBonus() const
Definition TargetTransformInfo.cpp:234

llvm::TargetTransformInfo::getPointersChainCost
LLVM_ABI InstructionCost getPointersChainCost(ArrayRef< const Value * > Ptrs, const Value *Base, const PointersChainInfo &Info, Type *AccessTy, TargetCostKind CostKind=TTI::TCK_RecipThroughput) const
Estimate the cost of a chain of pointers (typically pointer operands of a chain of loads or stores wi...
Definition TargetTransformInfo.cpp:258

llvm::TargetTransformInfo::isVScaleKnownToBeAPowerOfTwo
LLVM_ABI bool isVScaleKnownToBeAPowerOfTwo() const
Definition TargetTransformInfo.cpp:804

llvm::TargetTransformInfo::isIndexedLoadLegal
LLVM_ABI bool isIndexedLoadLegal(enum MemIndexedMode Mode, Type *Ty) const
Definition TargetTransformInfo.cpp:1339

llvm::TargetTransformInfo::getMaximumVF
LLVM_ABI unsigned getMaximumVF(unsigned ElemWidth, unsigned Opcode) const
Definition TargetTransformInfo.cpp:818

llvm::TargetTransformInfo::isLegalICmpImmediate
LLVM_ABI bool isLegalICmpImmediate(int64_t Imm) const
Return true if the specified immediate is legal icmp immediate, that is the target has icmp instructi...
Definition TargetTransformInfo.cpp:420

llvm::TargetTransformInfo::isTypeLegal
LLVM_ABI bool isTypeLegal(Type *Ty) const
Return true if this type is legal.
Definition TargetTransformInfo.cpp:589

llvm::TargetTransformInfo::requiresOrderedReduction
static bool requiresOrderedReduction(std::optional< FastMathFlags > FMF)
A helper function to determine the type of reduction algorithm used for a given Opcode and set of Fas...
Definition TargetTransformInfo.h:1640

llvm::TargetTransformInfo::isLegalToVectorizeReduction
LLVM_ABI bool isLegalToVectorizeReduction(const RecurrenceDescriptor &RdxDesc, ElementCount VF) const
Definition TargetTransformInfo.cpp:1373

llvm::TargetTransformInfo::getCacheAssociativity
LLVM_ABI std::optional< unsigned > getCacheAssociativity(CacheLevel Level) const
Definition TargetTransformInfo.cpp:845

llvm::TargetTransformInfo::isLegalNTLoad
LLVM_ABI bool isLegalNTLoad(Type *DataType, Align Alignment) const
Return true if the target supports nontemporal load.
Definition TargetTransformInfo.cpp:487

llvm::TargetTransformInfo::getMemcpyCost
LLVM_ABI InstructionCost getMemcpyCost(const Instruction *I) const
Definition TargetTransformInfo.cpp:1240

llvm::TargetTransformInfo::adjustInliningThreshold
LLVM_ABI unsigned adjustInliningThreshold(const CallBase *CB) const
Definition TargetTransformInfo.cpp:239

llvm::TargetTransformInfo::isLegalAddImmediate
LLVM_ABI bool isLegalAddImmediate(int64_t Imm) const
Return true if the specified immediate is legal add immediate, that is the target has add instruction...
Definition TargetTransformInfo.cpp:412

llvm::TargetTransformInfo::isTargetIntrinsicWithStructReturnOverloadAtField
LLVM_ABI bool isTargetIntrinsicWithStructReturnOverloadAtField(Intrinsic::ID ID, int RetIdx) const
Identifies if the vector form of the intrinsic that returns a struct is overloaded at the struct elem...
Definition TargetTransformInfo.cpp:633

llvm::TargetTransformInfo::getLoadVectorFactor
LLVM_ABI unsigned getLoadVectorFactor(unsigned VF, unsigned LoadSize, unsigned ChainSizeInBytes, VectorType *VecTy) const
Definition TargetTransformInfo.cpp:1382

llvm::TargetTransformInfo::getMemIntrinsicInstrCost
LLVM_ABI InstructionCost getMemIntrinsicInstrCost(const MemIntrinsicCostAttributes &MICA, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfo.cpp:1210

llvm::TargetTransformInfo::canSaveCmp
LLVM_ABI bool canSaveCmp(Loop *L, BranchInst **BI, ScalarEvolution *SE, LoopInfo *LI, DominatorTree *DT, AssumptionCache *AC, TargetLibraryInfo *LibInfo) const
Return true if the target can save a compare for loop count, for example hardware loop saves a compar...
Definition TargetTransformInfo.cpp:455

llvm::TargetTransformInfo::isTargetIntrinsicTriviallyScalarizable
LLVM_ABI bool isTargetIntrinsicTriviallyScalarizable(Intrinsic::ID ID) const
Definition TargetTransformInfo.cpp:618

llvm::TargetTransformInfo::rewriteIntrinsicWithAddressSpace
LLVM_ABI Value * rewriteIntrinsicWithAddressSpace(IntrinsicInst *II, Value *OldV, Value *NewV) const
Rewrite intrinsic call II such that OldV will be replaced with NewV, which has a different address sp...
Definition TargetTransformInfo.cpp:349

llvm::TargetTransformInfo::getCostOfKeepingLiveOverCall
LLVM_ABI InstructionCost getCostOfKeepingLiveOverCall(ArrayRef< Type * > Tys) const
Definition TargetTransformInfo.cpp:1283

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition TargetTransformInfo.h:1283

llvm::TargetTransformInfo::RGK_FixedWidthVector
@ RGK_FixedWidthVector
Definition TargetTransformInfo.h:1283

llvm::TargetTransformInfo::RGK_ScalableVector
@ RGK_ScalableVector
Definition TargetTransformInfo.h:1283

llvm::TargetTransformInfo::RGK_Scalar
@ RGK_Scalar
Definition TargetTransformInfo.h:1283

llvm::TargetTransformInfo::getMinPrefetchStride
LLVM_ABI unsigned getMinPrefetchStride(unsigned NumMemAccesses, unsigned NumStridedMemAccesses, unsigned NumPrefetches, bool HasCall) const
Some HW prefetchers can handle accesses up to a certain constant stride.
Definition TargetTransformInfo.cpp:858

llvm::TargetTransformInfo::shouldPrefetchAddressSpace
LLVM_ABI bool shouldPrefetchAddressSpace(unsigned AS) const
Definition TargetTransformInfo.cpp:873

llvm::TargetTransformInfo::getIntImmCost
LLVM_ABI InstructionCost getIntImmCost(const APInt &Imm, Type *Ty, TargetCostKind CostKind) const
Return the expected cost of materializing the given integer immediate of the specified type.
Definition TargetTransformInfo.cpp:738

llvm::TargetTransformInfo::getMinVectorRegisterBitWidth
LLVM_ABI unsigned getMinVectorRegisterBitWidth() const
Definition TargetTransformInfo.cpp:792

llvm::TargetTransformInfo::getAddressComputationCost
LLVM_ABI InstructionCost getAddressComputationCost(Type *PtrTy, ScalarEvolution *SE, const SCEV *Ptr, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfo.cpp:1231

llvm::TargetTransformInfo::isLegalNTStore
LLVM_ABI bool isLegalNTStore(Type *DataType, Align Alignment) const
Return true if the target supports nontemporal store.
Definition TargetTransformInfo.cpp:482

llvm::TargetTransformInfo::getPartialReductionCost
LLVM_ABI InstructionCost getPartialReductionCost(unsigned Opcode, Type *InputTypeA, Type *InputTypeB, Type *AccumType, ElementCount VF, PartialReductionExtendKind OpAExtend, PartialReductionExtendKind OpBExtend, std::optional< unsigned > BinOp, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfo.cpp:877

llvm::TargetTransformInfo::getFlatAddressSpace
LLVM_ABI unsigned getFlatAddressSpace() const
Returns the address space ID for a target's 'flat' address space.
Definition TargetTransformInfo.cpp:317

llvm::TargetTransformInfo::preferToKeepConstantsAttached
LLVM_ABI bool preferToKeepConstantsAttached(const Instruction &Inst, const Function &Fn) const
It can be advantageous to detach complex constants from their uses to make their generation cheaper.
Definition TargetTransformInfo.cpp:764

llvm::TargetTransformInfo::hasArmWideBranch
LLVM_ABI bool hasArmWideBranch(bool Thumb) const
Definition TargetTransformInfo.cpp:1427

llvm::TargetTransformInfo::getRegisterClassName
LLVM_ABI const char * getRegisterClassName(unsigned ClassID) const
Definition TargetTransformInfo.cpp:783

llvm::TargetTransformInfo::preferEpilogueVectorization
LLVM_ABI bool preferEpilogueVectorization() const
Return true if the loop vectorizer should consider vectorizing an otherwise scalar epilogue loop.
Definition TargetTransformInfo.cpp:1414

llvm::TargetTransformInfo::shouldConsiderAddressTypePromotion
LLVM_ABI bool shouldConsiderAddressTypePromotion(const Instruction &I, bool &AllowPromotionWithoutCommonHeader) const
Definition TargetTransformInfo.cpp:828

llvm::TargetTransformInfo::useAA
LLVM_ABI bool useAA() const
Definition TargetTransformInfo.cpp:587

llvm::TargetTransformInfo::getPriorityMask
LLVM_ABI APInt getPriorityMask(const Function &F) const
Returns a bitmask constructed from the target-features or fmv-features metadata of a function corresp...
Definition TargetTransformInfo.cpp:1435

llvm::TargetTransformInfo::getPredictableBranchThreshold
LLVM_ABI BranchProbability getPredictableBranchThreshold() const
If a branch or a select condition is skewed in one direction by more than this factor,...
Definition TargetTransformInfo.cpp:283

llvm::TargetTransformInfo::TargetTransformInfo
LLVM_ABI TargetTransformInfo(std::unique_ptr< const TargetTransformInfoImplBase > Impl)
Construct a TTI object using a type implementing the Concept API below.
Definition TargetTransformInfo.cpp:61

llvm::TargetTransformInfo::preferInLoopReduction
LLVM_ABI bool preferInLoopReduction(RecurKind Kind, Type *Ty) const
Definition TargetTransformInfo.cpp:1401

llvm::TargetTransformInfo::getCallerAllocaCost
LLVM_ABI unsigned getCallerAllocaCost(const CallBase *CB, const AllocaInst *AI) const
Definition TargetTransformInfo.cpp:243

llvm::TargetTransformInfo::hasConditionalLoadStoreForType
LLVM_ABI bool hasConditionalLoadStoreForType(Type *Ty, bool IsStore) const
Definition TargetTransformInfo.cpp:773

llvm::TargetTransformInfo::getCacheLineSize
LLVM_ABI unsigned getCacheLineSize() const
Definition TargetTransformInfo.cpp:834

llvm::TargetTransformInfo::allowsMisalignedMemoryAccesses
LLVM_ABI bool allowsMisalignedMemoryAccesses(LLVMContext &Context, unsigned BitWidth, unsigned AddressSpace=0, Align Alignment=Align(1), unsigned *Fast=nullptr) const
Determine if the target supports unaligned memory accesses.
Definition TargetTransformInfo.cpp:695

llvm::TargetTransformInfo::getInlinerVectorBonusPercent
LLVM_ABI int getInlinerVectorBonusPercent() const
Definition TargetTransformInfo.cpp:248

llvm::TargetTransformInfo::getEpilogueVectorizationMinVF
LLVM_ABI unsigned getEpilogueVectorizationMinVF() const
Definition TargetTransformInfo.cpp:364

llvm::TargetTransformInfo::collectKernelLaunchBounds
LLVM_ABI void collectKernelLaunchBounds(const Function &F, SmallVectorImpl< std::pair< StringRef, int64_t > > &LB) const
Collect kernel launch bounds for F into LB.
Definition TargetTransformInfo.cpp:1492

llvm::TargetTransformInfo::PopcntSupportKind
PopcntSupportKind
Flags indicating the kind of support for population count.
Definition TargetTransformInfo.h:797

llvm::TargetTransformInfo::PSK_SlowHardware
@ PSK_SlowHardware
Definition TargetTransformInfo.h:797

llvm::TargetTransformInfo::PSK_Software
@ PSK_Software
Definition TargetTransformInfo.h:797

llvm::TargetTransformInfo::PSK_FastHardware
@ PSK_FastHardware
Definition TargetTransformInfo.h:797

llvm::TargetTransformInfo::preferPredicatedReductionSelect
LLVM_ABI bool preferPredicatedReductionSelect() const
Definition TargetTransformInfo.cpp:1410

llvm::TargetTransformInfo::getIntImmCodeSizeCost
LLVM_ABI InstructionCost getIntImmCodeSizeCost(unsigned Opc, unsigned Idx, const APInt &Imm, Type *Ty) const
Return the expected cost for the given integer when optimising for size.
Definition TargetTransformInfo.cpp:728

llvm::TargetTransformInfo::getPreferredAddressingMode
LLVM_ABI AddressingModeKind getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const
Return the preferred addressing mode LSR should make efforts to generate.
Definition TargetTransformInfo.cpp:463

llvm::TargetTransformInfo::isLoweredToCall
LLVM_ABI bool isLoweredToCall(const Function *F) const
Test whether calls to a function lower to actual program function calls.
Definition TargetTransformInfo.cpp:354

llvm::TargetTransformInfo::isLegalToVectorizeLoadChain
LLVM_ABI bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes, Align Alignment, unsigned AddrSpace) const
Definition TargetTransformInfo.cpp:1361

llvm::TargetTransformInfo::isHardwareLoopProfitable
LLVM_ABI bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE, AssumptionCache &AC, TargetLibraryInfo *LibInfo, HardwareLoopInfo &HWLoopInfo) const
Query the target whether it would be profitable to convert the given loop into a hardware loop.
Definition TargetTransformInfo.cpp:358

llvm::TargetTransformInfo::getInliningThresholdMultiplier
LLVM_ABI unsigned getInliningThresholdMultiplier() const
Definition TargetTransformInfo.cpp:219

llvm::TargetTransformInfo::getBranchMispredictPenalty
LLVM_ABI InstructionCost getBranchMispredictPenalty() const
Returns estimated penalty of a branch misprediction in latency.
Definition TargetTransformInfo.cpp:289

llvm::TargetTransformInfo::getNumberOfRegisters
LLVM_ABI unsigned getNumberOfRegisters(unsigned ClassID) const
Definition TargetTransformInfo.cpp:769

llvm::TargetTransformInfo::isLegalAltInstr
LLVM_ABI bool isLegalAltInstr(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1, const SmallBitVector &OpcodeMask) const
Return true if this is an alternating opcode pattern that can be lowered to a single instruction on t...
Definition TargetTransformInfo.cpp:501

llvm::TargetTransformInfo::isProfitableToHoist
LLVM_ABI bool isProfitableToHoist(Instruction *I) const
Return true if it is profitable to hoist an instruction in the then/else block to before the if.
Definition TargetTransformInfo.cpp:583

llvm::TargetTransformInfo::supportsScalableVectors
LLVM_ABI bool supportsScalableVectors() const
Definition TargetTransformInfo.cpp:1465

llvm::TargetTransformInfo::hasVolatileVariant
LLVM_ABI bool hasVolatileVariant(Instruction *I, unsigned AddrSpace) const
Return true if the given instruction (assumed to be a memory access instruction) has a volatile varia...
Definition TargetTransformInfo.cpp:557

llvm::TargetTransformInfo::isLegalMaskedCompressStore
LLVM_ABI bool isLegalMaskedCompressStore(Type *DataType, Align Alignment) const
Return true if the target supports masked compress store.
Definition TargetTransformInfo.cpp:522

llvm::TargetTransformInfo::getMinPageSize
LLVM_ABI std::optional< unsigned > getMinPageSize() const
Definition TargetTransformInfo.cpp:849

llvm::TargetTransformInfo::isFPVectorizationPotentiallyUnsafe
LLVM_ABI bool isFPVectorizationPotentiallyUnsafe() const
Indicate that it is potentially unsafe to automatically vectorize floating-point operations because t...
Definition TargetTransformInfo.cpp:690

llvm::TargetTransformInfo::getInsertExtractValueCost
LLVM_ABI InstructionCost getInsertExtractValueCost(unsigned Opcode, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfo.cpp:1160

llvm::TargetTransformInfo::shouldBuildRelLookupTables
LLVM_ABI bool shouldBuildRelLookupTables() const
Return true if lookup tables should be turned into relative lookup tables.
Definition TargetTransformInfo.cpp:606

llvm::TargetTransformInfo::PartialReductionExtendKind
PartialReductionExtendKind
Definition TargetTransformInfo.h:280

llvm::TargetTransformInfo::PR_SignExtend
@ PR_SignExtend
Definition TargetTransformInfo.h:280

llvm::TargetTransformInfo::PR_ZeroExtend
@ PR_ZeroExtend
Definition TargetTransformInfo.h:280

llvm::TargetTransformInfo::PR_None
@ PR_None
Definition TargetTransformInfo.h:280

llvm::TargetTransformInfo::getStoreMinimumVF
LLVM_ABI unsigned getStoreMinimumVF(unsigned VF, Type *ScalarMemTy, Type *ScalarValTy) const
Definition TargetTransformInfo.cpp:823

llvm::TargetTransformInfo::getCacheSize
LLVM_ABI std::optional< unsigned > getCacheSize(CacheLevel Level) const
Definition TargetTransformInfo.cpp:840

llvm::TargetTransformInfo::simplifyDemandedUseBitsIntrinsic
LLVM_ABI std::optional< Value * > simplifyDemandedUseBitsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedMask, KnownBits &Known, bool &KnownBitsComputed) const
Can be used to implement target-specific instruction combining.
Definition TargetTransformInfo.cpp:384

llvm::TargetTransformInfo::isLegalAddScalableImmediate
LLVM_ABI bool isLegalAddScalableImmediate(int64_t Imm) const
Return true if adding the specified scalable immediate is legal, that is the target has add instructi...
Definition TargetTransformInfo.cpp:416

llvm::TargetTransformInfo::isTargetIntrinsicWithScalarOpAtArg
LLVM_ABI bool isTargetIntrinsicWithScalarOpAtArg(Intrinsic::ID ID, unsigned ScalarOpdIdx) const
Identifies if the vector form of the intrinsic has a scalar operand.
Definition TargetTransformInfo.cpp:623

llvm::TargetTransformInfo::hasDivRemOp
LLVM_ABI bool hasDivRemOp(Type *DataType, bool IsSigned) const
Return true if the target has a unified operation to calculate division and remainder.
Definition TargetTransformInfo.cpp:553

llvm::TargetTransformInfo::getAltInstrCost
LLVM_ABI InstructionCost getAltInstrCost(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1, const SmallBitVector &OpcodeMask, TTI::TargetCostKind CostKind=TTI::TCK_RecipThroughput) const
Returns the cost estimation for alternating opcode pattern that can be lowered to a single instructio...
Definition TargetTransformInfo.cpp:984

llvm::TargetTransformInfo::TargetCostConstants
TargetCostConstants
Underlying constants for 'cost' values in this interface.
Definition TargetTransformInfo.h:358

llvm::TargetTransformInfo::TCC_Expensive
@ TCC_Expensive
The cost of a 'div' instruction on x86.
Definition TargetTransformInfo.h:361

llvm::TargetTransformInfo::TCC_Free
@ TCC_Free
Expected to fold away in lowering.
Definition TargetTransformInfo.h:359

llvm::TargetTransformInfo::TCC_Basic
@ TCC_Basic
The cost of a typical 'add' instruction.
Definition TargetTransformInfo.h:360

llvm::TargetTransformInfo::enableInterleavedAccessVectorization
LLVM_ABI bool enableInterleavedAccessVectorization() const
Enable matching of interleaved access groups.
Definition TargetTransformInfo.cpp:682

llvm::TargetTransformInfo::getMinTripCountTailFoldingThreshold
LLVM_ABI unsigned getMinTripCountTailFoldingThreshold() const
Definition TargetTransformInfo.cpp:1461

llvm::TargetTransformInfo::getInstructionCost
LLVM_ABI InstructionCost getInstructionCost(const User *U, ArrayRef< const Value * > Operands, TargetCostKind CostKind) const
Estimate the cost of a given IR user when lowered.
Definition TargetTransformInfo.cpp:274

llvm::TargetTransformInfo::getMaxInterleaveFactor
LLVM_ABI unsigned getMaxInterleaveFactor(ElementCount VF) const
Definition TargetTransformInfo.cpp:887

llvm::TargetTransformInfo::enableScalableVectorization
LLVM_ABI bool enableScalableVectorization() const
Definition TargetTransformInfo.cpp:1469

llvm::TargetTransformInfo::useFastCCForInternalCall
LLVM_ABI bool useFastCCForInternalCall(Function &F) const
Return true if the input function, which is internal, should use the fastcc calling convention.
Definition TargetTransformInfo.cpp:614

llvm::TargetTransformInfo::isVectorShiftByScalarCheap
LLVM_ABI bool isVectorShiftByScalarCheap(Type *Ty) const
Return true if it's significantly cheaper to shift a vector by a uniform scalar than by an amount whi...
Definition TargetTransformInfo.cpp:1482

llvm::TargetTransformInfo::isNumRegsMajorCostOfLSR
LLVM_ABI bool isNumRegsMajorCostOfLSR() const
Return true if LSR major cost is number of registers.
Definition TargetTransformInfo.cpp:439

llvm::TargetTransformInfo::getInliningCostBenefitAnalysisSavingsMultiplier
LLVM_ABI unsigned getInliningCostBenefitAnalysisSavingsMultiplier() const
Definition TargetTransformInfo.cpp:224

llvm::TargetTransformInfo::isLegalMaskedVectorHistogram
LLVM_ABI bool isLegalMaskedVectorHistogram(Type *AddrType, Type *DataType) const
Definition TargetTransformInfo.cpp:544

llvm::TargetTransformInfo::getGISelRematGlobalCost
LLVM_ABI unsigned getGISelRematGlobalCost() const
Definition TargetTransformInfo.cpp:1457

llvm::TargetTransformInfo::getNumBytesToPadGlobalArray
LLVM_ABI unsigned getNumBytesToPadGlobalArray(unsigned Size, Type *ArrayType) const
Definition TargetTransformInfo.cpp:1487

llvm::TargetTransformInfo::MemIndexedMode
MemIndexedMode
The type of load/store indexing.
Definition TargetTransformInfo.h:1795

llvm::TargetTransformInfo::MIM_Unindexed
@ MIM_Unindexed
No indexing.
Definition TargetTransformInfo.h:1796

llvm::TargetTransformInfo::MIM_PostInc
@ MIM_PostInc
Post-incrementing.
Definition TargetTransformInfo.h:1799

llvm::TargetTransformInfo::MIM_PostDec
@ MIM_PostDec
Post-decrementing.
Definition TargetTransformInfo.h:1800

llvm::TargetTransformInfo::MIM_PreDec
@ MIM_PreDec
Pre-decrementing.
Definition TargetTransformInfo.h:1798

llvm::TargetTransformInfo::MIM_PreInc
@ MIM_PreInc
Pre-incrementing.
Definition TargetTransformInfo.h:1797

llvm::TargetTransformInfo::isLegalMaskedLoad
LLVM_ABI bool isLegalMaskedLoad(Type *DataType, Align Alignment, unsigned AddressSpace, MaskKind MaskKind=VariableOrConstantMask) const
Return true if the target supports masked load.
Definition TargetTransformInfo.cpp:475

llvm::TargetTransformInfo::getIndexedVectorInstrCostFromEnd
LLVM_ABI InstructionCost getIndexedVectorInstrCostFromEnd(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index) const
Definition TargetTransformInfo.cpp:1151

llvm::TargetTransformInfo::areInlineCompatible
LLVM_ABI bool areInlineCompatible(const Function *Caller, const Function *Callee) const
Definition TargetTransformInfo.cpp:1321

llvm::TargetTransformInfo::useColdCCForColdCall
LLVM_ABI bool useColdCCForColdCall(Function &F) const
Return true if the input function which is cold at all call sites, should use coldcc calling conventi...
Definition TargetTransformInfo.cpp:610

llvm::TargetTransformInfo::getFPOpCost
LLVM_ABI InstructionCost getFPOpCost(Type *Ty) const
Return the expected cost of supporting the floating point operation of the specified type.
Definition TargetTransformInfo.cpp:722

llvm::TargetTransformInfo::supportsTailCalls
LLVM_ABI bool supportsTailCalls() const
If the target supports tail calls.
Definition TargetTransformInfo.cpp:655

llvm::TargetTransformInfo::canMacroFuseCmp
LLVM_ABI bool canMacroFuseCmp() const
Return true if the target can fuse a compare and branch.
Definition TargetTransformInfo.cpp:451

llvm::TargetTransformInfo::isValidAddrSpaceCast
LLVM_ABI bool isValidAddrSpaceCast(unsigned FromAS, unsigned ToAS) const
Query the target whether the specified address space cast from FromAS to ToAS is valid.
Definition TargetTransformInfo.cpp:307

llvm::TargetTransformInfo::getNumberOfParts
LLVM_ABI unsigned getNumberOfParts(Type *Tp) const
Definition TargetTransformInfo.cpp:1227

llvm::TargetTransformInfo::getOperandsScalarizationOverhead
LLVM_ABI InstructionCost getOperandsScalarizationOverhead(ArrayRef< Type * > Tys, TTI::TargetCostKind CostKind) const
Estimate the overhead of scalarizing operands with the given types.
Definition TargetTransformInfo.cpp:646

llvm::TargetTransformInfo::AddressingModeKind
AddressingModeKind
Which addressing mode Loop Strength Reduction will try to generate.
Definition TargetTransformInfo.h:860

llvm::TargetTransformInfo::AMK_PostIndexed
@ AMK_PostIndexed
Prefer post-indexed addressing mode.
Definition TargetTransformInfo.h:863

llvm::TargetTransformInfo::AMK_All
@ AMK_All
Consider all addressing modes.
Definition TargetTransformInfo.h:864

llvm::TargetTransformInfo::AMK_PreIndexed
@ AMK_PreIndexed
Prefer pre-indexed addressing mode.
Definition TargetTransformInfo.h:862

llvm::TargetTransformInfo::AMK_None
@ AMK_None
Don't prefer any addressing mode.
Definition TargetTransformInfo.h:861

llvm::TargetTransformInfo::getScalingFactorCost
LLVM_ABI InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV, StackOffset BaseOffset, bool HasBaseReg, int64_t Scale, unsigned AddrSpace=0) const
Return the cost of the scaling factor used in the addressing mode represented by AM for this target,...
Definition TargetTransformInfo.cpp:566

llvm::TargetTransformInfo::isTruncateFree
LLVM_ABI bool isTruncateFree(Type *Ty1, Type *Ty2) const
Return true if it's free to truncate a value of type Ty1 to type Ty2.
Definition TargetTransformInfo.cpp:579

llvm::TargetTransformInfo::isProfitableToSinkOperands
LLVM_ABI bool isProfitableToSinkOperands(Instruction *I, SmallVectorImpl< Use * > &Ops) const
Return true if sinking I's operands to the same basic block as I is profitable, e....
Definition TargetTransformInfo.cpp:1477

llvm::TargetTransformInfo::getMemcpyLoopResidualLoweringType
LLVM_ABI void getMemcpyLoopResidualLoweringType(SmallVectorImpl< Type * > &OpsOut, LLVMContext &Context, unsigned RemainingBytes, unsigned SrcAddrSpace, unsigned DestAddrSpace, Align SrcAlign, Align DestAlign, std::optional< uint32_t > AtomicCpySize=std::nullopt) const
Definition TargetTransformInfo.cpp:1311

llvm::TargetTransformInfo::preferPredicateOverEpilogue
LLVM_ABI bool preferPredicateOverEpilogue(TailFoldingInfo *TFI) const
Query the target whether it would be preferred to create a predicated vector loop, which can avoid the...
Definition TargetTransformInfo.cpp:368

llvm::TargetTransformInfo::forceScalarizeMaskedScatter
LLVM_ABI bool forceScalarizeMaskedScatter(VectorType *Type, Align Alignment) const
Return true if the target forces scalarizing of llvm.masked.scatter intrinsics.
Definition TargetTransformInfo.cpp:517

llvm::TargetTransformInfo::isTargetIntrinsicWithOverloadTypeAtArg
LLVM_ABI bool isTargetIntrinsicWithOverloadTypeAtArg(Intrinsic::ID ID, int OpdIdx) const
Identifies if the vector form of the intrinsic is overloaded on the type of the operand at index OpdI...
Definition TargetTransformInfo.cpp:628

llvm::TargetTransformInfo::haveFastSqrt
LLVM_ABI bool haveFastSqrt(Type *Ty) const
Return true if the hardware has a fast square-root instruction.
Definition TargetTransformInfo.cpp:709

llvm::TargetTransformInfo::shouldExpandReduction
LLVM_ABI bool shouldExpandReduction(const IntrinsicInst *II) const
Definition TargetTransformInfo.cpp:1447

llvm::TargetTransformInfo::getMaxMemIntrinsicInlineSizeThreshold
LLVM_ABI uint64_t getMaxMemIntrinsicInlineSizeThreshold() const
Returns the maximum memset / memcpy size in bytes that still makes it profitable to inline the call.
Definition TargetTransformInfo.cpp:1246

llvm::TargetTransformInfo::ShuffleKind
ShuffleKind
The various kinds of shuffle patterns for vector queries.
Definition TargetTransformInfo.h:1200

llvm::TargetTransformInfo::SK_InsertSubvector
@ SK_InsertSubvector
InsertSubvector. Index indicates start offset.
Definition TargetTransformInfo.h:1207

llvm::TargetTransformInfo::SK_Select
@ SK_Select
Selects elements from the corresponding lane of either source operand.
Definition TargetTransformInfo.h:1203

llvm::TargetTransformInfo::SK_PermuteSingleSrc
@ SK_PermuteSingleSrc
Shuffle elements of single source vector with any shuffle mask.
Definition TargetTransformInfo.h:1211

llvm::TargetTransformInfo::SK_Transpose
@ SK_Transpose
Transpose two vectors.
Definition TargetTransformInfo.h:1206

llvm::TargetTransformInfo::SK_Splice
@ SK_Splice
Concatenates elements from the first input vector with elements of the second input vector.
Definition TargetTransformInfo.h:1213

llvm::TargetTransformInfo::SK_Broadcast
@ SK_Broadcast
Broadcast element 0 to all other elements.
Definition TargetTransformInfo.h:1201

llvm::TargetTransformInfo::SK_PermuteTwoSrc
@ SK_PermuteTwoSrc
Merge elements from two source vectors into one with any shuffle mask.
Definition TargetTransformInfo.h:1209

llvm::TargetTransformInfo::SK_Reverse
@ SK_Reverse
Reverse the order of the vector.
Definition TargetTransformInfo.h:1202

llvm::TargetTransformInfo::SK_ExtractSubvector
@ SK_ExtractSubvector
ExtractSubvector. Index indicates start offset.
Definition TargetTransformInfo.h:1208

llvm::TargetTransformInfo::getFeatureMask
LLVM_ABI APInt getFeatureMask(const Function &F) const
Returns a bitmask constructed from the target-features or fmv-features metadata of a function corresp...
Definition TargetTransformInfo.cpp:1431

llvm::TargetTransformInfo::getPeelingPreferences
LLVM_ABI void getPeelingPreferences(Loop *L, ScalarEvolution &SE, PeelingPreferences &PP) const
Get target-customized preferences for the generic loop peeling transformation.
Definition TargetTransformInfo.cpp:407

llvm::TargetTransformInfo::getCallInstrCost
LLVM_ABI InstructionCost getCallInstrCost(Function *F, Type *RetTy, ArrayRef< Type * > Tys, TTI::TargetCostKind CostKind=TTI::TCK_SizeAndLatency) const
Definition TargetTransformInfo.cpp:1219

llvm::TargetTransformInfo::getCFInstrCost
LLVM_ABI InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind=TTI::TCK_SizeAndLatency, const Instruction *I=nullptr) const
Definition TargetTransformInfo.cpp:1093

llvm::TargetTransformInfo::CastContextHint
CastContextHint
Represents a hint about the context in which a cast is used.
Definition TargetTransformInfo.h:1505

llvm::TargetTransformInfo::CastContextHint::Reversed
@ Reversed
The cast is used with a reversed load/store.
Definition TargetTransformInfo.h:1511

llvm::TargetTransformInfo::CastContextHint::Masked
@ Masked
The cast is used with a masked load/store.
Definition TargetTransformInfo.h:1508

llvm::TargetTransformInfo::CastContextHint::None
@ None
The cast is not used with a load/store of any kind.
Definition TargetTransformInfo.h:1506

llvm::TargetTransformInfo::CastContextHint::Normal
@ Normal
The cast is used with a normal load/store.
Definition TargetTransformInfo.h:1507

llvm::TargetTransformInfo::CastContextHint::Interleave
@ Interleave
The cast is used with an interleaved load/store.
Definition TargetTransformInfo.h:1510

llvm::TargetTransformInfo::CastContextHint::GatherScatter
@ GatherScatter
The cast is used with a gather/scatter.
Definition TargetTransformInfo.h:1509

llvm::TargetTransformInfo::getExtractWithExtendCost
LLVM_ABI InstructionCost getExtractWithExtendCost(unsigned Opcode, Type *Dst, VectorType *VecTy, unsigned Index, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfo.cpp:1084

llvm::TargetTransformInfo::~TargetTransformInfo
LLVM_ABI ~TargetTransformInfo()

llvm::TargetTransformInfo::OperandValueKind
OperandValueKind
Additional information about an operand's possible values.
Definition TargetTransformInfo.h:1220

llvm::TargetTransformInfo::OK_UniformConstantValue
@ OK_UniformConstantValue
Definition TargetTransformInfo.h:1223

llvm::TargetTransformInfo::OK_UniformValue
@ OK_UniformValue
Definition TargetTransformInfo.h:1222

llvm::TargetTransformInfo::OK_AnyValue
@ OK_AnyValue
Definition TargetTransformInfo.h:1221

llvm::TargetTransformInfo::OK_NonUniformConstantValue
@ OK_NonUniformConstantValue
Definition TargetTransformInfo.h:1224

llvm::TargetTransformInfo::CacheLevel
CacheLevel
The possible cache levels.
Definition TargetTransformInfo.h:1343

llvm::TargetTransformInfo::CacheLevel::L1D
@ L1D
Definition TargetTransformInfo.h:1344

llvm::TargetTransformInfo::CacheLevel::L2D
@ L2D
Definition TargetTransformInfo.h:1345

llvm::TypeSize
Definition TypeSize.h:332

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45

llvm::User
Definition User.h:44

llvm::VPIntrinsic
This is the common base class for vector predication intrinsics.
Definition IntrinsicInst.h:566

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::VectorType
Base class of all SIMD vector types.
Definition DerivedTypes.h:430

uint64_t

uint8_t

Call
CallInst * Call
Definition ObjCARCOpts.cpp:2359

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition AMDGPUMetadata.h:396

llvm::CallingConv::ID
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
Definition CallingConv.h:24

llvm::CallingConv::Fast
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition CallingConv.h:41

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::Intrinsic
This namespace contains an enum with a value for every intrinsic/builtin function known by LLVM.
Definition GenericSSAContext.h:27

llvm::Intrinsic::ID
unsigned ID
Definition GenericSSAContext.h:28

llvm::NVPTXAS::AddressSpace
AddressSpace
Definition NVPTXAddrSpace.h:21

llvm::SI
Definition SIInstrInfo.h:1808

llvm::dwarf::Index
Index
Definition Dwarf.h:903

llvm::pdb::PDB_SymType::VectorType
@ VectorType
Definition PDBTypes.h:278

llvm::sampleprof::Base
@ Base
Definition Discriminator.h:58

llvm::sandboxir::Instruction
friend class Instruction
Iterator for Instructions in a `BasicBlock`.
Definition BasicBlock.h:73

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition AddressRanges.h:18

llvm::Length
@ Length
Definition DWP.cpp:532

llvm::Value
FunctionAddr VTableAddr Value
Definition InstrProf.h:137

llvm::None
@ None
Definition CodeGenData.h:107

llvm::Key
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
Definition PassManager.h:667

llvm::AtomicOrdering
AtomicOrdering
Atomic ordering for LLVM's memory model.
Definition AtomicOrdering.h:56

llvm::AtomicOrdering::Unordered
@ Unordered
Definition AtomicOrdering.h:58

llvm::AtomicOrdering::NotAtomic
@ NotAtomic
Definition AtomicOrdering.h:57

llvm::ModRefInfo::LLVM_MARK_AS_BITMASK_ENUM
@ LLVM_MARK_AS_BITMASK_ENUM
Definition ModRef.h:37

llvm::TTI
TargetTransformInfo TTI
Definition TargetTransformInfo.h:273

llvm::Data
FunctionAddr VTableAddr uintptr_t uintptr_t Data
Definition InstrProf.h:189

llvm::createTargetTransformInfoWrapperPass
LLVM_ABI ImmutablePass * createTargetTransformInfoWrapperPass(TargetIRAnalysis TIRA)
Create an analysis pass wrapper around a TTI object.
Definition TargetTransformInfo.cpp:1543

llvm::RecurKind
RecurKind
These are the kinds of recurrences that we support.
Definition IVDescriptors.h:34

llvm::ArrayRef
ArrayRef(const T &OneElt) -> ArrayRef< T >

llvm::BitWidth
constexpr unsigned BitWidth
Definition BitmaskEnum.h:219

llvm::move
OutputIt move(R &&Range, OutputIt Out)
Provide wrappers to std::move which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1879

llvm::TailFoldingStyle
TailFoldingStyle
Definition TargetTransformInfo.h:230

llvm::TailFoldingStyle::DataAndControlFlowWithoutRuntimeCheck
@ DataAndControlFlowWithoutRuntimeCheck
Use predicate to control both data and control flow, but modify the trip count so that a runtime over...
Definition TargetTransformInfo.h:257

llvm::TailFoldingStyle::DataWithEVL
@ DataWithEVL
Use predicated EVL instructions for tail-folding.
Definition TargetTransformInfo.h:260

llvm::TailFoldingStyle::DataAndControlFlow
@ DataAndControlFlow
Use predicate to control both data and control flow.
Definition TargetTransformInfo.h:253

llvm::TailFoldingStyle::DataWithoutLaneMask
@ DataWithoutLaneMask
Same as Data, but avoids using the get.active.lane.mask intrinsic to calculate the mask and instead i...
Definition TargetTransformInfo.h:247

llvm::FunctionAnalysisManager
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
Definition PassManager.h:563

llvm::VFParamKind::Vector
@ Vector
Definition VFABIDemangler.h:27

llvm::InstructionUniformity
InstructionUniformity
Enum describing how instructions behave with respect to uniformity and divergence,...
Definition Uniformity.h:18

std
Implement std::hash so that hash_code can be used in STL containers.
Definition BitVector.h:870

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39

llvm::AnalysisInfoMixin
A CRTP mix-in that provides informational APIs needed for analysis passes.
Definition PassManager.h:92

llvm::AnalysisKey
A special type used by analysis passes to provide an address that identifies that particular analysis...
Definition Analysis.h:29

llvm::HardwareLoopInfo
Attributes of a target dependent hardware loop.
Definition TargetTransformInfo.h:103

llvm::HardwareLoopInfo::L
Loop * L
Definition TargetTransformInfo.h:106

llvm::HardwareLoopInfo::ExitBranch
BranchInst * ExitBranch
Definition TargetTransformInfo.h:108

llvm::HardwareLoopInfo::ExitBlock
BasicBlock * ExitBlock
Definition TargetTransformInfo.h:107

llvm::HardwareLoopInfo::LoopDecrement
Value * LoopDecrement
Definition TargetTransformInfo.h:111

llvm::HardwareLoopInfo::canAnalyze
LLVM_ABI bool canAnalyze(LoopInfo &LI)
Definition TargetTransformInfo.cpp:65

llvm::HardwareLoopInfo::CounterInReg
bool CounterInReg
Definition TargetTransformInfo.h:115

llvm::HardwareLoopInfo::ExitCount
const SCEV * ExitCount
Definition TargetTransformInfo.h:109

llvm::HardwareLoopInfo::CountType
IntegerType * CountType
Definition TargetTransformInfo.h:110

llvm::HardwareLoopInfo::IsNestingLegal
bool IsNestingLegal
Definition TargetTransformInfo.h:113

llvm::HardwareLoopInfo::HardwareLoopInfo
HardwareLoopInfo()=delete

llvm::HardwareLoopInfo::PerformEntryTest
bool PerformEntryTest
Definition TargetTransformInfo.h:117

llvm::HardwareLoopInfo::isHardwareLoopCandidate
LLVM_ABI bool isHardwareLoopCandidate(ScalarEvolution &SE, LoopInfo &LI, DominatorTree &DT, bool ForceNestedLoop=false, bool ForceHardwareLoopPHI=false)
Definition TargetTransformInfo.cpp:127

llvm::KnownBits
Definition KnownBits.h:24

llvm::MemIntrinsicInfo
Information about a load/store intrinsic defined by the target.
Definition TargetTransformInfo.h:76

llvm::MemIntrinsicInfo::InterestingOperands
SmallVector< InterestingMemoryOperand, 1 > InterestingOperands
Definition TargetTransformInfo.h:93

llvm::MemIntrinsicInfo::MatchingId
unsigned short MatchingId
Definition TargetTransformInfo.h:87

llvm::MemIntrinsicInfo::ReadMem
bool ReadMem
Definition TargetTransformInfo.h:89

llvm::MemIntrinsicInfo::IsVolatile
bool IsVolatile
Definition TargetTransformInfo.h:91

llvm::MemIntrinsicInfo::WriteMem
bool WriteMem
Definition TargetTransformInfo.h:90

llvm::MemIntrinsicInfo::PtrVal
Value * PtrVal
This is the pointer that the intrinsic is loading from or storing to.
Definition TargetTransformInfo.h:81

llvm::MemIntrinsicInfo::Ordering
AtomicOrdering Ordering
Definition TargetTransformInfo.h:84

llvm::MemIntrinsicInfo::isUnordered
bool isUnordered() const
Definition TargetTransformInfo.h:95

llvm::TailFoldingInfo
Definition TargetTransformInfo.h:263

llvm::TailFoldingInfo::IAI
InterleavedAccessInfo * IAI
Definition TargetTransformInfo.h:266

llvm::TailFoldingInfo::TailFoldingInfo
TailFoldingInfo(TargetLibraryInfo *TLI, LoopVectorizationLegality *LVL, InterleavedAccessInfo *IAI)
Definition TargetTransformInfo.h:267

llvm::TailFoldingInfo::TLI
TargetLibraryInfo * TLI
Definition TargetTransformInfo.h:264

llvm::TailFoldingInfo::LVL
LoopVectorizationLegality * LVL
Definition TargetTransformInfo.h:265

llvm::TargetTransformInfo::LSRCost
Definition TargetTransformInfo.h:593

llvm::TargetTransformInfo::LSRCost::NumIVMuls
unsigned NumIVMuls
Definition TargetTransformInfo.h:599

llvm::TargetTransformInfo::LSRCost::ScaleCost
unsigned ScaleCost
Definition TargetTransformInfo.h:603

llvm::TargetTransformInfo::LSRCost::Insns
unsigned Insns
TODO: Some of these could be merged.
Definition TargetTransformInfo.h:596

llvm::TargetTransformInfo::LSRCost::ImmCost
unsigned ImmCost
Definition TargetTransformInfo.h:601

llvm::TargetTransformInfo::LSRCost::AddRecCost
unsigned AddRecCost
Definition TargetTransformInfo.h:598

llvm::TargetTransformInfo::LSRCost::NumRegs
unsigned NumRegs
Definition TargetTransformInfo.h:597

llvm::TargetTransformInfo::LSRCost::NumBaseAdds
unsigned NumBaseAdds
Definition TargetTransformInfo.h:600

llvm::TargetTransformInfo::LSRCost::SetupCost
unsigned SetupCost
Definition TargetTransformInfo.h:602

llvm::TargetTransformInfo::MemCmpExpansionOptions
Returns options for expansion of memcmp. IsZeroCmp is true if this is the expansion of memcmp(p1, p2, s) == 0.
Definition TargetTransformInfo.h:1062

llvm::TargetTransformInfo::MemCmpExpansionOptions::LoadSizes
SmallVector< unsigned, 8 > LoadSizes
Definition TargetTransformInfo.h:1070

llvm::TargetTransformInfo::MemCmpExpansionOptions::NumLoadsPerBlock
unsigned NumLoadsPerBlock
Definition TargetTransformInfo.h:1080

llvm::TargetTransformInfo::MemCmpExpansionOptions::AllowOverlappingLoads
bool AllowOverlappingLoads
Definition TargetTransformInfo.h:1085

llvm::TargetTransformInfo::MemCmpExpansionOptions::MaxNumLoads
unsigned MaxNumLoads
Definition TargetTransformInfo.h:1067

llvm::TargetTransformInfo::MemCmpExpansionOptions::AllowedTailExpansions
SmallVector< unsigned, 4 > AllowedTailExpansions
Definition TargetTransformInfo.h:1096

llvm::TargetTransformInfo::OperandValueInfo
Definition TargetTransformInfo.h:1237

llvm::TargetTransformInfo::OperandValueInfo::isConstant
bool isConstant() const
Definition TargetTransformInfo.h:1241

llvm::TargetTransformInfo::OperandValueInfo::isNegatedPowerOf2
bool isNegatedPowerOf2() const
Definition TargetTransformInfo.h:1250

llvm::TargetTransformInfo::OperandValueInfo::Kind
OperandValueKind Kind
Definition TargetTransformInfo.h:1238

llvm::TargetTransformInfo::OperandValueInfo::getNoProps
OperandValueInfo getNoProps() const
Definition TargetTransformInfo.h:1254

llvm::TargetTransformInfo::OperandValueInfo::isPowerOf2
bool isPowerOf2() const
Definition TargetTransformInfo.h:1247

llvm::TargetTransformInfo::OperandValueInfo::isUniform
bool isUniform() const
Definition TargetTransformInfo.h:1244

llvm::TargetTransformInfo::OperandValueInfo::Properties
OperandValueProperties Properties
Definition TargetTransformInfo.h:1239

llvm::TargetTransformInfo::PeelingPreferences
Definition TargetTransformInfo.h:737

llvm::TargetTransformInfo::PeelingPreferences::AllowPeeling
bool AllowPeeling
Allow peeling off loop iterations.
Definition TargetTransformInfo.h:743

llvm::TargetTransformInfo::PeelingPreferences::AllowLoopNestsPeeling
bool AllowLoopNestsPeeling
Allow peeling off loop iterations for loop nests.
Definition TargetTransformInfo.h:745

llvm::TargetTransformInfo::PeelingPreferences::PeelLast
bool PeelLast
Peel off the last PeelCount loop iterations.
Definition TargetTransformInfo.h:753

llvm::TargetTransformInfo::PeelingPreferences::PeelProfiledIterations
bool PeelProfiledIterations
Allow peeling based on profile.
Definition TargetTransformInfo.h:750

llvm::TargetTransformInfo::PeelingPreferences::PeelCount
unsigned PeelCount
A forced peeling factor (the number of bodies of the original loop that should be peeled off before t...
Definition TargetTransformInfo.h:741

llvm::TargetTransformInfo::PointersChainInfo
Describe known properties for a set of pointers.
Definition TargetTransformInfo.h:381

llvm::TargetTransformInfo::PointersChainInfo::IsKnownStride
unsigned IsKnownStride
True if distance between any two neighbouring pointers is a known value.
Definition TargetTransformInfo.h:388

llvm::TargetTransformInfo::PointersChainInfo::getKnownStride
static PointersChainInfo getKnownStride()
Definition TargetTransformInfo.h:399

llvm::TargetTransformInfo::PointersChainInfo::isUnitStride
bool isUnitStride() const
Definition TargetTransformInfo.h:392

llvm::TargetTransformInfo::PointersChainInfo::Reserved
unsigned Reserved
Definition TargetTransformInfo.h:389

llvm::TargetTransformInfo::PointersChainInfo::isSameBase
bool isSameBase() const
Definition TargetTransformInfo.h:391

llvm::TargetTransformInfo::PointersChainInfo::IsUnitStride
unsigned IsUnitStride
These properties are only valid if IsSameBaseAddress is set.
Definition TargetTransformInfo.h:386

llvm::TargetTransformInfo::PointersChainInfo::isKnownStride
bool isKnownStride() const
Definition TargetTransformInfo.h:393

llvm::TargetTransformInfo::PointersChainInfo::IsSameBaseAddress
unsigned IsSameBaseAddress
All the GEPs in a set have same base address.
Definition TargetTransformInfo.h:383

llvm::TargetTransformInfo::PointersChainInfo::getUnitStride
static PointersChainInfo getUnitStride()
Definition TargetTransformInfo.h:395

llvm::TargetTransformInfo::PointersChainInfo::getUnknownStride
static PointersChainInfo getUnknownStride()
Definition TargetTransformInfo.h:403

llvm::TargetTransformInfo::UnrollingPreferences
Parameters that control the generic loop unrolling transformation.
Definition TargetTransformInfo.h:607

llvm::TargetTransformInfo::UnrollingPreferences::MaxCount
unsigned MaxCount
Definition TargetTransformInfo.h:648

llvm::TargetTransformInfo::UnrollingPreferences::Count
unsigned Count
A forced unrolling factor (the number of concatenated bodies of the original loop in the unrolled loo...
Definition TargetTransformInfo.h:641

llvm::TargetTransformInfo::UnrollingPreferences::UpperBound
bool UpperBound
Allow using trip count upper bound to unroll loops.
Definition TargetTransformInfo.h:678

llvm::TargetTransformInfo::UnrollingPreferences::Threshold
unsigned Threshold
The cost threshold for the unrolled loop.
Definition TargetTransformInfo.h:615

llvm::TargetTransformInfo::UnrollingPreferences::Force
bool Force
Apply loop unroll on any kind of loop (mainly to loops that fail runtime unrolling).
Definition TargetTransformInfo.h:676

llvm::TargetTransformInfo::UnrollingPreferences::PartialOptSizeThreshold
unsigned PartialOptSizeThreshold
The cost threshold for the unrolled loop when optimizing for size, like OptSizeThreshold,...
Definition TargetTransformInfo.h:636

llvm::TargetTransformInfo::UnrollingPreferences::UnrollVectorizedLoop
bool UnrollVectorizedLoop
Don't disable runtime unroll for the loops which were vectorized.
Definition TargetTransformInfo.h:692

llvm::TargetTransformInfo::UnrollingPreferences::DefaultUnrollRuntimeCount
unsigned DefaultUnrollRuntimeCount
Default unroll count for loops with run-time trip count.
Definition TargetTransformInfo.h:643

llvm::TargetTransformInfo::UnrollingPreferences::MaxPercentThresholdBoost
unsigned MaxPercentThresholdBoost
If complete unrolling will reduce the cost of the loop, we will boost the Threshold by a certain perc...
Definition TargetTransformInfo.h:626

llvm::TargetTransformInfo::UnrollingPreferences::RuntimeUnrollMultiExit
bool RuntimeUnrollMultiExit
Allow runtime unrolling multi-exit loops.
Definition TargetTransformInfo.h:700

llvm::TargetTransformInfo::UnrollingPreferences::SCEVExpansionBudget
unsigned SCEVExpansionBudget
Don't allow runtime unrolling if expanding the trip count takes more than SCEVExpansionBudget.
Definition TargetTransformInfo.h:695

llvm::TargetTransformInfo::UnrollingPreferences::AddAdditionalAccumulators
bool AddAdditionalAccumulators
Allow unrolling to add parallel reduction phis.
Definition TargetTransformInfo.h:702

llvm::TargetTransformInfo::UnrollingPreferences::UnrollAndJamInnerLoopThreshold
unsigned UnrollAndJamInnerLoopThreshold
Threshold for unroll and jam, for inner loop size.
Definition TargetTransformInfo.h:687

llvm::TargetTransformInfo::UnrollingPreferences::MaxIterationsCountToAnalyze
unsigned MaxIterationsCountToAnalyze
Don't allow loop unrolling to simulate more than this number of iterations when checking full unroll ...
Definition TargetTransformInfo.h:690

llvm::TargetTransformInfo::UnrollingPreferences::AllowRemainder
bool AllowRemainder
Allow generation of a loop remainder (extra iterations after unroll).
Definition TargetTransformInfo.h:670

llvm::TargetTransformInfo::UnrollingPreferences::UnrollAndJam
bool UnrollAndJam
Allow unroll and jam. Used to enable unroll and jam for the target.
Definition TargetTransformInfo.h:682

llvm::TargetTransformInfo::UnrollingPreferences::UnrollRemainder
bool UnrollRemainder
Allow unrolling of all the iterations of the runtime loop remainder.
Definition TargetTransformInfo.h:680

llvm::TargetTransformInfo::UnrollingPreferences::FullUnrollMaxCount
unsigned FullUnrollMaxCount
Set the maximum unrolling factor for full unrolling.
Definition TargetTransformInfo.h:656

llvm::TargetTransformInfo::UnrollingPreferences::BEInsns
unsigned BEInsns
Definition TargetTransformInfo.h:661

llvm::TargetTransformInfo::UnrollingPreferences::PartialThreshold
unsigned PartialThreshold
The cost threshold for the unrolled loop, like Threshold, but used for partial/runtime unrolling (set...
Definition TargetTransformInfo.h:632

llvm::TargetTransformInfo::UnrollingPreferences::Runtime
bool Runtime
Allow runtime unrolling (unrolling of loops to expand the size of the loop body even when the number ...
Definition TargetTransformInfo.h:668

llvm::TargetTransformInfo::UnrollingPreferences::Partial
bool Partial
Allow partial unrolling (unrolling of loops to expand the size of the loop body, not only to eliminat...
Definition TargetTransformInfo.h:664

llvm::TargetTransformInfo::UnrollingPreferences::OptSizeThreshold
unsigned OptSizeThreshold
The cost threshold for the unrolled loop when optimizing for size (set to UINT_MAX to disable).
Definition TargetTransformInfo.h:629

llvm::TargetTransformInfo::UnrollingPreferences::AllowExpensiveTripCount
bool AllowExpensiveTripCount
Allow emitting expensive instructions (such as divisions) when computing the trip count of a loop for...
Definition TargetTransformInfo.h:673

llvm::TargetTransformInfo::UnrollingPreferences::MaxUpperBound
unsigned MaxUpperBound
Set the maximum upper bound of trip count.
Definition TargetTransformInfo.h:652

llvm::TargetTransformInfo::VPLegalization::OpStrategy
VPTransform OpStrategy
Definition TargetTransformInfo.h:1950

llvm::TargetTransformInfo::VPLegalization::shouldDoNothing
bool shouldDoNothing() const
Definition TargetTransformInfo.h:1952

llvm::TargetTransformInfo::VPLegalization::EVLParamStrategy
VPTransform EVLParamStrategy
Definition TargetTransformInfo.h:1944

llvm::TargetTransformInfo::VPLegalization::VPTransform
VPTransform
Definition TargetTransformInfo.h:1931

llvm::TargetTransformInfo::VPLegalization::Convert
@ Convert
Definition TargetTransformInfo.h:1937

llvm::TargetTransformInfo::VPLegalization::Legal
@ Legal
Definition TargetTransformInfo.h:1933

llvm::TargetTransformInfo::VPLegalization::Discard
@ Discard
Definition TargetTransformInfo.h:1935

llvm::TargetTransformInfo::VPLegalization::VPLegalization
VPLegalization(VPTransform EVLParamStrategy, VPTransform OpStrategy)
Definition TargetTransformInfo.h:1955