doxygen/AArch64TargetTransformInfo_8h_source.html

//===- AArch64TargetTransformInfo.h - AArch64 specific TTI ------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

/// \file

/// This file a TargetTransformInfo::Concept conforming object specific to the

/// AArch64 target machine. It uses the target's detailed information to

/// provide more precise answers to certain TTI queries, while letting the

/// target independent and default TTI implementations handle the rest.

///

//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_AARCH64_AARCH64TARGETTRANSFORMINFO_H

#define LLVM_LIB_TARGET_AARCH64_AARCH64TARGETTRANSFORMINFO_H


#include "AArch64.h"

#include "AArch64Subtarget.h"

#include "AArch64TargetMachine.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/CodeGen/BasicTTIImpl.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/Intrinsics.h"

#include <cstdint>

#include <optional>


namespace llvm {


class APInt;

class Instruction;

class IntrinsicInst;

class Loop;

class SCEV;

class ScalarEvolution;

class Type;

class Value;

class VectorType;


class AArch64TTIImpl : public BasicTTIImplBase<AArch64TTIImpl> {

  using BaseT = BasicTTIImplBase<AArch64TTIImpl>;

  using TTI = TargetTransformInfo;


  friend BaseT;


  const AArch64Subtarget *ST;

  const AArch64TargetLowering *TLI;


  const AArch64Subtarget *getST() const { return ST; }

  const AArch64TargetLowering *getTLI() const { return TLI; }


  enum MemIntrinsicType {

    VECTOR_LDST_TWO_ELEMENTS,

    VECTOR_LDST_THREE_ELEMENTS,

    VECTOR_LDST_FOUR_ELEMENTS

  };


  bool isWideningInstruction(Type *DstTy, unsigned Opcode,

                             ArrayRef<const Value *> Args,

                             Type *SrcOverrideTy = nullptr);


  // A helper function called by 'getVectorInstrCost'.

  //

  // 'Val' and 'Index' are forwarded from 'getVectorInstrCost'; 'HasRealUse'

  // indicates whether the vector instruction is available in the input IR or

  // just imaginary in vectorizer passes.

  InstructionCost getVectorInstrCostHelper(const Instruction *I, Type *Val,

                                           unsigned Index, bool HasRealUse);


public:

  explicit AArch64TTIImpl(const AArch64TargetMachine *TM, const Function &F)

      : BaseT(TM, F.getDataLayout()), ST(TM->getSubtargetImpl(F)),

        TLI(ST->getTargetLowering()) {}


  bool areInlineCompatible(const Function *Caller,

                           const Function *Callee) const;


  bool areTypesABICompatible(const Function *Caller, const Function *Callee,

                             const ArrayRef<Type *> &Types) const;


  unsigned getInlineCallPenalty(const Function *F, const CallBase &Call,

                                unsigned DefaultCallPenalty) const;


  /// \name Scalar TTI Implementations

  /// @{


  using BaseT::getIntImmCost;

  InstructionCost getIntImmCost(int64_t Val);

  InstructionCost getIntImmCost(const APInt &Imm, Type *Ty,

                                TTI::TargetCostKind CostKind);

  InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx,

                                    const APInt &Imm, Type *Ty,

                                    TTI::TargetCostKind CostKind,

                                    Instruction *Inst = nullptr);

  InstructionCost getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx,

                                      const APInt &Imm, Type *Ty,

                                      TTI::TargetCostKind CostKind);

  TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth);


  /// @}


  /// \name Vector TTI Implementations

  /// @{


  bool enableInterleavedAccessVectorization() { return true; }


  bool enableMaskedInterleavedAccessVectorization() { return ST->hasSVE(); }


  unsigned getNumberOfRegisters(unsigned ClassID) const {

    bool Vector = (ClassID == 1);

    if (Vector) {

      if (ST->hasNEON())

        return 32;

      return 0;

    }

    return 31;

  }


  InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA,

                                        TTI::TargetCostKind CostKind);


  std::optional<Instruction *> instCombineIntrinsic(InstCombiner &IC,

                                                    IntrinsicInst &II) const;


  std::optional<Value *> simplifyDemandedVectorEltsIntrinsic(

      InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts,

      APInt &UndefElts2, APInt &UndefElts3,

      std::function<void(Instruction *, unsigned, APInt, APInt &)>

          SimplifyAndSetOp) const;


  TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const;


  unsigned getMinVectorRegisterBitWidth() const {

    return ST->getMinVectorRegisterBitWidth();

  }


  std::optional<unsigned> getVScaleForTuning() const {

    return ST->getVScaleForTuning();

  }


  bool isVScaleKnownToBeAPowerOfTwo() const { return true; }


  bool shouldMaximizeVectorBandwidth(TargetTransformInfo::RegisterKind K) const;


  /// Try to return an estimate cost factor that can be used as a multiplier

  /// when scalarizing an operation for a vector with ElementCount \p VF.

  /// For scalable vectors this currently takes the most pessimistic view based

  /// upon the maximum possible value for vscale.

  unsigned getMaxNumElements(ElementCount VF) const {

    if (!VF.isScalable())

      return VF.getFixedValue();


    return VF.getKnownMinValue() * ST->getVScaleForTuning();

  }


  unsigned getMaxInterleaveFactor(ElementCount VF);


  bool prefersVectorizedAddressing() const;


  InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *Src,

                                        Align Alignment, unsigned AddressSpace,

                                        TTI::TargetCostKind CostKind);


  InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy,

                                         const Value *Ptr, bool VariableMask,

                                         Align Alignment,

                                         TTI::TargetCostKind CostKind,

                                         const Instruction *I = nullptr);


  bool isExtPartOfAvgExpr(const Instruction *ExtUser, Type *Dst, Type *Src);


  InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src,

                                   TTI::CastContextHint CCH,

                                   TTI::TargetCostKind CostKind,

                                   const Instruction *I = nullptr);


  InstructionCost getExtractWithExtendCost(unsigned Opcode, Type *Dst,

                                           VectorType *VecTy, unsigned Index);


  InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind,

                                 const Instruction *I = nullptr);


  InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val,

                                     TTI::TargetCostKind CostKind,

                                     unsigned Index, Value *Op0, Value *Op1);

  InstructionCost getVectorInstrCost(const Instruction &I, Type *Val,

                                     TTI::TargetCostKind CostKind,

                                     unsigned Index);


  InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *Ty,

                                         FastMathFlags FMF,

                                         TTI::TargetCostKind CostKind);


  InstructionCost getArithmeticReductionCostSVE(unsigned Opcode,

                                                VectorType *ValTy,

                                                TTI::TargetCostKind CostKind);


  InstructionCost getSpliceCost(VectorType *Tp, int Index);


  InstructionCost getArithmeticInstrCost(

      unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,

      TTI::OperandValueInfo Op1Info = {TTI::OK_AnyValue, TTI::OP_None},

      TTI::OperandValueInfo Op2Info = {TTI::OK_AnyValue, TTI::OP_None},

      ArrayRef<const Value *> Args = std::nullopt,

      const Instruction *CxtI = nullptr);


  InstructionCost getAddressComputationCost(Type *Ty, ScalarEvolution *SE,

                                            const SCEV *Ptr);


  InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy,

                                     CmpInst::Predicate VecPred,

                                     TTI::TargetCostKind CostKind,

                                     const Instruction *I = nullptr);


  TTI::MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize,

                                                    bool IsZeroCmp) const;

  bool useNeonVector(const Type *Ty) const;


  InstructionCost

  getMemoryOpCost(unsigned Opcode, Type *Src, MaybeAlign Alignment,

                  unsigned AddressSpace, TTI::TargetCostKind CostKind,

                  TTI::OperandValueInfo OpInfo = {TTI::OK_AnyValue, TTI::OP_None},

                  const Instruction *I = nullptr);


  InstructionCost getCostOfKeepingLiveOverCall(ArrayRef<Type *> Tys);


  void getUnrollingPreferences(Loop *L, ScalarEvolution &SE,

                               TTI::UnrollingPreferences &UP,

                               OptimizationRemarkEmitter *ORE);


  void getPeelingPreferences(Loop *L, ScalarEvolution &SE,

                             TTI::PeelingPreferences &PP);


  Value *getOrCreateResultFromMemIntrinsic(IntrinsicInst *Inst,

                                           Type *ExpectedType);


  bool getTgtMemIntrinsic(IntrinsicInst *Inst, MemIntrinsicInfo &Info);


  bool isElementTypeLegalForScalableVector(Type *Ty) const {

    if (Ty->isPointerTy())

      return true;


    if (Ty->isBFloatTy() && ST->hasBF16())

      return true;


    if (Ty->isHalfTy() || Ty->isFloatTy() || Ty->isDoubleTy())

      return true;


    if (Ty->isIntegerTy(1) || Ty->isIntegerTy(8) || Ty->isIntegerTy(16) ||

        Ty->isIntegerTy(32) || Ty->isIntegerTy(64))

      return true;


    return false;

  }


  bool isLegalMaskedLoadStore(Type *DataType, Align Alignment) {

    if (!ST->hasSVE())

      return false;


    // For fixed vectors, avoid scalarization if using SVE for them.

    if (isa<FixedVectorType>(DataType) && !ST->useSVEForFixedLengthVectors() &&

        DataType->getPrimitiveSizeInBits() != 128)

      return false; // Fall back to scalarization of masked operations.


    return isElementTypeLegalForScalableVector(DataType->getScalarType());

  }


  bool isLegalMaskedLoad(Type *DataType, Align Alignment) {

    return isLegalMaskedLoadStore(DataType, Alignment);

  }


  bool isLegalMaskedStore(Type *DataType, Align Alignment) {

    return isLegalMaskedLoadStore(DataType, Alignment);

  }


  bool isLegalMaskedGatherScatter(Type *DataType) const {

    if (!ST->isSVEAvailable())

      return false;


    // For fixed vectors, scalarize if not using SVE for them.

    auto *DataTypeFVTy = dyn_cast<FixedVectorType>(DataType);

    if (DataTypeFVTy && (!ST->useSVEForFixedLengthVectors() ||

                         DataTypeFVTy->getNumElements() < 2))

      return false;


    return isElementTypeLegalForScalableVector(DataType->getScalarType());

  }


  bool isLegalMaskedGather(Type *DataType, Align Alignment) const {

    return isLegalMaskedGatherScatter(DataType);

  }


  bool isLegalMaskedScatter(Type *DataType, Align Alignment) const {

    return isLegalMaskedGatherScatter(DataType);

  }


  bool isLegalBroadcastLoad(Type *ElementTy, ElementCount NumElements) const {

    // Return true if we can generate a `ld1r` splat load instruction.

    if (!ST->hasNEON() || NumElements.isScalable())

      return false;

    switch (unsigned ElementBits = ElementTy->getScalarSizeInBits()) {

    case 8:

    case 16:

    case 32:

    case 64: {

      // We accept bit-widths >= 64bits and elements {8,16,32,64} bits.

      unsigned VectorBits = NumElements.getFixedValue() * ElementBits;

      return VectorBits >= 64;

    }

    }

    return false;

  }


  bool isLegalNTStoreLoad(Type *DataType, Align Alignment) {

    // NOTE: The logic below is mostly geared towards LV, which calls it with

    //       vectors with 2 elements. We might want to improve that, if other

    //       users show up.

    // Nontemporal vector loads/stores can be directly lowered to LDNP/STNP, if

    // the vector can be halved so that each half fits into a register. That's

    // the case if the element type fits into a register and the number of

    // elements is a power of 2 > 1.

    if (auto *DataTypeTy = dyn_cast<FixedVectorType>(DataType)) {

      unsigned NumElements = DataTypeTy->getNumElements();

      unsigned EltSize = DataTypeTy->getElementType()->getScalarSizeInBits();

      return NumElements > 1 && isPowerOf2_64(NumElements) && EltSize >= 8 &&

             EltSize <= 128 && isPowerOf2_64(EltSize);

    }

    return BaseT::isLegalNTStore(DataType, Alignment);

  }


  bool isLegalNTStore(Type *DataType, Align Alignment) {

    return isLegalNTStoreLoad(DataType, Alignment);

  }


  bool isLegalNTLoad(Type *DataType, Align Alignment) {

    // Only supports little-endian targets.

    if (ST->isLittleEndian())

      return isLegalNTStoreLoad(DataType, Alignment);

    return BaseT::isLegalNTLoad(DataType, Alignment);

  }


  bool enableOrderedReductions() const { return true; }


  InstructionCost getInterleavedMemoryOpCost(

      unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,

      Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,

      bool UseMaskForCond = false, bool UseMaskForGaps = false);


  bool

  shouldConsiderAddressTypePromotion(const Instruction &I,

                                     bool &AllowPromotionWithoutCommonHeader);


  bool shouldExpandReduction(const IntrinsicInst *II) const { return false; }


  unsigned getGISelRematGlobalCost() const {

    return 2;

  }


  unsigned getMinTripCountTailFoldingThreshold() const {

    return ST->hasSVE() ? 5 : 0;

  }


  TailFoldingStyle getPreferredTailFoldingStyle(bool IVUpdateMayOverflow) const {

    if (ST->hasSVE())

      return IVUpdateMayOverflow

                 ? TailFoldingStyle::DataAndControlFlowWithoutRuntimeCheck

                 : TailFoldingStyle::DataAndControlFlow;


    return TailFoldingStyle::DataWithoutLaneMask;

  }


  bool preferFixedOverScalableIfEqualCost() const {

    return ST->useFixedOverScalableIfEqualCost();

  }


  bool preferPredicateOverEpilogue(TailFoldingInfo *TFI);


  bool supportsScalableVectors() const {

    return ST->isSVEorStreamingSVEAvailable();

  }


  bool enableScalableVectorization() const;


  bool isLegalToVectorizeReduction(const RecurrenceDescriptor &RdxDesc,

                                   ElementCount VF) const;


  bool preferPredicatedReductionSelect(unsigned Opcode, Type *Ty,

                                       TTI::ReductionFlags Flags) const {

    return ST->hasSVE();

  }


  InstructionCost getArithmeticReductionCost(unsigned Opcode, VectorType *Ty,

                                             std::optional<FastMathFlags> FMF,

                                             TTI::TargetCostKind CostKind);


  InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *Tp,

                                 ArrayRef<int> Mask,

                                 TTI::TargetCostKind CostKind, int Index,

                                 VectorType *SubTp,

                                 ArrayRef<const Value *> Args = std::nullopt,

                                 const Instruction *CxtI = nullptr);


  InstructionCost getScalarizationOverhead(VectorType *Ty,

                                           const APInt &DemandedElts,

                                           bool Insert, bool Extract,

                                           TTI::TargetCostKind CostKind);


  /// Return the cost of the scaling factor used in the addressing

  /// mode represented by AM for this target, for a load/store

  /// of the specified type.

  /// If the AM is supported, the return value must be >= 0.

  /// If the AM is not supported, it returns a negative value.

  InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV,

                                       StackOffset BaseOffset, bool HasBaseReg,

                                       int64_t Scale, unsigned AddrSpace) const;

  /// @}


  bool enableSelectOptimize() { return ST->enableSelectOptimize(); }


  bool shouldTreatInstructionLikeSelect(const Instruction *I);


  unsigned getStoreMinimumVF(unsigned VF, Type *ScalarMemTy,

                             Type *ScalarValTy) const {

    // We can vectorize store v4i8.

    if (ScalarMemTy->isIntegerTy(8) && isPowerOf2_32(VF) && VF >= 4)

      return 4;


    return BaseT::getStoreMinimumVF(VF, ScalarMemTy, ScalarValTy);

  }


  std::optional<unsigned> getMinPageSize() const { return 4096; }


  bool isLSRCostLess(const TargetTransformInfo::LSRCost &C1,

                     const TargetTransformInfo::LSRCost &C2);

};


} // end namespace llvm


#endif // LLVM_LIB_TARGET_AARCH64_AARCH64TARGETTRANSFORMINFO_H

AArch64Subtarget.h

AArch64TargetMachine.h

AArch64.h

ArrayRef.h

BasicTTIImpl.h
This file provides a helper that implements much of the TTI interface in terms of the target-independ...

Type
RelocType Type
Definition: COFFYAML.cpp:391

Info
Analysis containing CSE Info
Definition: CSEInfo.cpp:27

CostKind
static cl::opt< TargetTransformInfo::TargetCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(TargetTransformInfo::TCK_RecipThroughput), cl::values(clEnumValN(TargetTransformInfo::TCK_RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(TargetTransformInfo::TCK_Latency, "latency", "Instruction latency"), clEnumValN(TargetTransformInfo::TCK_CodeSize, "code-size", "Code size"), clEnumValN(TargetTransformInfo::TCK_SizeAndLatency, "size-latency", "Code size and latency")))

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:352

Function.h

Intrinsics.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

II
uint64_t IntrinsicInst * II
Definition: NVVMIntrRange.cpp:52

TM
const char LLVMTargetMachineRef TM
Definition: PassBuilderBindings.cpp:52

Ptr
@ Ptr
Definition: TargetLibraryInfo.cpp:77

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

VectorType
Definition: ItaniumDemangle.h:1149

llvm::AArch64Subtarget
Definition: AArch64Subtarget.h:38

llvm::AArch64TTIImpl
Definition: AArch64TargetTransformInfo.h:42

llvm::AArch64TTIImpl::getSpliceCost
InstructionCost getSpliceCost(VectorType *Tp, int Index)
Definition: AArch64TargetTransformInfo.cpp:4055

llvm::AArch64TTIImpl::getCastInstrCost
InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: AArch64TargetTransformInfo.cpp:2540

llvm::AArch64TTIImpl::getIntImmCostInst
InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx, const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind, Instruction *Inst=nullptr)
Definition: AArch64TargetTransformInfo.cpp:383

llvm::AArch64TTIImpl::getScalingFactorCost
InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV, StackOffset BaseOffset, bool HasBaseReg, int64_t Scale, unsigned AddrSpace) const
Return the cost of the scaling factor used in the addressing mode represented by AM for this target,...
Definition: AArch64TargetTransformInfo.cpp:4454

llvm::AArch64TTIImpl::getMaskedMemoryOpCost
InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind)
Definition: AArch64TargetTransformInfo.cpp:3407

llvm::AArch64TTIImpl::supportsScalableVectors
bool supportsScalableVectors() const
Definition: AArch64TargetTransformInfo.h:380

llvm::AArch64TTIImpl::getMinTripCountTailFoldingThreshold
unsigned getMinTripCountTailFoldingThreshold() const
Definition: AArch64TargetTransformInfo.h:361

llvm::AArch64TTIImpl::isLegalNTStoreLoad
bool isLegalNTStoreLoad(Type *DataType, Align Alignment)
Definition: AArch64TargetTransformInfo.h:316

llvm::AArch64TTIImpl::getGISelRematGlobalCost
unsigned getGISelRematGlobalCost() const
Definition: AArch64TargetTransformInfo.h:357

llvm::AArch64TTIImpl::shouldTreatInstructionLikeSelect
bool shouldTreatInstructionLikeSelect(const Instruction *I)
Definition: AArch64TargetTransformInfo.cpp:4477

llvm::AArch64TTIImpl::enableMaskedInterleavedAccessVectorization
bool enableMaskedInterleavedAccessVectorization()
Definition: AArch64TargetTransformInfo.h:109

llvm::AArch64TTIImpl::preferPredicatedReductionSelect
bool preferPredicatedReductionSelect(unsigned Opcode, Type *Ty, TTI::ReductionFlags Flags) const
Definition: AArch64TargetTransformInfo.h:389

llvm::AArch64TTIImpl::getVScaleForTuning
std::optional< unsigned > getVScaleForTuning() const
Definition: AArch64TargetTransformInfo.h:139

llvm::AArch64TTIImpl::getAddressComputationCost
InstructionCost getAddressComputationCost(Type *Ty, ScalarEvolution *SE, const SCEV *Ptr)
Definition: AArch64TargetTransformInfo.cpp:3274

llvm::AArch64TTIImpl::preferFixedOverScalableIfEqualCost
bool preferFixedOverScalableIfEqualCost() const
Definition: AArch64TargetTransformInfo.h:374

llvm::AArch64TTIImpl::prefersVectorizedAddressing
bool prefersVectorizedAddressing() const
Definition: AArch64TargetTransformInfo.cpp:3402

llvm::AArch64TTIImpl::getIntrinsicInstrCost
InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA, TTI::TargetCostKind CostKind)
Definition: AArch64TargetTransformInfo.cpp:542

llvm::AArch64TTIImpl::getArithmeticReductionCost
InstructionCost getArithmeticReductionCost(unsigned Opcode, VectorType *Ty, std::optional< FastMathFlags > FMF, TTI::TargetCostKind CostKind)
Definition: AArch64TargetTransformInfo.cpp:3946

llvm::AArch64TTIImpl::getExtractWithExtendCost
InstructionCost getExtractWithExtendCost(unsigned Opcode, Type *Dst, VectorType *VecTy, unsigned Index)
Definition: AArch64TargetTransformInfo.cpp:2941

llvm::AArch64TTIImpl::isLegalMaskedStore
bool isLegalMaskedStore(Type *DataType, Align Alignment)
Definition: AArch64TargetTransformInfo.h:274

llvm::AArch64TTIImpl::getInlineCallPenalty
unsigned getInlineCallPenalty(const Function *F, const CallBase &Call, unsigned DefaultCallPenalty) const
Definition: AArch64TargetTransformInfo.cpp:300

llvm::AArch64TTIImpl::isLegalToVectorizeReduction
bool isLegalToVectorizeReduction(const RecurrenceDescriptor &RdxDesc, ElementCount VF) const
Definition: AArch64TargetTransformInfo.cpp:3863

llvm::AArch64TTIImpl::getOrCreateResultFromMemIntrinsic
Value * getOrCreateResultFromMemIntrinsic(IntrinsicInst *Inst, Type *ExpectedType)
Definition: AArch64TargetTransformInfo.cpp:3755

llvm::AArch64TTIImpl::enableOrderedReductions
bool enableOrderedReductions() const
Definition: AArch64TargetTransformInfo.h:344

llvm::AArch64TTIImpl::isLegalBroadcastLoad
bool isLegalBroadcastLoad(Type *ElementTy, ElementCount NumElements) const
Definition: AArch64TargetTransformInfo.h:299

llvm::AArch64TTIImpl::shouldConsiderAddressTypePromotion
bool shouldConsiderAddressTypePromotion(const Instruction &I, bool &AllowPromotionWithoutCommonHeader)
See if I should be considered for address type promotion.
Definition: AArch64TargetTransformInfo.cpp:3836

llvm::AArch64TTIImpl::getArithmeticReductionCostSVE
InstructionCost getArithmeticReductionCostSVE(unsigned Opcode, VectorType *ValTy, TTI::TargetCostKind CostKind)
Definition: AArch64TargetTransformInfo.cpp:3920

llvm::AArch64TTIImpl::getMinPageSize
std::optional< unsigned > getMinPageSize() const
Definition: AArch64TargetTransformInfo.h:433

llvm::AArch64TTIImpl::getInterleavedMemoryOpCost
InstructionCost getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond=false, bool UseMaskForGaps=false)
Definition: AArch64TargetTransformInfo.cpp:3588

llvm::AArch64TTIImpl::shouldExpandReduction
bool shouldExpandReduction(const IntrinsicInst *II) const
Definition: AArch64TargetTransformInfo.h:355

llvm::AArch64TTIImpl::getScalarizationOverhead
InstructionCost getScalarizationOverhead(VectorType *Ty, const APInt &DemandedElts, bool Insert, bool Extract, TTI::TargetCostKind CostKind)
Definition: AArch64TargetTransformInfo.cpp:3081

llvm::AArch64TTIImpl::getStoreMinimumVF
unsigned getStoreMinimumVF(unsigned VF, Type *ScalarMemTy, Type *ScalarValTy) const
Definition: AArch64TargetTransformInfo.h:424

llvm::AArch64TTIImpl::getMinVectorRegisterBitWidth
unsigned getMinVectorRegisterBitWidth() const
Definition: AArch64TargetTransformInfo.h:135

llvm::AArch64TTIImpl::enableSelectOptimize
bool enableSelectOptimize()
Definition: AArch64TargetTransformInfo.h:420

llvm::AArch64TTIImpl::instCombineIntrinsic
std::optional< Instruction * > instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const
Definition: AArch64TargetTransformInfo.cpp:2101

llvm::AArch64TTIImpl::shouldMaximizeVectorBandwidth
bool shouldMaximizeVectorBandwidth(TargetTransformInfo::RegisterKind K) const
Definition: AArch64TargetTransformInfo.cpp:333

llvm::AArch64TTIImpl::isLSRCostLess
bool isLSRCostLess(const TargetTransformInfo::LSRCost &C1, const TargetTransformInfo::LSRCost &C2)
Definition: AArch64TargetTransformInfo.cpp:4489

llvm::AArch64TTIImpl::getMemoryOpCost
InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, MaybeAlign Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr)
Definition: AArch64TargetTransformInfo.cpp:3491

llvm::AArch64TTIImpl::isElementTypeLegalForScalableVector
bool isElementTypeLegalForScalableVector(Type *Ty) const
Definition: AArch64TargetTransformInfo.h:241

llvm::AArch64TTIImpl::getCostOfKeepingLiveOverCall
InstructionCost getCostOfKeepingLiveOverCall(ArrayRef< Type * > Tys)
Definition: AArch64TargetTransformInfo.cpp:3624

llvm::AArch64TTIImpl::isLegalMaskedLoadStore
bool isLegalMaskedLoadStore(Type *DataType, Align Alignment)
Definition: AArch64TargetTransformInfo.h:258

llvm::AArch64TTIImpl::areInlineCompatible
bool areInlineCompatible(const Function *Caller, const Function *Callee) const
Definition: AArch64TargetTransformInfo.cpp:242

llvm::AArch64TTIImpl::getCmpSelInstrCost
InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: AArch64TargetTransformInfo.cpp:3293

llvm::AArch64TTIImpl::enableScalableVectorization
bool enableScalableVectorization() const
Definition: AArch64TargetTransformInfo.cpp:2371

llvm::AArch64TTIImpl::useNeonVector
bool useNeonVector(const Type *Ty) const
Definition: AArch64TargetTransformInfo.cpp:3487

llvm::AArch64TTIImpl::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, Value *Op0, Value *Op1)
Definition: AArch64TargetTransformInfo.cpp:3065

llvm::AArch64TTIImpl::getPopcntSupport
TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth)
Definition: AArch64TargetTransformInfo.cpp:504

llvm::AArch64TTIImpl::areTypesABICompatible
bool areTypesABICompatible(const Function *Caller, const Function *Callee, const ArrayRef< Type * > &Types) const
Definition: AArch64TargetTransformInfo.cpp:275

llvm::AArch64TTIImpl::getRegisterBitWidth
TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const
Definition: AArch64TargetTransformInfo.cpp:2377

llvm::AArch64TTIImpl::getGatherScatterOpCost
InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: AArch64TargetTransformInfo.cpp:3454

llvm::AArch64TTIImpl::isLegalMaskedLoad
bool isLegalMaskedLoad(Type *DataType, Align Alignment)
Definition: AArch64TargetTransformInfo.h:270

llvm::AArch64TTIImpl::AArch64TTIImpl
AArch64TTIImpl(const AArch64TargetMachine *TM, const Function &F)
Definition: AArch64TargetTransformInfo.h:73

llvm::AArch64TTIImpl::getMaxNumElements
unsigned getMaxNumElements(ElementCount VF) const
Try to return an estimate cost factor that can be used as a multiplier when scalarizing an operation ...
Definition: AArch64TargetTransformInfo.h:151

llvm::AArch64TTIImpl::isLegalNTLoad
bool isLegalNTLoad(Type *DataType, Align Alignment)
Definition: AArch64TargetTransformInfo.h:337

llvm::AArch64TTIImpl::preferPredicateOverEpilogue
bool preferPredicateOverEpilogue(TailFoldingInfo *TFI)
Definition: AArch64TargetTransformInfo.cpp:4413

llvm::AArch64TTIImpl::getPreferredTailFoldingStyle
TailFoldingStyle getPreferredTailFoldingStyle(bool IVUpdateMayOverflow) const
Definition: AArch64TargetTransformInfo.h:365

llvm::AArch64TTIImpl::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Op2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args=std::nullopt, const Instruction *CxtI=nullptr)
Definition: AArch64TargetTransformInfo.cpp:3093

llvm::AArch64TTIImpl::isLegalMaskedGatherScatter
bool isLegalMaskedGatherScatter(Type *DataType) const
Definition: AArch64TargetTransformInfo.h:278

llvm::AArch64TTIImpl::getMaxInterleaveFactor
unsigned getMaxInterleaveFactor(ElementCount VF)
Definition: AArch64TargetTransformInfo.cpp:3638

llvm::AArch64TTIImpl::isLegalMaskedScatter
bool isLegalMaskedScatter(Type *DataType, Align Alignment) const
Definition: AArch64TargetTransformInfo.h:295

llvm::AArch64TTIImpl::getPeelingPreferences
void getPeelingPreferences(Loop *L, ScalarEvolution &SE, TTI::PeelingPreferences &PP)
Definition: AArch64TargetTransformInfo.cpp:3750

llvm::AArch64TTIImpl::getCFInstrCost
InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: AArch64TargetTransformInfo.cpp:3002

llvm::AArch64TTIImpl::getIntImmCost
InstructionCost getIntImmCost(int64_t Val)
Calculate the cost of materializing a 64-bit value.
Definition: AArch64TargetTransformInfo.cpp:343

llvm::AArch64TTIImpl::getNumberOfRegisters
unsigned getNumberOfRegisters(unsigned ClassID) const
Definition: AArch64TargetTransformInfo.h:111

llvm::AArch64TTIImpl::simplifyDemandedVectorEltsIntrinsic
std::optional< Value * > simplifyDemandedVectorEltsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts, APInt &UndefElts2, APInt &UndefElts3, std::function< void(Instruction *, unsigned, APInt, APInt &)> SimplifyAndSetOp) const
Definition: AArch64TargetTransformInfo.cpp:2345

llvm::AArch64TTIImpl::getShuffleCost
InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *Tp, ArrayRef< int > Mask, TTI::TargetCostKind CostKind, int Index, VectorType *SubTp, ArrayRef< const Value * > Args=std::nullopt, const Instruction *CxtI=nullptr)
Definition: AArch64TargetTransformInfo.cpp:4111

llvm::AArch64TTIImpl::getUnrollingPreferences
void getUnrollingPreferences(Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP, OptimizationRemarkEmitter *ORE)
Definition: AArch64TargetTransformInfo.cpp:3694

llvm::AArch64TTIImpl::isLegalMaskedGather
bool isLegalMaskedGather(Type *DataType, Align Alignment) const
Definition: AArch64TargetTransformInfo.h:291

llvm::AArch64TTIImpl::isVScaleKnownToBeAPowerOfTwo
bool isVScaleKnownToBeAPowerOfTwo() const
Definition: AArch64TargetTransformInfo.h:143

llvm::AArch64TTIImpl::getTgtMemIntrinsic
bool getTgtMemIntrinsic(IntrinsicInst *Inst, MemIntrinsicInfo &Info)
Definition: AArch64TargetTransformInfo.cpp:3791

llvm::AArch64TTIImpl::enableMemCmpExpansion
TTI::MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const
Definition: AArch64TargetTransformInfo.cpp:3384

llvm::AArch64TTIImpl::getMinMaxReductionCost
InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *Ty, FastMathFlags FMF, TTI::TargetCostKind CostKind)
Definition: AArch64TargetTransformInfo.cpp:3894

llvm::AArch64TTIImpl::enableInterleavedAccessVectorization
bool enableInterleavedAccessVectorization()
Definition: AArch64TargetTransformInfo.h:107

llvm::AArch64TTIImpl::isLegalNTStore
bool isLegalNTStore(Type *DataType, Align Alignment)
Definition: AArch64TargetTransformInfo.h:333

llvm::AArch64TTIImpl::isExtPartOfAvgExpr
bool isExtPartOfAvgExpr(const Instruction *ExtUser, Type *Dst, Type *Src)
Definition: AArch64TargetTransformInfo.cpp:2498

llvm::AArch64TTIImpl::getIntImmCostIntrin
InstructionCost getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx, const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind)
Definition: AArch64TargetTransformInfo.cpp:452

llvm::AArch64TargetLowering
Definition: AArch64ISelLowering.h:559

llvm::AArch64TargetMachine
Definition: AArch64TargetMachine.h:24

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:78

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::BasicTTIImplBase
Base class which can be used to help build a TTI implementation.
Definition: BasicTTIImpl.h:81

llvm::BasicTTIImplBase< AArch64TTIImpl >::getStoreMinimumVF
unsigned getStoreMinimumVF(unsigned VF, Type *ScalarMemTy, Type *ScalarValTy) const
Definition: BasicTTIImpl.h:357

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition: InstrTypes.h:1236

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition: InstrTypes.h:757

llvm::ElementCount
Definition: TypeSize.h:300

llvm::FastMathFlags
Convenience struct for specifying and reasoning about fast-math flags.
Definition: FMF.h:20

llvm::Function
Definition: Function.h:64

llvm::GlobalValue
Definition: GlobalValue.h:48

llvm::InstCombiner
The core instruction combiner logic.
Definition: InstCombiner.h:47

llvm::InstructionCost
Definition: InstructionCost.h:29

llvm::Instruction
Definition: Instruction.h:68

llvm::IntrinsicCostAttributes
Definition: TargetTransformInfo.h:121

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:48

llvm::RecurrenceDescriptor
The RecurrenceDescriptor is used to identify recurrences variables in a loop.
Definition: IVDescriptors.h:71

llvm::StackOffset
StackOffset holds a fixed and a scalable offset in bytes.
Definition: TypeSize.h:33

llvm::TargetTransformInfoImplBase::getDataLayout
const DataLayout & getDataLayout() const
Definition: TargetTransformInfoImpl.h:48

llvm::TargetTransformInfoImplBase::isLegalNTStore
bool isLegalNTStore(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:274

llvm::TargetTransformInfoImplBase::getIntImmCost
InstructionCost getIntImmCost(const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:441

llvm::TargetTransformInfoImplBase::isLegalNTLoad
bool isLegalNTLoad(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:281

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition: TargetTransformInfo.h:214

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition: TargetTransformInfo.h:259

llvm::TargetTransformInfo::OP_None
@ OP_None
Definition: TargetTransformInfo.h:1090

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition: TargetTransformInfo.h:1143

llvm::TargetTransformInfo::PopcntSupportKind
PopcntSupportKind
Flags indicating the kind of support for population count.
Definition: TargetTransformInfo.h:702

llvm::TargetTransformInfo::ShuffleKind
ShuffleKind
The various kinds of shuffle patterns for vector queries.
Definition: TargetTransformInfo.h:1061

llvm::TargetTransformInfo::CastContextHint
CastContextHint
Represents a hint about the context in which a cast is used.
Definition: TargetTransformInfo.h:1338

llvm::TargetTransformInfo::OK_AnyValue
@ OK_AnyValue
Definition: TargetTransformInfo.h:1082

llvm::TypeSize
Definition: TypeSize.h:334

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::isPointerTy
bool isPointerTy() const
True if this is an instance of PointerType.
Definition: Type.h:251

llvm::Type::isFloatTy
bool isFloatTy() const
Return true if this is 'float', a 32-bit IEEE fp type.
Definition: Type.h:153

llvm::Type::isBFloatTy
bool isBFloatTy() const
Return true if this is 'bfloat', a 16-bit bfloat type.
Definition: Type.h:145

llvm::Type::getScalarSizeInBits
unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.

llvm::Type::isHalfTy
bool isHalfTy() const
Return true if this is 'half', a 16-bit IEEE fp type.
Definition: Type.h:142

llvm::Type::isDoubleTy
bool isDoubleTy() const
Return true if this is 'double', a 64-bit IEEE fp type.
Definition: Type.h:156

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition: Type.h:224

llvm::Type::getPrimitiveSizeInBits
TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.

llvm::Type::getScalarType
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition: Type.h:343

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::VectorType
Base class of all SIMD vector types.
Definition: DerivedTypes.h:403

llvm::details::FixedOrScalableQuantity::getFixedValue
constexpr ScalarTy getFixedValue() const
Definition: TypeSize.h:202

llvm::details::FixedOrScalableQuantity::isScalable
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition: TypeSize.h:171

llvm::details::FixedOrScalableQuantity::getKnownMinValue
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
Definition: TypeSize.h:168

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition: AMDGPUMetadata.h:395

llvm::Intrinsic::ID
unsigned ID
Definition: GenericSSAContext.h:28

llvm::TargetStackID::Value
Value
Definition: TargetFrameLowering.h:29

llvm::dwarf::Index
Index
Definition: Dwarf.h:875

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::AddressSpace
AddressSpace
Definition: NVPTXBaseInfo.h:21

llvm::isPowerOf2_64
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
Definition: MathExtras.h:296

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition: MathExtras.h:291

llvm::TailFoldingStyle
TailFoldingStyle
Definition: TargetTransformInfo.h:167

llvm::TailFoldingStyle::DataAndControlFlowWithoutRuntimeCheck
@ DataAndControlFlowWithoutRuntimeCheck
Use predicate to control both data and control flow, but modify the trip count so that a runtime over...

llvm::TailFoldingStyle::DataAndControlFlow
@ DataAndControlFlow
Use predicate to control both data and control flow.

llvm::TailFoldingStyle::DataWithoutLaneMask
@ DataWithoutLaneMask
Same as Data, but avoids using the get.active.lane.mask intrinsic to calculate the mask and instead i...

llvm::VFParamKind::Vector
@ Vector

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::TailFoldingInfo
Definition: TargetTransformInfo.h:200

llvm::TargetTransformInfo::LSRCost
Definition: TargetTransformInfo.h:517

llvm::TargetTransformInfo::OperandValueInfo
Definition: TargetTransformInfo.h:1098

llvm::TargetTransformInfo::ReductionFlags
Flags describing the kind of vector reduction.
Definition: TargetTransformInfo.h:1679