doxygen/ARMTargetTransformInfo_8h_source.html

//===- ARMTargetTransformInfo.h - ARM specific TTI --------------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

/// \file

/// This file defines a TargetTransformInfo::Concept conforming object specific to the

/// ARM target machine. It uses the target's detailed information to

/// provide more precise answers to certain TTI queries, while letting the

/// target independent and default TTI implementations handle the rest.

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_ARM_ARMTARGETTRANSFORMINFO_H

#define LLVM_LIB_TARGET_ARM_ARMTARGETTRANSFORMINFO_H


#include "ARM.h"

#include "ARMSubtarget.h"

#include "ARMTargetMachine.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/CodeGen/BasicTTIImpl.h"

#include "llvm/IR/Constant.h"

#include "llvm/IR/Function.h"

#include "llvm/TargetParser/SubtargetFeature.h"

#include <optional>


namespace llvm {


class APInt;

class ARMTargetLowering;

class Instruction;

class Loop;

class SCEV;

class ScalarEvolution;

class Type;

class Value;


namespace TailPredication {
/// Tail-predication modes. The enumerators are numbered consecutively,
/// starting at Disabled (0) and ending at ForceEnabled (4).
enum Mode {
  Disabled = 0,
  EnabledNoReductions = 1,
  Enabled = 2,
  ForceEnabledNoReductions = 3,
  ForceEnabled = 4
};
} // end namespace TailPredication


// Settings that control whether a memcpy is converted into a Tail Predicated
// loop.
namespace TPLoop {
/// Enumerators are numbered consecutively from ForceDisabled (0).
enum MemTransfer {
  ForceDisabled = 0,
  ForceEnabled = 1,
  Allow = 2
};
} // end namespace TPLoop


/// ARM-specific TargetTransformInfo implementation. It derives from
/// BasicTTIImplBase instantiated on itself (CRTP); per the file header, queries
/// that are not answered here are left to the target independent and default
/// TTI implementations. Member functions declared without a body in this class
/// are defined out of line and their behaviour is not visible from this header.
class ARMTTIImpl : public BasicTTIImplBase<ARMTTIImpl> {

  using BaseT = BasicTTIImplBase<ARMTTIImpl>;

  using TTI = TargetTransformInfo;


  // The base class is a friend, which gives it access to the private members
  // declared below (presumably getST()/getTLI() -- confirm against
  // BasicTTIImpl.h).
  friend BaseT;


  // Subtarget selected for the function handed to the constructor.
  const ARMSubtarget *ST;

  // Target lowering object obtained from ST in the constructor.
  const ARMTargetLowering *TLI;


  // Currently the following features are excluded from InlineFeaturesAllowed.

  // ModeThumb, FeatureNoARM, ModeSoftFloat, FeatureFP64, FeatureD32

  // Depending on whether they are set or unset, different

  // instructions/registers are available. For example, inlining a callee with

  // -thumb-mode in a caller with +thumb-mode, may cause the assembler to

  // fail if the callee uses ARM only instructions, e.g. in inline asm.

  // NOTE(review): presumably consumed by areInlineCompatible() in the .cpp --
  // confirm there. As a non-static member it is initialised per instance.
  const FeatureBitset InlineFeaturesAllowed = {

      ARM::FeatureVFP2, ARM::FeatureVFP3, ARM::FeatureNEON, ARM::FeatureThumb2,

      ARM::FeatureFP16, ARM::FeatureVFP4, ARM::FeatureFPARMv8,

      ARM::FeatureFullFP16, ARM::FeatureFP16FML, ARM::FeatureHWDivThumb,

      ARM::FeatureHWDivARM, ARM::FeatureDB, ARM::FeatureV7Clrex,

      ARM::FeatureAcquireRelease, ARM::FeatureSlowFPBrcc,

      ARM::FeaturePerfMon, ARM::FeatureTrustZone, ARM::Feature8MSecExt,

      ARM::FeatureCrypto, ARM::FeatureCRC, ARM::FeatureRAS,

      ARM::FeatureFPAO, ARM::FeatureFuseAES, ARM::FeatureZCZeroing,

      ARM::FeatureProfUnpredicate, ARM::FeatureSlowVGETLNi32,

      ARM::FeatureSlowVDUP32, ARM::FeaturePreferVMOVSR,

      ARM::FeaturePrefISHSTBarrier, ARM::FeatureMuxedUnits,

      ARM::FeatureSlowOddRegister, ARM::FeatureSlowLoadDSubreg,

      ARM::FeatureDontWidenVMOVS, ARM::FeatureExpandMLx,

      ARM::FeatureHasVMLxHazards, ARM::FeatureNEONForFPMovs,

      ARM::FeatureNEONForFP, ARM::FeatureCheckVLDnAlign,

      ARM::FeatureHasSlowFPVMLx, ARM::FeatureHasSlowFPVFMx,

      ARM::FeatureVMLxForwarding, ARM::FeaturePref32BitThumb,

      ARM::FeatureAvoidPartialCPSR, ARM::FeatureCheapPredicableCPSR,

      ARM::FeatureAvoidMOVsShOp, ARM::FeatureHasRetAddrStack,

      ARM::FeatureHasNoBranchPredictor, ARM::FeatureDSP, ARM::FeatureMP,

      ARM::FeatureVirtualization, ARM::FeatureMClass, ARM::FeatureRClass,

      ARM::FeatureAClass, ARM::FeatureNaClTrap, ARM::FeatureStrictAlign,

      ARM::FeatureLongCalls, ARM::FeatureExecuteOnly, ARM::FeatureReserveR9,

      ARM::FeatureNoMovt, ARM::FeatureNoNegativeImmediates

  };


  // Private accessors for the cached subtarget and target lowering.
  const ARMSubtarget *getST() const { return ST; }

  const ARMTargetLowering *getTLI() const { return TLI; }


public:

  /// Builds the TTI for function \p F: the base class receives \p TM and the
  /// data layout obtained through F's parent, ST is the subtarget that \p TM
  /// reports for \p F, and TLI is that subtarget's target lowering.
  explicit ARMTTIImpl(const ARMBaseTargetMachine *TM, const Function &F)

      : BaseT(TM, F.getParent()->getDataLayout()), ST(TM->getSubtargetImpl(F)),

        TLI(ST->getTargetLowering()) {}


  bool areInlineCompatible(const Function *Caller,

                           const Function *Callee) const;


  /// Unconditionally returns true.
  bool enableInterleavedAccessVectorization() { return true; }


  TTI::AddressingModeKind

    getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const;


  /// Floating-point computation using ARMv8 AArch32 Advanced

  /// SIMD instructions remains unchanged from ARMv7. Only AArch64 SIMD

  /// and Arm MVE are IEEE-754 compliant.

  /// Returns true only when the subtarget is neither a Darwin target nor has
  /// MVE floating-point operations.
  bool isFPVectorizationPotentiallyUnsafe() {

    return !ST->isTargetDarwin() && !ST->hasMVEFloatOps();

  }


  std::optional<Instruction *> instCombineIntrinsic(InstCombiner &IC,

                                                    IntrinsicInst &II) const;

  std::optional<Value *> simplifyDemandedVectorEltsIntrinsic(

      InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts,

      APInt &UndefElts2, APInt &UndefElts3,

      std::function<void(Instruction *, unsigned, APInt, APInt &)>

          SimplifyAndSetOp) const;


  /// \name Scalar TTI Implementations

  /// @{


  InstructionCost getIntImmCodeSizeCost(unsigned Opcode, unsigned Idx,

                                        const APInt &Imm, Type *Ty);


  // Keep the base-class getIntImmCost overloads visible; the declaration
  // below would otherwise hide them.
  using BaseT::getIntImmCost;

  InstructionCost getIntImmCost(const APInt &Imm, Type *Ty,

                                TTI::TargetCostKind CostKind);


  InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx,

                                    const APInt &Imm, Type *Ty,

                                    TTI::TargetCostKind CostKind,

                                    Instruction *Inst = nullptr);


  /// @}


  /// \name Vector TTI Implementations

  /// @{


  /// Returns the register count for \p ClassID. A ClassID of 1 is treated as
  /// the vector class: 16 with NEON, otherwise 8 with MVE integer ops,
  /// otherwise 0. Any other ClassID yields 8 on Thumb1-only subtargets and 13
  /// elsewhere.
  unsigned getNumberOfRegisters(unsigned ClassID) const {

    bool Vector = (ClassID == 1);

    if (Vector) {

      if (ST->hasNEON())

        return 16;

      if (ST->hasMVEIntegerOps())

        return 8;

      return 0;

    }


    if (ST->isThumb1Only())

      return 8;

    return 13;

  }


  /// Returns the register width in bits for kind \p K: 32 for scalars; for
  /// fixed-width vectors 128 when NEON or MVE integer ops are available and 0
  /// otherwise; a scalable size of 0 for scalable vectors.
  TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const {

    switch (K) {

    case TargetTransformInfo::RGK_Scalar:

      return TypeSize::getFixed(32);

    case TargetTransformInfo::RGK_FixedWidthVector:

      if (ST->hasNEON())

        return TypeSize::getFixed(128);

      if (ST->hasMVEIntegerOps())

        return TypeSize::getFixed(128);

      return TypeSize::getFixed(0);

    case TargetTransformInfo::RGK_ScalableVector:

      return TypeSize::getScalable(0);

    }

    llvm_unreachable("Unsupported register kind");

  }


  /// Forwards to the subtarget's getMaxInterleaveFactor(); \p VF is not used.
  unsigned getMaxInterleaveFactor(ElementCount VF) {

    return ST->getMaxInterleaveFactor();

  }


  bool isProfitableLSRChainElement(Instruction *I);


  bool isLegalMaskedLoad(Type *DataTy, Align Alignment);


  /// Masked stores use the same legality answer as masked loads.
  bool isLegalMaskedStore(Type *DataTy, Align Alignment) {

    return isLegalMaskedLoad(DataTy, Alignment);

  }


  /// Always returns true; neither argument is inspected.
  bool forceScalarizeMaskedGather(VectorType *VTy, Align Alignment) {

    // For MVE, we have a custom lowering pass that will already have custom

    // legalised any gathers that we can lower to MVE intrinsics, and want to

    // expand all the rest. The pass runs before the masked intrinsic lowering

    // pass.

    return true;

  }


  /// Scatters use the same answer as gathers.
  bool forceScalarizeMaskedScatter(VectorType *VTy, Align Alignment) {

    return forceScalarizeMaskedGather(VTy, Alignment);

  }


  bool isLegalMaskedGather(Type *Ty, Align Alignment);


  /// Masked scatters use the same legality answer as masked gathers.
  bool isLegalMaskedScatter(Type *Ty, Align Alignment) {

    return isLegalMaskedGather(Ty, Alignment);

  }


  InstructionCost getMemcpyCost(const Instruction *I);


  /// Forwards to the subtarget's getMaxInlineSizeThreshold().
  uint64_t getMaxMemIntrinsicInlineSizeThreshold() const {

    return ST->getMaxInlineSizeThreshold();

  }


  int getNumMemOps(const IntrinsicInst *I) const;


  InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *Tp,

                                 ArrayRef<int> Mask,

                                 TTI::TargetCostKind CostKind, int Index,

                                 VectorType *SubTp,

                                 ArrayRef<const Value *> Args = std::nullopt,

                                 const Instruction *CxtI = nullptr);


  bool preferInLoopReduction(unsigned Opcode, Type *Ty,

                             TTI::ReductionFlags Flags) const;


  bool preferPredicatedReductionSelect(unsigned Opcode, Type *Ty,

                                       TTI::ReductionFlags Flags) const;


  /// Always returns false; \p II is not inspected.
  bool shouldExpandReduction(const IntrinsicInst *II) const { return false; }


  InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind,

                                 const Instruction *I = nullptr);


  InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src,

                                   TTI::CastContextHint CCH,

                                   TTI::TargetCostKind CostKind,

                                   const Instruction *I = nullptr);


  InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy,

                                     CmpInst::Predicate VecPred,

                                     TTI::TargetCostKind CostKind,

                                     const Instruction *I = nullptr);


  // Keep the base-class getVectorInstrCost overloads visible; the declaration
  // below would otherwise hide them.
  using BaseT::getVectorInstrCost;

  InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val,

                                     TTI::TargetCostKind CostKind,

                                     unsigned Index, Value *Op0, Value *Op1);


  InstructionCost getAddressComputationCost(Type *Val, ScalarEvolution *SE,

                                            const SCEV *Ptr);


  InstructionCost getArithmeticInstrCost(

      unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,

      TTI::OperandValueInfo Op1Info = {TTI::OK_AnyValue, TTI::OP_None},

      TTI::OperandValueInfo Op2Info = {TTI::OK_AnyValue, TTI::OP_None},

      ArrayRef<const Value *> Args = ArrayRef<const Value *>(),

      const Instruction *CxtI = nullptr);


  InstructionCost

  getMemoryOpCost(unsigned Opcode, Type *Src, MaybeAlign Alignment,

                  unsigned AddressSpace, TTI::TargetCostKind CostKind,

                  TTI::OperandValueInfo OpInfo = {TTI::OK_AnyValue, TTI::OP_None},

                  const Instruction *I = nullptr);


  InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *Src,

                                        Align Alignment, unsigned AddressSpace,

                                        TTI::TargetCostKind CostKind);


  InstructionCost getInterleavedMemoryOpCost(

      unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,

      Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,

      bool UseMaskForCond = false, bool UseMaskForGaps = false);


  InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy,

                                         const Value *Ptr, bool VariableMask,

                                         Align Alignment,

                                         TTI::TargetCostKind CostKind,

                                         const Instruction *I = nullptr);


  InstructionCost getArithmeticReductionCost(unsigned Opcode, VectorType *ValTy,

                                             std::optional<FastMathFlags> FMF,

                                             TTI::TargetCostKind CostKind);

  InstructionCost getExtendedReductionCost(unsigned Opcode, bool IsUnsigned,

                                           Type *ResTy, VectorType *ValTy,

                                           FastMathFlags FMF,

                                           TTI::TargetCostKind CostKind);

  InstructionCost getMulAccReductionCost(bool IsUnsigned, Type *ResTy,

                                         VectorType *ValTy,

                                         TTI::TargetCostKind CostKind);


  InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *Ty,

                                         FastMathFlags FMF,

                                         TTI::TargetCostKind CostKind);


  InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA,

                                        TTI::TargetCostKind CostKind);


  /// getScalingFactorCost - Return the cost of the scaling used in

  /// addressing mode represented by AM.

  /// If the AM is supported, the return value must be >= 0.

  /// If the AM is not supported, the return value must be negative.

  InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV,

                                       int64_t BaseOffset, bool HasBaseReg,

                                       int64_t Scale, unsigned AddrSpace) const;


  bool maybeLoweredToCall(Instruction &I);

  bool isLoweredToCall(const Function *F);

  bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE,

                                AssumptionCache &AC,

                                TargetLibraryInfo *LibInfo,

                                HardwareLoopInfo &HWLoopInfo);

  bool preferPredicateOverEpilogue(TailFoldingInfo *TFI);

  void getUnrollingPreferences(Loop *L, ScalarEvolution &SE,

                               TTI::UnrollingPreferences &UP,

                               OptimizationRemarkEmitter *ORE);


  TailFoldingStyle

  getPreferredTailFoldingStyle(bool IVUpdateMayOverflow = true) const;


  void getPeelingPreferences(Loop *L, ScalarEvolution &SE,

                             TTI::PeelingPreferences &PP);

  /// Returns false only when the subtarget uses ROPI or RWPI and \p C needs
  /// dynamic relocation; returns true in every other case.
  bool shouldBuildLookupTablesForConstant(Constant *C) const {

    // In the ROPI and RWPI relocation models we can't have pointers to global

    // variables or functions in constant data, so don't convert switches to

    // lookup tables if any of the values would need relocation.

    if (ST->isROPI() || ST->isRWPI())

      return !C->needsDynamicRelocation();


    return true;

  }


  bool hasArmWideBranch(bool Thumb) const;


  /// @}

};


/// Returns true when the shuffle mask \p M matches a VREV instruction with the
/// given \p BlockSize, i.e. the elements inside every block of the vector
/// appear in reversed order. Negative (UNDEF) mask entries match any position.
/// \p BlockSize must be 16, 32 or 64; only element sizes of 8, 16 and 32 bits
/// (taken from \p VT) are accepted.
inline bool isVREVMask(ArrayRef<int> M, EVT VT, unsigned BlockSize) {
  assert((BlockSize == 16 || BlockSize == 32 || BlockSize == 64) &&
         "Only possible block sizes for VREV are: 16, 32, 64");

  const unsigned EltBits = VT.getScalarSizeInBits();
  const bool IsSupportedElt = EltBits == 8 || EltBits == 16 || EltBits == 32;
  if (!IsSupportedElt)
    return false;

  // In a reversed block the first index names the block's last element, so it
  // determines the number of elements per block. When that index is UNDEF, be
  // optimistic and assume the block size the caller asked for.
  const int FirstIdx = M[0];
  const unsigned EltsPerBlock =
      FirstIdx < 0 ? BlockSize / EltBits : static_cast<unsigned>(FirstIdx + 1);

  // A block has to be wider than a single element and must be made up of
  // exactly EltsPerBlock elements.
  const bool BlockFits =
      BlockSize > EltBits && BlockSize == EltsPerBlock * EltBits;
  if (!BlockFits)
    return false;

  for (unsigned Idx = 0, NumElts = M.size(); Idx != NumElts; ++Idx) {
    const int Lane = M[Idx];
    if (Lane < 0)
      continue; // UNDEF entries are ignored.

    // Position Idx sits at offset PosInBlock of its block; the reversed
    // layout expects the mirrored element of that same block there.
    const unsigned PosInBlock = Idx % EltsPerBlock;
    const unsigned BlockStart = Idx - PosInBlock;
    const unsigned Expected = BlockStart + (EltsPerBlock - 1 - PosInBlock);
    if (static_cast<unsigned>(Lane) != Expected)
      return false;
  }

  return true;
}


} // end namespace llvm


#endif // LLVM_LIB_TARGET_ARM_ARMTARGETTRANSFORMINFO_H

ARMSubtarget.h

ARMTargetMachine.h

ARM.h

ArrayRef.h

getParent
static const Function * getParent(const Value *V)
Definition: BasicAliasAnalysis.cpp:848

BasicTTIImpl.h
This file provides a helper that implements much of the TTI interface in terms of the target-independ...

Type
RelocType Type
Definition: COFFYAML.cpp:391

Constant.h

CostKind
static cl::opt< TargetTransformInfo::TargetCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(TargetTransformInfo::TCK_RecipThroughput), cl::values(clEnumValN(TargetTransformInfo::TCK_RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(TargetTransformInfo::TCK_Latency, "latency", "Instruction latency"), clEnumValN(TargetTransformInfo::TCK_CodeSize, "code-size", "Code size"), clEnumValN(TargetTransformInfo::TCK_SizeAndLatency, "size-latency", "Code size and latency")))

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:354

Function.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

TM
const char LLVMTargetMachineRef TM
Definition: PassBuilderBindings.cpp:47

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

SubtargetFeature.h

BlockSize
static const int BlockSize
Definition: TarWriter.cpp:33

Ptr
@ Ptr
Definition: TargetLibraryInfo.cpp:76

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

VectorType
Definition: ItaniumDemangle.h:1149

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:76

llvm::ARMBaseTargetMachine
Definition: ARMTargetMachine.h:27

llvm::ARMSubtarget
Definition: ARMSubtarget.h:48

llvm::ARMTTIImpl
Definition: ARMTargetTransformInfo.h:57

llvm::ARMTTIImpl::preferInLoopReduction
bool preferInLoopReduction(unsigned Opcode, Type *Ty, TTI::ReductionFlags Flags) const
Definition: ARMTargetTransformInfo.cpp:2552

llvm::ARMTTIImpl::getAddressComputationCost
InstructionCost getAddressComputationCost(Type *Val, ScalarEvolution *SE, const SCEV *Ptr)
Definition: ARMTargetTransformInfo.cpp:1064

llvm::ARMTTIImpl::maybeLoweredToCall
bool maybeLoweredToCall(Instruction &I)
Definition: ARMTargetTransformInfo.cpp:2051

llvm::ARMTTIImpl::enableInterleavedAccessVectorization
bool enableInterleavedAccessVectorization()
Definition: ARMTargetTransformInfo.h:110

llvm::ARMTTIImpl::getPreferredTailFoldingStyle
TailFoldingStyle getPreferredTailFoldingStyle(bool IVUpdateMayOverflow=true) const
Definition: ARMTargetTransformInfo.cpp:2428

llvm::ARMTTIImpl::isLegalMaskedStore
bool isLegalMaskedStore(Type *DataTy, Align Alignment)
Definition: ARMTargetTransformInfo.h:189

llvm::ARMTTIImpl::isLegalMaskedLoad
bool isLegalMaskedLoad(Type *DataTy, Align Alignment)
Definition: ARMTargetTransformInfo.cpp:1103

llvm::ARMTTIImpl::getMemcpyCost
InstructionCost getMemcpyCost(const Instruction *I)
Definition: ARMTargetTransformInfo.cpp:1201

llvm::ARMTTIImpl::shouldBuildLookupTablesForConstant
bool shouldBuildLookupTablesForConstant(Constant *C) const
Definition: ARMTargetTransformInfo.h:325

llvm::ARMTTIImpl::getIntImmCost
InstructionCost getIntImmCost(const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind)
Definition: ARMTargetTransformInfo.cpp:297

llvm::ARMTTIImpl::isLoweredToCall
bool isLoweredToCall(const Function *F)
Definition: ARMTargetTransformInfo.cpp:1990

llvm::ARMTTIImpl::getMulAccReductionCost
InstructionCost getMulAccReductionCost(bool IsUnsigned, Type *ResTy, VectorType *ValTy, TTI::TargetCostKind CostKind)
Definition: ARMTargetTransformInfo.cpp:1798

llvm::ARMTTIImpl::getIntrinsicInstrCost
InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA, TTI::TargetCostKind CostKind)
Definition: ARMTargetTransformInfo.cpp:1885

llvm::ARMTTIImpl::isHardwareLoopProfitable
bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE, AssumptionCache &AC, TargetLibraryInfo *LibInfo, HardwareLoopInfo &HWLoopInfo)
Definition: ARMTargetTransformInfo.cpp:2138

llvm::ARMTTIImpl::isFPVectorizationPotentiallyUnsafe
bool isFPVectorizationPotentiallyUnsafe()
Floating-point computation using ARMv8 AArch32 Advanced SIMD instructions remains unchanged from ARMv...
Definition: ARMTargetTransformInfo.h:118

llvm::ARMTTIImpl::getNumMemOps
int getNumMemOps(const IntrinsicInst *I) const
Given a memcpy/memset/memmove instruction, return the number of memory operations performed,...
Definition: ARMTargetTransformInfo.cpp:1135

llvm::ARMTTIImpl::instCombineIntrinsic
std::optional< Instruction * > instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const
Definition: ARMTargetTransformInfo.cpp:122

llvm::ARMTTIImpl::getArithmeticReductionCost
InstructionCost getArithmeticReductionCost(unsigned Opcode, VectorType *ValTy, std::optional< FastMathFlags > FMF, TTI::TargetCostKind CostKind)
Definition: ARMTargetTransformInfo.cpp:1678

llvm::ARMTTIImpl::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Op2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args=ArrayRef< const Value * >(), const Instruction *CxtI=nullptr)
Definition: ARMTargetTransformInfo.cpp:1326

llvm::ARMTTIImpl::getCastInstrCost
InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: ARMTargetTransformInfo.cpp:474

llvm::ARMTTIImpl::getUnrollingPreferences
void getUnrollingPreferences(Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP, OptimizationRemarkEmitter *ORE)
Definition: ARMTargetTransformInfo.cpp:2438

llvm::ARMTTIImpl::isLegalMaskedScatter
bool isLegalMaskedScatter(Type *Ty, Align Alignment)
Definition: ARMTargetTransformInfo.h:207

llvm::ARMTTIImpl::shouldExpandReduction
bool shouldExpandReduction(const IntrinsicInst *II) const
Definition: ARMTargetTransformInfo.h:232

llvm::ARMTTIImpl::getMinMaxReductionCost
InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *Ty, FastMathFlags FMF, TTI::TargetCostKind CostKind)
Definition: ARMTargetTransformInfo.cpp:1825

llvm::ARMTTIImpl::hasArmWideBranch
bool hasArmWideBranch(bool Thumb) const
Definition: ARMTargetTransformInfo.cpp:2590

llvm::ARMTTIImpl::forceScalarizeMaskedGather
bool forceScalarizeMaskedGather(VectorType *VTy, Align Alignment)
Definition: ARMTargetTransformInfo.h:193

llvm::ARMTTIImpl::getMaxMemIntrinsicInlineSizeThreshold
uint64_t getMaxMemIntrinsicInlineSizeThreshold() const
Definition: ARMTargetTransformInfo.h:213

llvm::ARMTTIImpl::preferPredicateOverEpilogue
bool preferPredicateOverEpilogue(TailFoldingInfo *TFI)
Definition: ARMTargetTransformInfo.cpp:2374

llvm::ARMTTIImpl::ARMTTIImpl
ARMTTIImpl(const ARMBaseTargetMachine *TM, const Function &F)
Definition: ARMTargetTransformInfo.h:103

llvm::ARMTTIImpl::getGatherScatterOpCost
InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: ARMTargetTransformInfo.cpp:1573

llvm::ARMTTIImpl::getIntImmCostInst
InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx, const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind, Instruction *Inst=nullptr)
Definition: ARMTargetTransformInfo.cpp:389

llvm::ARMTTIImpl::getCmpSelInstrCost
InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: ARMTargetTransformInfo.cpp:917

llvm::ARMTTIImpl::isLegalMaskedGather
bool isLegalMaskedGather(Type *Ty, Align Alignment)
Definition: ARMTargetTransformInfo.cpp:1123

llvm::ARMTTIImpl::areInlineCompatible
bool areInlineCompatible(const Function *Caller, const Function *Callee) const
Definition: ARMTargetTransformInfo.cpp:87

llvm::ARMTTIImpl::getInterleavedMemoryOpCost
InstructionCost getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond=false, bool UseMaskForGaps=false)
Definition: ARMTargetTransformInfo.cpp:1532

llvm::ARMTTIImpl::getCFInstrCost
InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: ARMTargetTransformInfo.cpp:460

llvm::ARMTTIImpl::forceScalarizeMaskedScatter
bool forceScalarizeMaskedScatter(VectorType *VTy, Align Alignment)
Definition: ARMTargetTransformInfo.h:201

llvm::ARMTTIImpl::getScalingFactorCost
InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV, int64_t BaseOffset, bool HasBaseReg, int64_t Scale, unsigned AddrSpace) const
getScalingFactorCost - Return the cost of the scaling used in addressing mode represented by AM.
Definition: ARMTargetTransformInfo.cpp:2573

llvm::ARMTTIImpl::getPreferredAddressingMode
TTI::AddressingModeKind getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const
Definition: ARMTargetTransformInfo.cpp:106

llvm::ARMTTIImpl::getIntImmCodeSizeCost
InstructionCost getIntImmCodeSizeCost(unsigned Opcode, unsigned Idx, const APInt &Imm, Type *Ty)
Definition: ARMTargetTransformInfo.cpp:332

llvm::ARMTTIImpl::getMaxInterleaveFactor
unsigned getMaxInterleaveFactor(ElementCount VF)
Definition: ARMTargetTransformInfo.h:181

llvm::ARMTTIImpl::getShuffleCost
InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *Tp, ArrayRef< int > Mask, TTI::TargetCostKind CostKind, int Index, VectorType *SubTp, ArrayRef< const Value * > Args=std::nullopt, const Instruction *CxtI=nullptr)
Definition: ARMTargetTransformInfo.cpp:1211

llvm::ARMTTIImpl::getExtendedReductionCost
InstructionCost getExtendedReductionCost(unsigned Opcode, bool IsUnsigned, Type *ResTy, VectorType *ValTy, FastMathFlags FMF, TTI::TargetCostKind CostKind)
Definition: ARMTargetTransformInfo.cpp:1763

llvm::ARMTTIImpl::preferPredicatedReductionSelect
bool preferPredicatedReductionSelect(unsigned Opcode, Type *Ty, TTI::ReductionFlags Flags) const
Definition: ARMTargetTransformInfo.cpp:2566

llvm::ARMTTIImpl::getRegisterBitWidth
TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const
Definition: ARMTargetTransformInfo.h:165

llvm::ARMTTIImpl::simplifyDemandedVectorEltsIntrinsic
std::optional< Value * > simplifyDemandedVectorEltsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts, APInt &UndefElts2, APInt &UndefElts3, std::function< void(Instruction *, unsigned, APInt, APInt &)> SimplifyAndSetOp) const
Definition: ARMTargetTransformInfo.cpp:255

llvm::ARMTTIImpl::getMaskedMemoryOpCost
InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind)
Definition: ARMTargetTransformInfo.cpp:1515

llvm::ARMTTIImpl::getNumberOfRegisters
unsigned getNumberOfRegisters(unsigned ClassID) const
Definition: ARMTargetTransformInfo.h:150

llvm::ARMTTIImpl::isProfitableLSRChainElement
bool isProfitableLSRChainElement(Instruction *I)
Definition: ARMTargetTransformInfo.cpp:1086

llvm::ARMTTIImpl::getMemoryOpCost
InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, MaybeAlign Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr)
Definition: ARMTargetTransformInfo.cpp:1467

llvm::ARMTTIImpl::getPeelingPreferences
void getPeelingPreferences(Loop *L, ScalarEvolution &SE, TTI::PeelingPreferences &PP)
Definition: ARMTargetTransformInfo.cpp:2547

llvm::ARMTTIImpl::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, Value *Op0, Value *Op1)
Definition: ARMTargetTransformInfo.cpp:878

llvm::ARMTargetLowering
Definition: ARMISelLowering.h:398

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::BasicTTIImplBase
Base class which can be used to help build a TTI implementation.
Definition: BasicTTIImpl.h:80

llvm::BasicTTIImplBase< ARMTTIImpl >::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, Value *Op0, Value *Op1)
Definition: BasicTTIImpl.h:1273

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition: InstrTypes.h:993

llvm::Constant
This is an important base class in LLVM.
Definition: Constant.h:41

llvm::ElementCount
Definition: TypeSize.h:285

llvm::FeatureBitset
Container class for subtarget features.
Definition: SubtargetFeature.h:41

llvm::Function
Definition: Function.h:62

llvm::InstCombiner
The core instruction combiner logic.
Definition: InstCombiner.h:47

llvm::InstructionCost
Definition: InstructionCost.h:29

llvm::Instruction
Definition: Instruction.h:49

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:47

llvm::Loop
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:44

llvm::SCEV
This class represents an analyzed expression in the program.
Definition: ScalarEvolution.h:75

llvm::ScalarEvolution
The main scalar evolution driver.
Definition: ScalarEvolution.h:452

llvm::TargetTransformInfoImplBase::getDataLayout
const DataLayout & getDataLayout() const
Definition: TargetTransformInfoImpl.h:47

llvm::TargetTransformInfoImplBase::getIntImmCost
InstructionCost getIntImmCost(const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:428

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition: TargetTransformInfo.h:213

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition: TargetTransformInfo.h:258

llvm::TargetTransformInfo::OP_None
@ OP_None
Definition: TargetTransformInfo.h:1076

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition: TargetTransformInfo.h:1125

llvm::TargetTransformInfo::RGK_FixedWidthVector
@ RGK_FixedWidthVector
Definition: TargetTransformInfo.h:1125

llvm::TargetTransformInfo::RGK_ScalableVector
@ RGK_ScalableVector
Definition: TargetTransformInfo.h:1125

llvm::TargetTransformInfo::RGK_Scalar
@ RGK_Scalar
Definition: TargetTransformInfo.h:1125

llvm::TargetTransformInfo::AddressingModeKind
AddressingModeKind
Definition: TargetTransformInfo.h:757

llvm::TargetTransformInfo::ShuffleKind
ShuffleKind
The various kinds of shuffle patterns for vector queries.
Definition: TargetTransformInfo.h:1047

llvm::TargetTransformInfo::CastContextHint
CastContextHint
Represents a hint about the context in which a cast is used.
Definition: TargetTransformInfo.h:1320

llvm::TargetTransformInfo::OK_AnyValue
@ OK_AnyValue
Definition: TargetTransformInfo.h:1068

llvm::TypeSize
Definition: TypeSize.h:319

llvm::TypeSize::getFixed
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition: TypeSize.h:330

llvm::TypeSize::getScalable
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Definition: TypeSize.h:333

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::VectorType
Base class of all SIMD vector types.
Definition: DerivedTypes.h:403

uint64_t

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition: AMDGPUMetadata.h:395

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::Intrinsic::ID
unsigned ID
Definition: GenericSSAContext.h:28

llvm::TPLoop::MemTransfer
MemTransfer
Definition: ARMTargetTransformInfo.h:54

llvm::TPLoop::Allow
@ Allow
Definition: ARMTargetTransformInfo.h:54

llvm::TPLoop::ForceDisabled
@ ForceDisabled
Definition: ARMTargetTransformInfo.h:54

llvm::TPLoop::ForceEnabled
@ ForceEnabled
Definition: ARMTargetTransformInfo.h:54

llvm::TailPredication::Mode
Mode
Definition: ARMTargetTransformInfo.h:43

llvm::TailPredication::ForceEnabled
@ ForceEnabled
Definition: ARMTargetTransformInfo.h:48

llvm::TailPredication::Disabled
@ Disabled
Definition: ARMTargetTransformInfo.h:44

llvm::TailPredication::EnabledNoReductions
@ EnabledNoReductions
Definition: ARMTargetTransformInfo.h:45

llvm::TailPredication::ForceEnabledNoReductions
@ ForceEnabledNoReductions
Definition: ARMTargetTransformInfo.h:47

llvm::TailPredication::Enabled
@ Enabled
Definition: ARMTargetTransformInfo.h:46

llvm::TargetStackID::Value
Value
Definition: TargetFrameLowering.h:28

llvm::dwarf::Index
Index
Definition: Dwarf.h:558

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::AddressSpace
AddressSpace
Definition: NVPTXBaseInfo.h:21

llvm::isVREVMask
bool isVREVMask(ArrayRef< int > M, EVT VT, unsigned BlockSize)
isVREVMask - Check if a vector shuffle corresponds to a VREV instruction with the specified blocksize...
Definition: ARMTargetTransformInfo.h:343

llvm::TailFoldingStyle
TailFoldingStyle
Definition: TargetTransformInfo.h:166

llvm::VFParamKind::Vector
@ Vector

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::EVT
Extended Value Type.
Definition: ValueTypes.h:34

llvm::EVT::getScalarSizeInBits
uint64_t getScalarSizeInBits() const
Definition: ValueTypes.h:370

llvm::TargetTransformInfo::OperandValueInfo
Definition: TargetTransformInfo.h:1084

llvm::TargetTransformInfo::ReductionFlags
Flags describing the kind of vector reduction.
Definition: TargetTransformInfo.h:1661