doxygen/WebAssemblyTargetTransformInfo_8cpp_source.html

//===-- WebAssemblyTargetTransformInfo.cpp - WebAssembly-specific TTI -----===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

///

/// \file

/// This file defines the WebAssembly-specific TargetTransformInfo

/// implementation.

///

//===----------------------------------------------------------------------===//


#include "WebAssemblyTargetTransformInfo.h"

using namespace llvm;


#define DEBUG_TYPE "wasmtti"


/// Report the kind of population-count support available for an integer that
/// is \p TyWidth bits wide.
///
/// \p TyWidth must be a power of two (checked by assertion). The answer does
/// not otherwise depend on the width: fast hardware support is always
/// reported.
TargetTransformInfo::PopcntSupportKind
WebAssemblyTTIImpl::getPopcntSupport(unsigned TyWidth) const {
  assert(isPowerOf2_32(TyWidth) && "Ty width must be power of 2");

  const TargetTransformInfo::PopcntSupportKind Support =
      TargetTransformInfo::PSK_FastHardware;
  return Support;
}


/// Return the number of registers to assume for register class \p ClassID.
///
/// Starts from the base implementation's answer. For the vector class
/// (\p ClassID == 1) the result is raised to at least 16, which is only a
/// rough guess for SIMD.
unsigned WebAssemblyTTIImpl::getNumberOfRegisters(unsigned ClassID) const {
  unsigned NumRegs = BaseT::getNumberOfRegisters(ClassID);

  // Class 1 is the vector register class; never report fewer than 16 there.
  const bool IsVectorClass = ClassID == 1;
  if (IsVectorClass && NumRegs < 16u)
    NumRegs = 16u;

  return NumRegs;
}


/// Return the register width, in bits, for the register kind \p K.
///
///  - Scalar registers are reported as 64 bits wide.
///  - Fixed-width vector registers are 128 bits wide when the subtarget has
///    SIMD128 and 64 bits wide otherwise.
///  - Scalable vector registers are reported with a minimum size of 0.
TypeSize WebAssemblyTTIImpl::getRegisterBitWidth(
    TargetTransformInfo::RegisterKind K) const {
  switch (K) {
  case TargetTransformInfo::RGK_Scalar:
    return TypeSize::getFixed(64);

  case TargetTransformInfo::RGK_FixedWidthVector:
    if (getST()->hasSIMD128())
      return TypeSize::getFixed(128);
    return TypeSize::getFixed(64);

  case TargetTransformInfo::RGK_ScalableVector:
    return TypeSize::getScalable(0);
  }

  llvm_unreachable("Unsupported register kind");
}


/// Estimate the cost of the arithmetic instruction \p Opcode on type \p Ty.
///
/// The generic BasicTTIImplBase estimate is used for everything except vector
/// shifts (shl/lshr/ashr) whose shift amount is not uniform. Those are costed
/// as one extract, one scalar operation and one insert per vector element.
///
/// \p Args and \p CxtI are accepted for interface compatibility; they are not
/// forwarded to the base implementation.
InstructionCost WebAssemblyTTIImpl::getArithmeticInstrCost(
    unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,
    TTI::OperandValueInfo Op1Info, TTI::OperandValueInfo Op2Info,
    ArrayRef<const Value *> Args,
    const Instruction *CxtI) {

  InstructionCost GenericCost =
      BasicTTIImplBase<WebAssemblyTTIImpl>::getArithmeticInstrCost(
          Opcode, Ty, CostKind, Op1Info, Op2Info);

  // Only vector types need a WebAssembly-specific adjustment.
  auto *VecTy = dyn_cast<VectorType>(Ty);
  if (!VecTy)
    return GenericCost;

  const bool IsShift = Opcode == Instruction::LShr ||
                       Opcode == Instruction::AShr ||
                       Opcode == Instruction::Shl;
  if (!IsShift || Op2Info.isUniform())
    return GenericCost;

  // SIMD128's shifts currently only accept a scalar shift count, so a
  // non-uniform shift is modelled as extract + scalar op + insert for every
  // element. This is a rough approximation.
  InstructionCost PerElementCost =
      TargetTransformInfo::TCC_Basic +
      getArithmeticInstrCost(Opcode, VecTy->getElementType(), CostKind) +
      TargetTransformInfo::TCC_Basic;
  return cast<FixedVectorType>(VecTy)->getNumElements() * PerElementCost;
}


/// Estimate the cost of a vector insert/extract instruction.
///
/// The base estimate is returned unchanged when \p Index is known. An
/// \p Index of -1u adds a penalty of 25 * TCC_Expensive, because SIMD128's
/// insert/extract currently only take constant indices.
InstructionCost
WebAssemblyTTIImpl::getVectorInstrCost(unsigned Opcode, Type *Val,
                                       TTI::TargetCostKind CostKind,
                                       unsigned Index, Value *Op0, Value *Op1) {
  InstructionCost BaseCost = BasicTTIImplBase::getVectorInstrCost(
      Opcode, Val, CostKind, Index, Op0, Op1);

  // A known index needs no adjustment.
  if (Index != -1u)
    return BaseCost;

  // SIMD128's insert/extract currently only take constant indices.
  return BaseCost + 25 * TargetTransformInfo::TCC_Expensive;
}


/// Choose the shuffle pattern to use when the reduction intrinsic \p II is
/// expanded.
///
/// vector_reduce_fadd uses the pairwise pattern; every other intrinsic uses
/// the split-half pattern.
TTI::ReductionShuffle WebAssemblyTTIImpl::getPreferredExpandedReductionShuffle(
    const IntrinsicInst *II) const {
  if (II->getIntrinsicID() == Intrinsic::vector_reduce_fadd)
    return TTI::ReductionShuffle::Pairwise;

  return TTI::ReductionShuffle::SplitHalf;
}


/// Fill in the loop-unrolling preferences \p UP for loop \p L.
///
/// If the loop contains a call or invoke whose statically known callee is
/// lowered to a real call, \p UP is left untouched. Otherwise partial,
/// runtime and upper-bound unrolling are enabled with a partial threshold of
/// 30, unrolling is disabled when optimizing for size, and BEInsns is set
/// to 2.
///
/// \p SE and \p ORE are not used by this implementation.
void WebAssemblyTTIImpl::getUnrollingPreferences(
    Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP,
    OptimizationRemarkEmitter *ORE) const {
  // Scan the loop: don't unroll loops with calls. This is a standard approach
  // for most (all?) targets.
  for (BasicBlock *Block : L->blocks()) {
    for (Instruction &Inst : *Block) {
      if (!isa<CallInst>(Inst) && !isa<InvokeInst>(Inst))
        continue;

      // Calls without a statically known callee do not block unrolling here.
      const Function *Callee = cast<CallBase>(Inst).getCalledFunction();
      if (Callee && isLoweredToCall(Callee))
        return;
    }
  }

  // The chosen threshold is within the range of 'LoopMicroOpBufferSize' of
  // the various microarchitectures that use the BasicTTI implementation and
  // has been selected through heuristics across multiple cores and runtimes.
  UP.UpperBound = true;
  UP.Runtime = true;
  UP.Partial = true;
  UP.PartialThreshold = 30;

  // Avoid unrolling when optimizing for size.
  UP.OptSizeThreshold = 0;
  UP.PartialOptSizeThreshold = 0;

  // Set number of instructions optimized when "back edge"
  // becomes "fall through" to default value of 2.
  UP.BEInsns = 2;
}


/// Return true when the current subtarget reports tail-call support.
bool WebAssemblyTTIImpl::supportsTailCalls() const {
  const bool SubtargetHasTailCall = getST()->hasTailCall();
  return SubtargetHasTailCall;
}


/// Decide whether operands of \p I should be sunk next to it.
///
/// Only vector shifts are considered. When the shift amount (operand 1) is a
/// shufflevector with a zero mask whose first input is an insertelement at
/// index 0, the uses to sink are appended to \p Ops: first the shuffle's use
/// of the insertelement, then \p I's use of the shuffle.
///
/// \param I   The instruction whose operands are examined.
/// \param Ops Output list of uses to sink; only appended to when the function
///            returns true.
/// \returns true if \p Ops was populated, false otherwise.
bool WebAssemblyTTIImpl::isProfitableToSinkOperands(
    Instruction *I, SmallVectorImpl<Use *> &Ops) const {
  using namespace llvm::PatternMatch;

  if (!I->getType()->isVectorTy() || !I->isShift())
    return false;

  Value *V = I->getOperand(1);
  // We don't need to sink a constant splat. The cast result is not needed, so
  // use isa<> rather than dyn_cast<> for the type test.
  if (isa<Constant>(V))
    return false;

  if (match(V, m_Shuffle(m_InsertElt(m_Value(), m_Value(), m_ZeroInt()),
                         m_Value(), m_ZeroMask()))) {
    // Sink insert
    Ops.push_back(&cast<Instruction>(V)->getOperandUse(0));
    // Sink shuffle
    Ops.push_back(&I->getOperandUse(1));
    return true;
  }

  return false;
}

CostKind
static cl::opt< TargetTransformInfo::TargetCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(TargetTransformInfo::TCK_RecipThroughput), cl::values(clEnumValN(TargetTransformInfo::TCK_RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(TargetTransformInfo::TCK_Latency, "latency", "Instruction latency"), clEnumValN(TargetTransformInfo::TCK_CodeSize, "code-size", "Code size"), clEnumValN(TargetTransformInfo::TCK_SizeAndLatency, "size-latency", "Code size and latency")))

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

getCalledFunction
static const Function * getCalledFunction(const Value *V)
Definition: MemoryBuiltins.cpp:159

II
uint64_t IntrinsicInst * II
Definition: NVVMIntrRange.cpp:51

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

WebAssemblyTargetTransformInfo.h
This file defines a TargetTransformInfo::Concept conforming object specific to the WebAssembly target machine...

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:61

llvm::BasicTTIImplBase::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, Value *Op0, Value *Op1)
Definition: BasicTTIImpl.h:1345

llvm::BasicTTIImplBase::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Opd1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Opd2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr)
Definition: BasicTTIImpl.h:958

llvm::Function
Definition: Function.h:63

llvm::InstructionCost
Definition: InstructionCost.h:29

llvm::Instruction
Definition: Instruction.h:68

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:48

llvm::Loop
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:39

llvm::OptimizationRemarkEmitter
The optimization diagnostic interface.
Definition: OptimizationRemarkEmitter.h:32

llvm::ScalarEvolution
The main scalar evolution driver.
Definition: ScalarEvolution.h:447

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:573

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:413

llvm::TargetTransformInfoImplBase::isLoweredToCall
bool isLoweredToCall(const Function *F) const
Definition: TargetTransformInfoImpl.h:149

llvm::TargetTransformInfoImplBase::getNumberOfRegisters
unsigned getNumberOfRegisters(unsigned ClassID) const
Definition: TargetTransformInfoImpl.h:506

llvm::TargetTransformInfo::ReductionShuffle
ReductionShuffle
Definition: TargetTransformInfo.h:1788

llvm::TargetTransformInfo::ReductionShuffle::Pairwise
@ Pairwise

llvm::TargetTransformInfo::ReductionShuffle::SplitHalf
@ SplitHalf

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition: TargetTransformInfo.h:263

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition: TargetTransformInfo.h:1180

llvm::TargetTransformInfo::RGK_FixedWidthVector
@ RGK_FixedWidthVector
Definition: TargetTransformInfo.h:1180

llvm::TargetTransformInfo::RGK_ScalableVector
@ RGK_ScalableVector
Definition: TargetTransformInfo.h:1180

llvm::TargetTransformInfo::RGK_Scalar
@ RGK_Scalar
Definition: TargetTransformInfo.h:1180

llvm::TargetTransformInfo::PopcntSupportKind
PopcntSupportKind
Flags indicating the kind of support for population count.
Definition: TargetTransformInfo.h:719

llvm::TargetTransformInfo::PSK_FastHardware
@ PSK_FastHardware
Definition: TargetTransformInfo.h:719

llvm::TargetTransformInfo::TCC_Expensive
@ TCC_Expensive
The cost of a 'div' instruction on x86.
Definition: TargetTransformInfo.h:291

llvm::TargetTransformInfo::TCC_Basic
@ TCC_Basic
The cost of a typical 'add' instruction.
Definition: TargetTransformInfo.h:290

llvm::TypeSize
Definition: TypeSize.h:334

llvm::TypeSize::getFixed
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition: TypeSize.h:345

llvm::TypeSize::getScalable
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Definition: TypeSize.h:348

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::WebAssemblySubtarget::hasTailCall
bool hasTailCall() const
Definition: WebAssemblySubtarget.h:113

llvm::WebAssemblyTTIImpl::isProfitableToSinkOperands
bool isProfitableToSinkOperands(Instruction *I, SmallVectorImpl< Use * > &Ops) const
Definition: WebAssemblyTargetTransformInfo.cpp:138

llvm::WebAssemblyTTIImpl::getPreferredExpandedReductionShuffle
TTI::ReductionShuffle getPreferredExpandedReductionShuffle(const IntrinsicInst *II) const
Definition: WebAssemblyTargetTransformInfo.cpp:95

llvm::WebAssemblyTTIImpl::supportsTailCalls
bool supportsTailCalls() const
Definition: WebAssemblyTargetTransformInfo.cpp:134

llvm::WebAssemblyTTIImpl::getRegisterBitWidth
TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const
Definition: WebAssemblyTargetTransformInfo.cpp:37

llvm::WebAssemblyTTIImpl::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, Value *Op0, Value *Op1)
Definition: WebAssemblyTargetTransformInfo.cpp:82

llvm::WebAssemblyTTIImpl::getPopcntSupport
TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth) const
Definition: WebAssemblyTargetTransformInfo.cpp:21

llvm::WebAssemblyTTIImpl::getUnrollingPreferences
void getUnrollingPreferences(Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP, OptimizationRemarkEmitter *ORE) const
Definition: WebAssemblyTargetTransformInfo.cpp:107

llvm::WebAssemblyTTIImpl::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Op2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr)
Definition: WebAssemblyTargetTransformInfo.cpp:51

llvm::WebAssemblyTTIImpl::getNumberOfRegisters
unsigned getNumberOfRegisters(unsigned ClassID) const
Definition: WebAssemblyTargetTransformInfo.cpp:26

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::PatternMatch
Definition: PatternMatch.h:47

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition: PatternMatch.h:49

llvm::PatternMatch::m_ZeroInt
cst_pred_ty< is_zero_int > m_ZeroInt()
Match an integer 0 or a vector with all elements equal to 0.
Definition: PatternMatch.h:599

llvm::PatternMatch::m_Shuffle
TwoOps_match< V1_t, V2_t, Instruction::ShuffleVector > m_Shuffle(const V1_t &v1, const V2_t &v2)
Matches ShuffleVectorInst independently of mask value.
Definition: PatternMatch.h:1911

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition: PatternMatch.h:92

llvm::PatternMatch::m_InsertElt
ThreeOps_match< Val_t, Elt_t, Idx_t, Instruction::InsertElement > m_InsertElt(const Val_t &Val, const Elt_t &Elt, const Idx_t &Idx)
Matches InsertElementInst.
Definition: PatternMatch.h:1829

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition: MathExtras.h:292

llvm::Cost
InstructionCost Cost
Definition: FunctionSpecialization.h:102

llvm::VFParamKind::Vector
@ Vector

llvm::PatternMatch::m_ZeroMask
Definition: PatternMatch.h:1868

llvm::TargetTransformInfo::OperandValueInfo
Definition: TargetTransformInfo.h:1135

llvm::TargetTransformInfo::OperandValueInfo::isUniform
bool isUniform() const
Definition: TargetTransformInfo.h:1142

llvm::TargetTransformInfo::UnrollingPreferences
Parameters that control the generic loop unrolling transformation.
Definition: TargetTransformInfo.h:536

llvm::TargetTransformInfo::UnrollingPreferences::UpperBound
bool UpperBound
Allow using trip count upper bound to unroll loops.
Definition: TargetTransformInfo.h:607

llvm::TargetTransformInfo::UnrollingPreferences::PartialOptSizeThreshold
unsigned PartialOptSizeThreshold
The cost threshold for the unrolled loop when optimizing for size, like OptSizeThreshold,...
Definition: TargetTransformInfo.h:565

llvm::TargetTransformInfo::UnrollingPreferences::BEInsns
unsigned BEInsns
Definition: TargetTransformInfo.h:590

llvm::TargetTransformInfo::UnrollingPreferences::PartialThreshold
unsigned PartialThreshold
The cost threshold for the unrolled loop, like Threshold, but used for partial/runtime unrolling (set...
Definition: TargetTransformInfo.h:561

llvm::TargetTransformInfo::UnrollingPreferences::Runtime
bool Runtime
Allow runtime unrolling (unrolling of loops to expand the size of the loop body even when the number ...
Definition: TargetTransformInfo.h:597

llvm::TargetTransformInfo::UnrollingPreferences::Partial
bool Partial
Allow partial unrolling (unrolling of loops to expand the size of the loop body, not only to eliminat...
Definition: TargetTransformInfo.h:593

llvm::TargetTransformInfo::UnrollingPreferences::OptSizeThreshold
unsigned OptSizeThreshold
The cost threshold for the unrolled loop when optimizing for size (set to UINT_MAX to disable).
Definition: TargetTransformInfo.h:558