docs/doxygen/R600TargetTransformInfo_8h_source.html

//===- R600TargetTransformInfo.h - R600 specific TTI --------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

/// \file

/// This file declares a TargetTransformInfo::Concept conforming object specific to the

/// R600 target machine. It uses the target's detailed information to

/// provide more precise answers to certain TTI queries, while letting the

/// target independent and default TTI implementations handle the rest.

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H

#define LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H


#include "AMDGPUTargetTransformInfo.h"

#include "llvm/CodeGen/BasicTTIImpl.h"


namespace llvm {


// Forward declarations: this header only refers to these types through
// pointers, so their full definitions are not needed here.
class R600Subtarget;

class AMDGPUTargetLowering;


/// TargetTransformInfo implementation for the R600 target.
///
/// Derives from BasicTTIImplBase using the CRTP pattern (the class passes
/// itself as the template argument). Member functions declared without a body
/// are defined out of line.
class R600TTIImpl final : public BasicTTIImplBase<R600TTIImpl> {
  using BaseT = BasicTTIImplBase<R600TTIImpl>;
  using TTI = TargetTransformInfo;

  // The CRTP base is granted access to this class's private members.
  friend BaseT;

  const R600Subtarget *ST;         ///< Returned by getST().
  const AMDGPUTargetLowering *TLI; ///< Returned by getTLI().
  // NOTE(review): presumably the shared AMDGPU TTI that common queries are
  // delegated to -- confirm against the constructor and the .cpp definitions.
  AMDGPUTTIImpl CommonTTI;

public:
  /// Constructs the TTI implementation from target machine \p TM and
  /// function \p F.
  explicit R600TTIImpl(const AMDGPUTargetMachine *TM, const Function &F);

  /// \returns the stored R600 subtarget pointer.
  const R600Subtarget *getST() const {
    return ST;
  }

  /// \returns the stored target lowering pointer.
  const AMDGPUTargetLowering *getTLI() const {
    return TLI;
  }

  /// Loop unrolling / peeling preference hooks. \p UP and \p PP are taken by
  /// non-const reference.
  void getUnrollingPreferences(Loop *L, ScalarEvolution &SE,
                               TTI::UnrollingPreferences &UP,
                               OptimizationRemarkEmitter *ORE);
  void getPeelingPreferences(Loop *L, ScalarEvolution &SE,
                             TTI::PeelingPreferences &PP);

  /// Register count and register width queries.
  unsigned getHardwareNumberOfRegisters(bool Vec) const;
  unsigned getNumberOfRegisters(bool Vec) const;
  TypeSize getRegisterBitWidth(TTI::RegisterKind Vector) const;
  unsigned getMinVectorRegisterBitWidth() const;
  unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const;

  /// Legality queries for vectorizing a chain of memory accesses, given the
  /// chain size in bytes, its alignment and its address space.
  bool isLegalToVectorizeMemChain(unsigned ChainSizeInBytes,
                                  Align Alignment,
                                  unsigned AddrSpace) const;
  bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes,
                                   Align Alignment,
                                   unsigned AddrSpace) const;
  bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes,
                                    Align Alignment,
                                    unsigned AddrSpace) const;

  unsigned getMaxInterleaveFactor(ElementCount VF);

  /// Cost query for the instruction identified by \p Opcode; \p I is optional
  /// and defaults to nullptr.
  InstructionCost getCFInstrCost(unsigned Opcode,
                                 TTI::TargetCostKind CostKind,
                                 const Instruction *I = nullptr);

  // Keep the base class overloads of getVectorInstrCost visible; the
  // declaration below would otherwise hide them.
  using BaseT::getVectorInstrCost;
  InstructionCost getVectorInstrCost(unsigned Opcode, Type *ValTy,
                                     TTI::TargetCostKind CostKind,
                                     unsigned Index,
                                     Value *Op0, Value *Op1);
};


} // end namespace llvm


#endif // LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H

AMDGPUTargetTransformInfo.h
This file declares a TargetTransformInfo::Concept conforming object specific to the AMDGPU target machine.

BasicTTIImpl.h
This file provides a helper that implements much of the TTI interface in terms of the target-independ...

CostKind
static cl::opt< TargetTransformInfo::TargetCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(TargetTransformInfo::TCK_RecipThroughput), cl::values(clEnumValN(TargetTransformInfo::TCK_RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(TargetTransformInfo::TCK_Latency, "latency", "Instruction latency"), clEnumValN(TargetTransformInfo::TCK_CodeSize, "code-size", "Code size"), clEnumValN(TargetTransformInfo::TCK_SizeAndLatency, "size-latency", "Code size and latency")))

Index
uint32_t Index
Definition: ELFObjHandler.cpp:83

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

llvm::AMDGPUTTIImpl
Definition: AMDGPUTargetTransformInfo.h:36

llvm::AMDGPUTargetLowering
Definition: AMDGPUISelLowering.h:27

llvm::AMDGPUTargetMachine
Definition: AMDGPUTargetMachine.h:31

llvm::BasicTTIImplBase
Base class which can be used to help build a TTI implementation.
Definition: BasicTTIImpl.h:80

llvm::BasicTTIImplBase< R600TTIImpl >::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, Value *Op0, Value *Op1)
Definition: BasicTTIImpl.h:1346

llvm::ElementCount
Definition: TypeSize.h:300

llvm::Function
Definition: Function.h:63

llvm::InstructionCost
Definition: InstructionCost.h:29

llvm::Instruction
Definition: Instruction.h:68

llvm::Loop
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:39

llvm::OptimizationRemarkEmitter
The optimization diagnostic interface.
Definition: OptimizationRemarkEmitter.h:32

llvm::R600Subtarget
Definition: R600Subtarget.h:29

llvm::R600TTIImpl
Definition: R600TargetTransformInfo.h:28

llvm::R600TTIImpl::isLegalToVectorizeMemChain
bool isLegalToVectorizeMemChain(unsigned ChainSizeInBytes, Align Alignment, unsigned AddrSpace) const
Definition: R600TargetTransformInfo.cpp:64

llvm::R600TTIImpl::getPeelingPreferences
void getPeelingPreferences(Loop *L, ScalarEvolution &SE, TTI::PeelingPreferences &PP)
Definition: R600TargetTransformInfo.cpp:142

llvm::R600TTIImpl::getCFInstrCost
InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: R600TargetTransformInfo.cpp:94

llvm::R600TTIImpl::isLegalToVectorizeStoreChain
bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes, Align Alignment, unsigned AddrSpace) const
Definition: R600TargetTransformInfo.cpp:79

llvm::R600TTIImpl::getST
const R600Subtarget * getST() const
Definition: R600TargetTransformInfo.h:41

llvm::R600TTIImpl::getTLI
const AMDGPUTargetLowering * getTLI() const
Definition: R600TargetTransformInfo.h:42

llvm::R600TTIImpl::getMaxInterleaveFactor
unsigned getMaxInterleaveFactor(ElementCount VF)
Definition: R600TargetTransformInfo.cpp:85

llvm::R600TTIImpl::getUnrollingPreferences
void getUnrollingPreferences(Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP, OptimizationRemarkEmitter *ORE)
Definition: R600TargetTransformInfo.cpp:136

llvm::R600TTIImpl::getLoadStoreVecRegBitWidth
unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const
Definition: R600TargetTransformInfo.cpp:46

llvm::R600TTIImpl::getHardwareNumberOfRegisters
unsigned getHardwareNumberOfRegisters(bool Vec) const
Definition: R600TargetTransformInfo.cpp:31

llvm::R600TTIImpl::getRegisterBitWidth
TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind Vector) const
Definition: R600TargetTransformInfo.cpp:40

llvm::R600TTIImpl::getMinVectorRegisterBitWidth
unsigned getMinVectorRegisterBitWidth() const
Definition: R600TargetTransformInfo.cpp:44

llvm::R600TTIImpl::isLegalToVectorizeLoadChain
bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes, Align Alignment, unsigned AddrSpace) const
Definition: R600TargetTransformInfo.cpp:73

llvm::R600TTIImpl::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *ValTy, TTI::TargetCostKind CostKind, unsigned Index, Value *Op0, Value *Op1)
Definition: R600TargetTransformInfo.cpp:110

llvm::R600TTIImpl::getNumberOfRegisters
unsigned getNumberOfRegisters(bool Vec) const
Definition: R600TargetTransformInfo.cpp:35

llvm::ScalarEvolution
The main scalar evolution driver.
Definition: ScalarEvolution.h:447

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition: TargetTransformInfo.h:212

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition: TargetTransformInfo.h:257

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition: TargetTransformInfo.h:1169

llvm::TypeSize
Definition: TypeSize.h:334

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::VFParamKind::Vector
@ Vector

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::TargetTransformInfo::PeelingPreferences
Definition: TargetTransformInfo.h:652

llvm::TargetTransformInfo::UnrollingPreferences
Parameters that control the generic loop unrolling transformation.
Definition: TargetTransformInfo.h:530