doxygen/html/AMDGPUBaseInfo%5F8h%5Fsource.html

//===- AMDGPUBaseInfo.h - Top level definitions for AMDGPU ------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_AMDGPU_UTILS_AMDGPUBASEINFO_H

#define LLVM_LIB_TARGET_AMDGPU_UTILS_AMDGPUBASEINFO_H


#include "AMDGPUSubtarget.h"

#include "SIDefines.h"

#include "llvm/IR/CallingConv.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Module.h"

#include "llvm/Support/Alignment.h"

#include <array>

#include <functional>

#include <utility>


// Pull in OpName enum definition and getNamedOperandIdx() declaration.

#define GET_INSTRINFO_OPERAND_ENUM

#include "AMDGPUGenInstrInfo.inc"


struct amd_kernel_code_t;


namespace llvm {


struct Align;

class Argument;

class Function;

class GlobalValue;

class MCInstrInfo;

class MCRegisterClass;

class MCRegisterInfo;

class MCSubtargetInfo;

class MDNode;

class StringRef;

class Triple;

class raw_ostream;


namespace AMDGPU {


struct AMDGPUMCKernelCodeT;

struct IsaVersion;


/// Version number of each generic target family as emitted by this version of
/// LLVM.
///
/// A family's number is incremented every time a codegen breaking change
/// occurs within that generic family.
namespace GenericVersion {
// Namespace-scope constexpr objects already have internal linkage, so no
// storage-class specifier is needed.
constexpr unsigned GFX9 = 1;
constexpr unsigned GFX9_4 = 1;
constexpr unsigned GFX10_1 = 1;
constexpr unsigned GFX10_3 = 1;
constexpr unsigned GFX11 = 1;
constexpr unsigned GFX12 = 1;
} // namespace GenericVersion


/// AMDHSA code object versions; each enumerator's value equals its version
/// number.
enum {
  AMDHSA_COV4 = 4,
  AMDHSA_COV5, // 5
  AMDHSA_COV6  // 6
};


/// Floating-point type classification; see getFPDstSelType().
enum class FPType {
  None = 0,
  FP4 = 1,
  FP8 = 2
};


/// \returns True if \p STI is AMDHSA.

bool isHsaAbi(const MCSubtargetInfo &STI);


/// \returns Code object version from the IR module flag.

unsigned getAMDHSACodeObjectVersion(const Module &M);


/// \returns Code object version from ELF's e_ident[EI_ABIVERSION].

unsigned getAMDHSACodeObjectVersion(unsigned ABIVersion);


/// \returns The default HSA code object version. This should only be used when

/// we lack a more accurate CodeObjectVersion value (e.g. from the IR module

/// flag or a .amdhsa_code_object_version directive)

unsigned getDefaultAMDHSACodeObjectVersion();


/// \returns ABIVersion suitable for use in ELF's e_ident[EI_ABIVERSION]. \param

/// CodeObjectVersion is a value returned by getAMDHSACodeObjectVersion().

uint8_t getELFABIVersion(const Triple &OS, unsigned CodeObjectVersion);


/// \returns The offset of the multigrid_sync_arg argument from implicitarg_ptr
/// for code object version \p COV.
unsigned getMultigridSyncArgImplicitArgPosition(unsigned COV);

/// \returns The offset of the hostcall pointer argument from implicitarg_ptr
/// for code object version \p COV.
unsigned getHostcallImplicitArgPosition(unsigned COV);

/// NOTE(review): undocumented in the original. By analogy with the two
/// functions above this presumably returns the offset of the default queue
/// argument from implicitarg_ptr for code object version \p COV -- confirm
/// against the definition.
unsigned getDefaultQueueImplicitArgPosition(unsigned COV);

/// NOTE(review): undocumented in the original. By analogy with the functions
/// above this presumably returns the offset of the completion action argument
/// from implicitarg_ptr for code object version \p COV -- confirm against the
/// definition.
unsigned getCompletionActionImplicitArgPosition(unsigned COV);


/// Description of one GCN buffer format. Pointers to this type are returned by
/// the getGcnBufferFormatInfo() overloads declared later in this header, which
/// select an entry either by (BitsPerComp, NumComponents, NumFormat) or by
/// Format for a given subtarget.
struct GcnBufferFormatInfo {
  // Format value; this is the key of the single-argument lookup overload.
  unsigned Format;
  // Bits per component.
  unsigned BitsPerComp;
  // Number of components.
  unsigned NumComponents;
  // NOTE(review): presumably the numeric-format part of Format -- the encoding
  // is not visible in this header.
  unsigned NumFormat;
  // NOTE(review): presumably the data-format part of Format -- the encoding is
  // not visible in this header.
  unsigned DataFormat;
};


/// Per-opcode properties of an MAI instruction.
/// NOTE(review): presumably the row type of the table enabled by
/// GET_MAIInstInfoTable_DECL below and the data behind getMAIIsDGEMM() /
/// getMAIIsGFX940XDL() -- confirm against the generated tables.
struct MAIInstInfo {
  // Instruction opcode this entry describes.
  uint16_t Opcode;
  // Set for double precision GEMM operations (see getMAIIsDGEMM()).
  bool is_dgemm;
  // See getMAIIsGFX940XDL().
  bool is_gfx940_xdl;
};


/// Entry describing an F8F6F4 matrix instruction variant. Pointers to this
/// type are returned by getMFMA_F8F6F4_WithFormatArgs() and
/// getWMMA_F8F6F4_WithFormatArgs(), both of which take an F8F8Opcode plus two
/// format arguments.
struct MFMA_F8F6F4_Info {
  // Opcode of this variant.
  unsigned Opcode;
  // NOTE(review): presumably the opcode of the corresponding F8/F8 form, which
  // is what the lookup functions are keyed on -- confirm.
  unsigned F8F8Opcode;
  // Number of registers used by source A.
  uint8_t NumRegsSrcA;
  // Number of registers used by source B.
  uint8_t NumRegsSrcB;
};


/// Single-field entry holding one opcode.
/// NOTE(review): presumably the row type of the table enabled by
/// GET_isCvtScaleF32_F32F16ToF8F4Table_DECL below -- confirm.
struct CvtScaleF32_F32F16ToF8F4_Info {
  unsigned Opcode;
};


/// Groups three related opcodes.
/// NOTE(review): presumably the row type of the table enabled by
/// GET_True16D16Table_DECL below, relating a true16 opcode to its high-half
/// and low-half forms -- confirm against the generated table.
struct True16D16Info {
  unsigned T16Op;
  unsigned HiOp;
  unsigned LoOp;
};


/// Per-opcode properties of a WMMA instruction.
/// NOTE(review): presumably the row type of the table enabled by
/// GET_WMMAInstInfoTable_DECL below and the data behind getWMMAIsXDL() --
/// confirm against the generated tables.
struct WMMAInstInfo {
  // Instruction opcode this entry describes.
  uint16_t Opcode;
  // See getWMMAIsXDL().
  bool is_wmma_xdl;
};


#define GET_MIMGBaseOpcode_DECL

#define GET_MIMGDim_DECL

#define GET_MIMGEncoding_DECL

#define GET_MIMGLZMapping_DECL

#define GET_MIMGMIPMapping_DECL

#define GET_MIMGBiASMapping_DECL

#define GET_MAIInstInfoTable_DECL

#define GET_isMFMA_F8F6F4Table_DECL

#define GET_isCvtScaleF32_F32F16ToF8F4Table_DECL

#define GET_True16D16Table_DECL

#define GET_WMMAInstInfoTable_DECL

#include "AMDGPUGenSearchableTables.inc"


namespace IsaInfo {


// Fixed SGPR counts used by the IsaInfo queries.
enum {
  // The closed Vulkan driver sets 96, which limits the wave count to 8 but
  // doesn't spill SGPRs as much as when 80 is set.
  FIXED_NUM_SGPRS_FOR_INIT_BUG = 96,
  // NOTE(review): undocumented here; presumably the number of SGPRs set aside
  // for the trap handler -- confirm against the users of this constant.
  TRAP_NUM_SGPRS = 16
};


/// State of a target ID feature (xnack or sramecc) as tracked by
/// AMDGPUTargetID.
enum class TargetIDSetting {
  Unsupported = 0,
  Any = 1,
  Off = 2,
  On = 3
};


class AMDGPUTargetID {

private:

  const MCSubtargetInfo &STI;

  TargetIDSetting XnackSetting;

  TargetIDSetting SramEccSetting;


public:

  explicit AMDGPUTargetID(const MCSubtargetInfo &STI);

  ~AMDGPUTargetID() = default;


  /// \return True if the current xnack setting is not "Unsupported".


  bool isXnackSupported() const {

    return XnackSetting != TargetIDSetting::Unsupported;

  }


  /// \returns True if the current xnack setting is "On" or "Any".


  bool isXnackOnOrAny() const {

    return XnackSetting == TargetIDSetting::On ||

           XnackSetting == TargetIDSetting::Any;

  }


  /// \returns True if current xnack setting is "On" or "Off",

  /// false otherwise.


  bool isXnackOnOrOff() const {

    return getXnackSetting() == TargetIDSetting::On ||

           getXnackSetting() == TargetIDSetting::Off;

  }


  /// \returns The current xnack TargetIDSetting, possible options are

  /// "Unsupported", "Any", "Off", and "On".

  TargetIDSetting getXnackSetting() const { return XnackSetting; }


  /// Sets xnack setting to \p NewXnackSetting.


  void setXnackSetting(TargetIDSetting NewXnackSetting) {

    XnackSetting = NewXnackSetting;

  }


  /// \return True if the current sramecc setting is not "Unsupported".


  bool isSramEccSupported() const {

    return SramEccSetting != TargetIDSetting::Unsupported;

  }


  /// \returns True if the current sramecc setting is "On" or "Any".


  bool isSramEccOnOrAny() const {

    return SramEccSetting == TargetIDSetting::On ||

           SramEccSetting == TargetIDSetting::Any;

  }


  /// \returns True if current sramecc setting is "On" or "Off",

  /// false otherwise.


  bool isSramEccOnOrOff() const {

    return getSramEccSetting() == TargetIDSetting::On ||

           getSramEccSetting() == TargetIDSetting::Off;

  }


  /// \returns The current sramecc TargetIDSetting, possible options are

  /// "Unsupported", "Any", "Off", and "On".

  TargetIDSetting getSramEccSetting() const { return SramEccSetting; }


  /// Sets sramecc setting to \p NewSramEccSetting.


  void setSramEccSetting(TargetIDSetting NewSramEccSetting) {

    SramEccSetting = NewSramEccSetting;

  }


  void setTargetIDFromFeaturesString(StringRef FS);

  void setTargetIDFromTargetIDStream(StringRef TargetID);


  /// \returns String representation of an object.

  std::string toString() const;

};


/// \returns Wavefront size for given subtarget \p STI.

unsigned getWavefrontSize(const MCSubtargetInfo *STI);


/// \returns Local memory size in bytes for given subtarget \p STI.

unsigned getLocalMemorySize(const MCSubtargetInfo *STI);


/// \returns Maximum addressable local memory size in bytes for given subtarget

/// \p STI.

unsigned getAddressableLocalMemorySize(const MCSubtargetInfo *STI);


/// \returns Number of execution units per compute unit for given subtarget \p

/// STI.

unsigned getEUsPerCU(const MCSubtargetInfo *STI);


/// \returns Maximum number of work groups per compute unit for given subtarget

/// \p STI and limited by given \p FlatWorkGroupSize.

unsigned getMaxWorkGroupsPerCU(const MCSubtargetInfo *STI,

                               unsigned FlatWorkGroupSize);


/// \returns Minimum number of waves per execution unit for given subtarget \p

/// STI.

unsigned getMinWavesPerEU(const MCSubtargetInfo *STI);


/// \returns Maximum number of waves per execution unit for given subtarget \p

/// STI without any kind of limitation.

unsigned getMaxWavesPerEU(const MCSubtargetInfo *STI);


/// \returns Number of waves per execution unit required to support the given \p

/// FlatWorkGroupSize.

unsigned getWavesPerEUForWorkGroup(const MCSubtargetInfo *STI,

                                   unsigned FlatWorkGroupSize);


/// \returns Minimum flat work group size for given subtarget \p STI.

unsigned getMinFlatWorkGroupSize(const MCSubtargetInfo *STI);


/// \returns Maximum flat work group size for given subtarget \p STI.

unsigned getMaxFlatWorkGroupSize(const MCSubtargetInfo *STI);


/// \returns Number of waves per work group for given subtarget \p STI and

/// \p FlatWorkGroupSize.

unsigned getWavesPerWorkGroup(const MCSubtargetInfo *STI,

                              unsigned FlatWorkGroupSize);


/// \returns SGPR allocation granularity for given subtarget \p STI.

unsigned getSGPRAllocGranule(const MCSubtargetInfo *STI);


/// \returns SGPR encoding granularity for given subtarget \p STI.

unsigned getSGPREncodingGranule(const MCSubtargetInfo *STI);


/// \returns Total number of SGPRs for given subtarget \p STI.

unsigned getTotalNumSGPRs(const MCSubtargetInfo *STI);


/// \returns Addressable number of SGPRs for given subtarget \p STI.

unsigned getAddressableNumSGPRs(const MCSubtargetInfo *STI);


/// \returns Minimum number of SGPRs that meets the given number of waves per

/// execution unit requirement for given subtarget \p STI.

unsigned getMinNumSGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU);


/// \returns Maximum number of SGPRs that meets the given number of waves per

/// execution unit requirement for given subtarget \p STI.

unsigned getMaxNumSGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU,

                        bool Addressable);


/// \returns Number of extra SGPRs implicitly required by given subtarget \p

/// STI when the given special registers are used.

unsigned getNumExtraSGPRs(const MCSubtargetInfo *STI, bool VCCUsed,

                          bool FlatScrUsed, bool XNACKUsed);


/// \returns Number of extra SGPRs implicitly required by given subtarget \p

/// STI when the given special registers are used. XNACK is inferred from

/// \p STI.

unsigned getNumExtraSGPRs(const MCSubtargetInfo *STI, bool VCCUsed,

                          bool FlatScrUsed);


/// \returns Number of SGPR blocks needed for given subtarget \p STI when

/// \p NumSGPRs are used. \p NumSGPRs should already include any special

/// register counts.

unsigned getNumSGPRBlocks(const MCSubtargetInfo *STI, unsigned NumSGPRs);


/// \returns VGPR allocation granularity for given subtarget \p STI.

///

/// For subtargets which support it, \p EnableWavefrontSize32 should match

/// the ENABLE_WAVEFRONT_SIZE32 kernel descriptor field.

unsigned

getVGPRAllocGranule(const MCSubtargetInfo *STI, unsigned DynamicVGPRBlockSize,

                    std::optional<bool> EnableWavefrontSize32 = std::nullopt);


/// \returns VGPR encoding granularity for given subtarget \p STI.

///

/// For subtargets which support it, \p EnableWavefrontSize32 should match

/// the ENABLE_WAVEFRONT_SIZE32 kernel descriptor field.

unsigned getVGPREncodingGranule(

    const MCSubtargetInfo *STI,

    std::optional<bool> EnableWavefrontSize32 = std::nullopt);


/// For subtargets with a unified VGPR file and mixed ArchVGPR/AGPR usage,

/// returns the allocation granule for ArchVGPRs.

unsigned getArchVGPRAllocGranule();


/// \returns Total number of VGPRs for given subtarget \p STI.

unsigned getTotalNumVGPRs(const MCSubtargetInfo *STI);


/// \returns Addressable number of architectural VGPRs for a given subtarget \p

/// STI.

unsigned getAddressableNumArchVGPRs(const MCSubtargetInfo *STI);


/// \returns Addressable number of VGPRs for given subtarget \p STI.

unsigned getAddressableNumVGPRs(const MCSubtargetInfo *STI,

                                unsigned DynamicVGPRBlockSize);


/// \returns Minimum number of VGPRs that meets given number of waves per

/// execution unit requirement for given subtarget \p STI.

unsigned getMinNumVGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU,

                        unsigned DynamicVGPRBlockSize);


/// \returns Maximum number of VGPRs that meets given number of waves per

/// execution unit requirement for given subtarget \p STI.

unsigned getMaxNumVGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU,

                        unsigned DynamicVGPRBlockSize);


/// \returns Number of waves reachable for a given \p NumVGPRs usage for given

/// subtarget \p STI.

unsigned getNumWavesPerEUWithNumVGPRs(const MCSubtargetInfo *STI,

                                      unsigned NumVGPRs,

                                      unsigned DynamicVGPRBlockSize);


/// \returns Number of waves reachable for a given \p NumVGPRs usage, \p Granule

/// size, \p MaxWaves possible, and \p TotalNumVGPRs available.

unsigned getNumWavesPerEUWithNumVGPRs(unsigned NumVGPRs, unsigned Granule,

                                      unsigned MaxWaves,

                                      unsigned TotalNumVGPRs);


/// \returns Occupancy for a given \p SGPRs usage, \p MaxWaves possible, and \p

/// Gen.

unsigned getOccupancyWithNumSGPRs(unsigned SGPRs, unsigned MaxWaves,

                                  AMDGPUSubtarget::Generation Gen);


/// \returns Number of VGPR blocks needed for given subtarget \p STI when

/// \p NumVGPRs are used. We actually return the number of blocks -1, since

/// that's what we encode.

///

/// For subtargets which support it, \p EnableWavefrontSize32 should match the

/// ENABLE_WAVEFRONT_SIZE32 kernel descriptor field.

unsigned getEncodedNumVGPRBlocks(

    const MCSubtargetInfo *STI, unsigned NumVGPRs,

    std::optional<bool> EnableWavefrontSize32 = std::nullopt);


/// \returns Number of VGPR blocks that need to be allocated for the given

/// subtarget \p STI when \p NumVGPRs are used.

unsigned getAllocatedNumVGPRBlocks(

    const MCSubtargetInfo *STI, unsigned NumVGPRs,

    unsigned DynamicVGPRBlockSize,

    std::optional<bool> EnableWavefrontSize32 = std::nullopt);


} // end namespace IsaInfo


// Describes one bit-field of an encoded value. The field occupies bits
// [LowBit, HighBit] (both inclusive) and D is its default value.
template <unsigned HighBit, unsigned LowBit, unsigned D = 0>
struct EncodingField {
  static_assert(LowBit <= HighBit, "Invalid bit range!");

  using ValueType = unsigned;

  // Position of the least significant bit of the field.
  static constexpr unsigned Offset = LowBit;
  // Number of bits the field occupies.
  static constexpr unsigned Width = (HighBit - LowBit) + 1;
  static constexpr ValueType Default = D;

  ValueType Value;

  // Intentionally implicit so plain values can be passed where a field is
  // expected (see EncodingFields::encode).
  constexpr EncodingField(ValueType V) : Value(V) {}

  // The stored value widened to the encoded type; no shifting is applied here.
  constexpr uint64_t encode() const { return static_cast<uint64_t>(Value); }

  // Converts already-extracted field bits back to the field's value type.
  static ValueType decode(uint64_t Encoded) {
    return static_cast<ValueType>(Encoded);
  }
};

// A one-bit field located at position Bit.
template <unsigned Bit, unsigned D = 0>
using EncodingBit = EncodingField<Bit, Bit, D>;

// Encodes and decodes several fields at once.
template <typename... Fields> struct EncodingFields {
  // Shifts every field value to its offset and ORs the results together.
  // Values are not masked to the field width.
  static constexpr uint64_t encode(Fields... Values) {
    return (... | (Values.encode() << Fields::Offset));
  }

  // Extracts each field from Encoded by shifting it down to bit 0 and masking
  // it to the field's width.
  static std::tuple<typename Fields::ValueType...> decode(uint64_t Encoded) {
    return {Fields::decode(maxUIntN(Fields::Width) &
                           (Encoded >> Fields::Offset))...};
  }
};


/// \returns True if getNamedOperandIdx() finds operand \p NamedIdx for
/// \p Opcode, i.e. it does not report -1.
LLVM_READONLY
inline bool hasNamedOperand(uint64_t Opcode, OpName NamedIdx) {
  const auto OperandIdx = getNamedOperandIdx(Opcode, NamedIdx);
  return !(OperandIdx == -1);
}


LLVM_READONLY

int getSOPPWithRelaxation(uint16_t Opcode);


/// Properties of one MIMG base opcode. Pointers to this type are returned by
/// getMIMGBaseOpcode() (looked up by instruction opcode) and
/// getMIMGBaseOpcodeInfo() (looked up by base opcode).
/// NOTE(review): the meaning of the individual flags is defined by the table
/// source, which is not visible in this header.
struct MIMGBaseOpcodeInfo {
  // The base opcode this entry describes.
  MIMGBaseOpcode BaseOpcode;
  bool Store;
  bool Atomic;
  bool AtomicX2;
  bool Sampler;
  bool Gather4;

  uint8_t NumExtraArgs;
  bool Gradients;
  bool G16;
  bool Coordinates;
  bool LodOrClampOrMip;
  bool HasD16;
  bool MSAA;
  bool BVH;
  bool A16;
  bool NoReturn;
  bool PointSampleAccel;
};


LLVM_READONLY

const MIMGBaseOpcodeInfo *getMIMGBaseOpcode(unsigned Opc);


LLVM_READONLY

const MIMGBaseOpcodeInfo *getMIMGBaseOpcodeInfo(unsigned BaseOpcode);


/// Properties of one MIMG dimension. Pointers to this type are returned by
/// getMIMGDimInfo(), getMIMGDimInfoByEncoding() and
/// getMIMGDimInfoByAsmSuffix(), which look an entry up by dimension enum,
/// encoding and assembler suffix respectively.
struct MIMGDimInfo {
  // The dimension this entry describes.
  MIMGDim Dim;
  // Number of coordinates.
  uint8_t NumCoords;
  // Number of gradients.
  uint8_t NumGradients;
  bool MSAA;
  // NOTE(review): presumably "is array" -- confirm against the table source.
  bool DA;
  // Encoded value of the dimension (key of getMIMGDimInfoByEncoding()).
  uint8_t Encoding;
  // Assembler suffix (key of getMIMGDimInfoByAsmSuffix()).
  const char *AsmSuffix;
};


LLVM_READONLY

const MIMGDimInfo *getMIMGDimInfo(unsigned DimEnum);


LLVM_READONLY

const MIMGDimInfo *getMIMGDimInfoByEncoding(uint8_t DimEnc);


LLVM_READONLY

const MIMGDimInfo *getMIMGDimInfoByAsmSuffix(StringRef AsmSuffix);


// Each of the following structs pairs two MIMG base opcodes. The matching
// getMIMG*MappingInfo() lookup declared in this header takes a parameter named
// after the first field of the struct.

/// Pairs base opcode L with base opcode LZ; see getMIMGLZMappingInfo().
struct MIMGLZMappingInfo {
  MIMGBaseOpcode L;
  MIMGBaseOpcode LZ;
};

/// Pairs base opcode MIP with base opcode NONMIP; see
/// getMIMGMIPMappingInfo().
struct MIMGMIPMappingInfo {
  MIMGBaseOpcode MIP;
  MIMGBaseOpcode NONMIP;
};

/// Pairs base opcode Bias with base opcode NoBias; see
/// getMIMGBiasMappingInfo().
struct MIMGBiasMappingInfo {
  MIMGBaseOpcode Bias;
  MIMGBaseOpcode NoBias;
};

/// Pairs base opcode Offset with base opcode NoOffset; see
/// getMIMGOffsetMappingInfo().
struct MIMGOffsetMappingInfo {
  MIMGBaseOpcode Offset;
  MIMGBaseOpcode NoOffset;
};

/// Pairs base opcode G with base opcode G16; see getMIMGG16MappingInfo().
struct MIMGG16MappingInfo {
  MIMGBaseOpcode G;
  MIMGBaseOpcode G16;
};


LLVM_READONLY

const MIMGLZMappingInfo *getMIMGLZMappingInfo(unsigned L);


/// Pairs the 2-address and 3-address opcodes of a WMMA instruction.
/// NOTE(review): presumably the data behind mapWMMA2AddrTo3AddrOpcode() and
/// mapWMMA3AddrTo2AddrOpcode() -- confirm against their definitions.
struct WMMAOpcodeMappingInfo {
  unsigned Opcode2Addr;
  unsigned Opcode3Addr;
};


LLVM_READONLY

const MIMGMIPMappingInfo *getMIMGMIPMappingInfo(unsigned MIP);


LLVM_READONLY

const MIMGBiasMappingInfo *getMIMGBiasMappingInfo(unsigned Bias);


LLVM_READONLY

const MIMGOffsetMappingInfo *getMIMGOffsetMappingInfo(unsigned Offset);


LLVM_READONLY

const MIMGG16MappingInfo *getMIMGG16MappingInfo(unsigned G);


LLVM_READONLY

int getMIMGOpcode(unsigned BaseOpcode, unsigned MIMGEncoding,

                  unsigned VDataDwords, unsigned VAddrDwords);


LLVM_READONLY

int getMaskedMIMGOp(unsigned Opc, unsigned NewChannels);


LLVM_READONLY

unsigned getAddrSizeMIMGOp(const MIMGBaseOpcodeInfo *BaseOpcode,

                           const MIMGDimInfo *Dim, bool IsA16,

                           bool IsG16Supported);


/// Properties of one MIMG instruction; a pointer to this type is returned by
/// getMIMGInfo(). BaseOpcode, MIMGEncoding, VDataDwords and VAddrDwords carry
/// the same names as the parameters of getMIMGOpcode().
struct MIMGInfo {
  // Instruction opcode this entry describes.
  uint16_t Opcode;
  // Base opcode of the instruction.
  uint16_t BaseOpcode;
  // MIMG encoding of the instruction.
  uint8_t MIMGEncoding;
  // Size of vdata in dwords.
  uint8_t VDataDwords;
  // Size of vaddr in dwords.
  uint8_t VAddrDwords;
  // Number of vaddr operands.
  uint8_t VAddrOperands;
};


LLVM_READONLY

const MIMGInfo *getMIMGInfo(unsigned Opc);


LLVM_READONLY

int getMTBUFBaseOpcode(unsigned Opc);


LLVM_READONLY

int getMTBUFOpcode(unsigned BaseOpc, unsigned Elements);


LLVM_READONLY

int getMTBUFElements(unsigned Opc);


LLVM_READONLY

bool getMTBUFHasVAddr(unsigned Opc);


LLVM_READONLY

bool getMTBUFHasSrsrc(unsigned Opc);


LLVM_READONLY

bool getMTBUFHasSoffset(unsigned Opc);


LLVM_READONLY

int getMUBUFBaseOpcode(unsigned Opc);


LLVM_READONLY

int getMUBUFOpcode(unsigned BaseOpc, unsigned Elements);


LLVM_READONLY

int getMUBUFElements(unsigned Opc);


LLVM_READONLY

bool getMUBUFHasVAddr(unsigned Opc);


LLVM_READONLY

bool getMUBUFHasSrsrc(unsigned Opc);


LLVM_READONLY

bool getMUBUFHasSoffset(unsigned Opc);


LLVM_READONLY

bool getMUBUFIsBufferInv(unsigned Opc);


LLVM_READONLY

bool getMUBUFTfe(unsigned Opc);


LLVM_READONLY

bool getSMEMIsBuffer(unsigned Opc);


LLVM_READONLY

bool getVOP1IsSingle(unsigned Opc);


LLVM_READONLY

bool getVOP2IsSingle(unsigned Opc);


LLVM_READONLY

bool getVOP3IsSingle(unsigned Opc);


LLVM_READONLY

bool isVOPC64DPP(unsigned Opc);


LLVM_READONLY

bool isVOPCAsmOnly(unsigned Opc);


/// Returns true if MAI operation is a double precision GEMM.

LLVM_READONLY

bool getMAIIsDGEMM(unsigned Opc);


LLVM_READONLY

bool getMAIIsGFX940XDL(unsigned Opc);


LLVM_READONLY

bool getWMMAIsXDL(unsigned Opc);


// Get an equivalent BitOp3 for a binary logical \p Opc.

// \returns BitOp3 modifier for the logical operation or zero.

// Used in VOPD3 conversion.

unsigned getBitOp2(unsigned Opc);


/// Result type of getCanBeVOPD().
/// NOTE(review): presumably X / Y tell whether the queried opcode can be used
/// as the X / Y component of a VOPD instruction -- confirm against the
/// definition of getCanBeVOPD().
struct CanBeVOPD {
  bool X;
  bool Y;
};


/// \returns SIEncodingFamily used for VOPD encoding on a \p ST.

LLVM_READONLY

unsigned getVOPDEncodingFamily(const MCSubtargetInfo &ST);


LLVM_READONLY

CanBeVOPD getCanBeVOPD(unsigned Opc, unsigned EncodingFamily, bool VOPD3);


LLVM_READNONE

uint8_t mfmaScaleF8F6F4FormatToNumRegs(unsigned EncodingVal);


LLVM_READONLY

const MFMA_F8F6F4_Info *getMFMA_F8F6F4_WithFormatArgs(unsigned CBSZ,

                                                      unsigned BLGP,

                                                      unsigned F8F8Opcode);


LLVM_READNONE

uint8_t wmmaScaleF8F6F4FormatToNumRegs(unsigned Fmt);


LLVM_READONLY

const MFMA_F8F6F4_Info *getWMMA_F8F6F4_WithFormatArgs(unsigned FmtA,

                                                      unsigned FmtB,

                                                      unsigned F8F8Opcode);


LLVM_READONLY

const GcnBufferFormatInfo *getGcnBufferFormatInfo(uint8_t BitsPerComp,

                                                  uint8_t NumComponents,

                                                  uint8_t NumFormat,

                                                  const MCSubtargetInfo &STI);

LLVM_READONLY

const GcnBufferFormatInfo *getGcnBufferFormatInfo(uint8_t Format,

                                                  const MCSubtargetInfo &STI);


LLVM_READONLY

int getMCOpcode(uint16_t Opcode, unsigned Gen);


LLVM_READONLY

unsigned getVOPDOpcode(unsigned Opc, bool VOPD3);


LLVM_READONLY

int getVOPDFull(unsigned OpX, unsigned OpY, unsigned EncodingFamily,

                bool VOPD3);


LLVM_READONLY

bool isVOPD(unsigned Opc);


LLVM_READNONE

bool isMAC(unsigned Opc);


LLVM_READNONE

bool isPermlane16(unsigned Opc);


LLVM_READNONE

bool isGenericAtomic(unsigned Opc);


LLVM_READNONE

bool isCvt_F32_Fp8_Bf8_e64(unsigned Opc);


namespace VOPD {


// Operand indices within a single VOPD component, together with the operand
// counts derived from them.
enum Component : unsigned {
  // Component operand indices.
  DST = 0,
  SRC0 = 1,
  SRC1 = 2,
  SRC2 = 3,

  // Operand counts.
  DST_NUM = 1,
  MAX_SRC_NUM = 3,
  MAX_OPR_NUM = DST_NUM + MAX_SRC_NUM
};


// LSB mask for VGPR banks per VOPD component operand.
// 4 banks result in a mask 3, setting 2 lower bits.
// Each table has four entries; the VOPD and VOPD3 tables differ only in the
// last one (1 versus 3).
// NOTE(review): presumably indexed by Component (DST, SRC0, SRC1, SRC2) --
// confirm against the users of these tables.
constexpr unsigned VOPD_VGPR_BANK_MASKS[] = {1, 3, 3, 1};
constexpr unsigned VOPD3_VGPR_BANK_MASKS[] = {1, 3, 3, 3};


// Index of a component within a VOPD instruction.
enum ComponentIndex : unsigned {
  X, // 0
  Y  // 1
};

// All component indices, in order, and how many of them there are.
constexpr unsigned COMPONENTS[] = {X, Y};
constexpr unsigned COMPONENTS_NUM = 2;


// Properties of VOPD components.
//
// A default-constructed object describes "no component": zero source operands,
// no mandatory literal, no tied src2, no VOPD3 modifiers, opcode 0.
class ComponentProps {
private:
  unsigned SrcOperandsNum = 0;
  // Component operand index of the mandatory literal; ~0u means "none".
  unsigned MandatoryLiteralIdx = ~0u;
  bool HasSrc2Acc = false;
  unsigned NumVOPD3Mods = 0;
  unsigned Opcode = 0;
  bool IsVOP3 = false;

public:
  ComponentProps() = default;
  ComponentProps(const MCInstrDesc &OpDesc, bool VOP3Layout = false);

  // Return the total number of src operands this component has.
  unsigned getCompSrcOperandsNum() const { return SrcOperandsNum; }

  // Return the number of src operands of this component visible to the parser.
  // A tied src2 accumulator is counted in the total but is not parsed.
  unsigned getCompParsedSrcOperandsNum() const {
    return SrcOperandsNum - HasSrc2Acc;
  }

  // Return true iff this component has a mandatory literal.
  bool hasMandatoryLiteral() const { return MandatoryLiteralIdx != ~0u; }

  // If this component has a mandatory literal, return component operand
  // index of this literal (i.e. either Component::SRC1 or Component::SRC2).
  // Must only be called when hasMandatoryLiteral() is true.
  unsigned getMandatoryLiteralCompOperandIndex() const {
    assert(hasMandatoryLiteral());
    return MandatoryLiteralIdx;
  }

  // Return true iff this component has operand
  // with component index CompSrcIdx and this operand may be a register.
  bool hasRegSrcOperand(unsigned CompSrcIdx) const {
    assert(CompSrcIdx < Component::MAX_SRC_NUM);
    return SrcOperandsNum > CompSrcIdx && !hasMandatoryLiteralAt(CompSrcIdx);
  }

  // Return true iff this component has tied src2.
  bool hasSrc2Acc() const { return HasSrc2Acc; }

  // Return a number of source modifiers if instruction is used in VOPD3.
  unsigned getCompVOPD3ModsNum() const { return NumVOPD3Mods; }

  // Return opcode of the component.
  unsigned getOpcode() const { return Opcode; }

  // Return true iff the component opcode is in VOP3 encoding.
  // This is a predicate over a bool member, so it returns bool.
  bool isVOP3() const { return IsVOP3; }

  // Return index of BitOp3 operand or -1.
  int getBitOp3OperandIdx() const;

private:
  // Return true iff the mandatory literal is the src operand CompSrcIdx.
  // MandatoryLiteralIdx is a component operand index, so the src index is
  // shifted past the dst operand before comparing.
  bool hasMandatoryLiteralAt(unsigned CompSrcIdx) const {
    assert(CompSrcIdx < Component::MAX_SRC_NUM);
    return MandatoryLiteralIdx == Component::DST_NUM + CompSrcIdx;
  }
};


// How an instruction takes part in VOPD.
enum ComponentKind : unsigned {
  // A single VOP1 or VOP2 instruction which may be used in VOPD.
  SINGLE,
  // A VOPD instruction, X component.
  COMPONENT_X,
  // A VOPD instruction, Y component.
  COMPONENT_Y,
  // Largest valid kind.
  MAX = COMPONENT_Y
};


// Maps VOPD component operand indices to operand positions in a
// MachineInstr/MCInst or in the parsed operands array.
//
// Three kinds of indices are involved:
// - VOPD component operand indices (Component::DST, Component::SRC0, etc.);
// - MC operand indices (they refer to operands in a MachineInstr/MCInst);
// - parsed operand indices (they refer to operands in the parsed operands
//   array).
//
// The mapping is trivial for SINGLE components. COMPONENT_X and COMPONENT_Y
// are more involved because both share one MachineInstr/MCInst and one parsed
// operands array. As an example, this is the component operand to parsed
// operand mapping for
//
//   v_dual_add_f32 v255, v4, v5 :: v_dual_mov_b32 v6, v1
//
//                          PARSED        COMPONENT         PARSED
// COMPONENT               OPERANDS     OPERAND INDEX    OPERAND INDEX
// -------------------------------------------------------------------
//                     "v_dual_add_f32"                        0
// v_dual_add_f32            v255          0 (DST)    -->      1
//                           v4            1 (SRC0)   -->      2
//                           v5            2 (SRC1)   -->      3
//                          "::"                               4
//                     "v_dual_mov_b32"                        5
// v_dual_mov_b32            v6            0 (DST)    -->      6
//                           v1            1 (SRC0)   -->      7
// -------------------------------------------------------------------
//
class ComponentLayout {
  // MachineInstr/MCInst operand order.
  //   Regular instruction: dst, src0 [, other src operands]
  //   VOPD instruction:    dstX, dstY, src0X [, other OpX operands],
  //                        src0Y [, other OpY operands]
  // Dst operand index for each ComponentKind.
  static constexpr unsigned MC_DST_IDX[] = {0, 0, 1};

  // MC index of a src operand in a SINGLE instruction layout, looked up as
  // SINGLE_MC_SRC_IDX[VOPD3ModsNum][SrcNo]. VOPD3 instructions may have 2 or
  // 3 source modifiers; the src2 modifier is not used if there is a tied
  // accumulator. Add 1 for COMPONENT_X or COMPONENT_Y, and for the second
  // component additionally add OpX.MCSrcNum + OpX.VOPD3ModsNum.
  // VOPD1/VOPD2 use the row for zero modifiers.
  static constexpr unsigned SINGLE_MC_SRC_IDX[4][3] = {
      {1, 2, 3},
      {2, 3, 4},
      {2, 4, 5},
      {2, 4, 6},
  };

  // Parsed operand order.
  //   Regular instruction: Mnemo dst src0 [vsrc1 ...]
  //   VOPD instruction:
  //     OpXMnemo dstX src0X [vsrc1X|imm vsrc1X|vsrc1X imm] '::'
  //     OpYMnemo dstY src0Y [vsrc1Y|imm vsrc1Y|vsrc1Y imm]
  // Dst and first-src operand index for each ComponentKind.
  static constexpr unsigned PARSED_DST_IDX[] = {
      1, 1, 4 /* + OpX.ParsedSrcNum */};
  static constexpr unsigned FIRST_PARSED_SRC_IDX[] = {
      2, 2, 5 /* + OpX.ParsedSrcNum */};

  const ComponentKind Kind;
  // Properties of the preceding component; default (empty) properties unless
  // this is COMPONENT_Y.
  const ComponentProps PrevComp;
  const unsigned VOPD3ModsNum;
  const int BitOp3Idx; // Index of bitop3 operand or -1

public:
  // Create layout for COMPONENT_X or SINGLE component. There is no preceding
  // component, so PrevComp holds default properties.
  ComponentLayout(ComponentKind Kind, unsigned VOPD3ModsNum, int BitOp3Idx)
      : Kind(Kind), PrevComp(), VOPD3ModsNum(VOPD3ModsNum),
        BitOp3Idx(BitOp3Idx) {
    assert(Kind == ComponentKind::COMPONENT_X || Kind == ComponentKind::SINGLE);
  }

  // Create layout for COMPONENT_Y which depends on COMPONENT_X layout.
  ComponentLayout(const ComponentProps &OpXProps, unsigned VOPD3ModsNum,
                  int BitOp3Idx)
      : Kind(ComponentKind::COMPONENT_Y), PrevComp(OpXProps),
        VOPD3ModsNum(VOPD3ModsNum), BitOp3Idx(BitOp3Idx) {}

  // Return the index of dst operand in MCInst operands.
  unsigned getIndexOfDstInMCOperands() const { return MC_DST_IDX[Kind]; }

  // Return the index of the specified src operand in MCInst operands.
  unsigned getIndexOfSrcInMCOperands(unsigned CompSrcIdx, bool VOPD3) const {
    assert(CompSrcIdx < Component::MAX_SRC_NUM);

    const bool IsSingle = Kind == SINGLE;

    // In a SINGLE instruction that has a bitop3 operand, that operand stands
    // in for src2.
    if (IsSingle && CompSrcIdx == 2 && BitOp3Idx != -1)
      return BitOp3Idx;

    // A VOPD instruction lists dstY before all sources, which shifts every
    // source by one relative to the SINGLE layout.
    const unsigned DstYShift = IsSingle ? 0 : 1;
    // Modifiers are only accounted for in the VOPD3 layout.
    const unsigned ModsRow = VOPD3 ? VOPD3ModsNum : 0;
    const unsigned PrevMods = VOPD3 ? PrevComp.getCompVOPD3ModsNum() : 0;

    return SINGLE_MC_SRC_IDX[ModsRow][CompSrcIdx] +
           PrevComp.getCompSrcOperandsNum() + PrevMods + DstYShift;
  }

  // Return the index of dst operand in the parsed operands array.
  unsigned getIndexOfDstInParsedOperands() const {
    return PrevComp.getCompParsedSrcOperandsNum() + PARSED_DST_IDX[Kind];
  }

  // Return the index of the specified src operand in the parsed operands array.
  unsigned getIndexOfSrcInParsedOperands(unsigned CompSrcIdx) const {
    assert(CompSrcIdx < Component::MAX_SRC_NUM);
    const unsigned FirstSrcIdx =
        PrevComp.getCompParsedSrcOperandsNum() + FIRST_PARSED_SRC_IDX[Kind];
    return FirstSrcIdx + CompSrcIdx;
  }
};


// Combines the properties and the operand layout of one VOPD component.
//
// ComponentProps is the first base, so it is fully constructed before its
// getters are evaluated to initialize ComponentLayout.
class ComponentInfo : public ComponentProps, public ComponentLayout {
public:
  // Build the info of a SINGLE (default) or COMPONENT_X component from its
  // instruction descriptor.
  ComponentInfo(const MCInstrDesc &OpDesc,
                ComponentKind Kind = ComponentKind::SINGLE,
                bool VOP3Layout = false)
      : ComponentProps{OpDesc, VOP3Layout},
        ComponentLayout{Kind, getCompVOPD3ModsNum(), getBitOp3OperandIdx()} {}

  // Build the info of a COMPONENT_Y component; its layout depends on the
  // properties of COMPONENT_X passed as OpXProps.
  ComponentInfo(const MCInstrDesc &OpDesc, const ComponentProps &OpXProps,
                bool VOP3Layout = false)
      : ComponentProps{OpDesc, VOP3Layout},
        ComponentLayout{OpXProps, getCompVOPD3ModsNum(),
                        getBitOp3OperandIdx()} {}

  // Translate a component operand index into a parsed operand index.
  // Return 0 if the specified operand does not exist.
  unsigned getIndexInParsedOperands(unsigned CompOprIdx) const;
};


// Properties of VOPD instructions: the ComponentInfo of the X and Y
// components, addressable through operator[].
class InstInfo {
private:
  const ComponentInfo CompInfo[COMPONENTS_NUM];

public:
  using RegIndices = std::array<MCRegister, Component::MAX_OPR_NUM>;

  // Build both components straight from instruction descriptors. Each
  // descriptor is converted through ComponentInfo's (OpDesc, Kind, VOP3Layout)
  // constructor with its default arguments, i.e. as a SINGLE component.
  InstInfo(const MCInstrDesc &OpX, const MCInstrDesc &OpY)
      : CompInfo{OpX, OpY} {}

  // Build from already constructed component infos.
  InstInfo(const ComponentInfo &OprInfoX, const ComponentInfo &OprInfoY)
      : CompInfo{OprInfoX, OprInfoY} {}

  // Return the info of component ComponentIdx, which must be less than
  // COMPONENTS_NUM.
  const ComponentInfo &operator[](size_t ComponentIdx) const {
    assert(ComponentIdx < COMPONENTS_NUM);
    return CompInfo[ComponentIdx];
  }

  // Check VOPD operands constraints.
  // Return true iff getInvalidCompOperandIndex() reports an invalid operand
  // for the same arguments.
  // GetRegIdx(Component, MCOperandIdx) must return a VGPR register index
  // for the specified component and MC operand. The callback must return 0
  // if the operand is not a register or not a VGPR.
  // If \p SkipSrc is set to true then constraints for source operands are not
  // checked except for being from the same halves of VGPR file on gfx1250.
  // If \p AllowSameVGPR is set then same VGPRs are allowed for X and Y sources
  // even though it violates requirement to be from different banks.
  // If \p VOPD3 is set to true both dst registers allowed to be either odd
  // or even and instruction may have real src2 as opposed to tied accumulator.
  bool
  hasInvalidOperand(std::function<MCRegister(unsigned, unsigned)> GetRegIdx,
                    const MCRegisterInfo &MRI, bool SkipSrc = false,
                    bool AllowSameVGPR = false, bool VOPD3 = false) const {
    // GetRegIdx is this call's own copy and is not used again, so it is moved
    // into the callee's by-value parameter instead of being copied once more.
    return getInvalidCompOperandIndex(std::move(GetRegIdx), MRI, SkipSrc,
                                      AllowSameVGPR, VOPD3)
        .has_value();
  }

  // Check VOPD operands constraints.
  // Return the index of an invalid component operand, if any.
  // If \p SkipSrc is set to true then constraints for source operands are not
  // checked except for being from the same halves of VGPR file on gfx1250.
  // If \p AllowSameVGPR is set then same VGPRs are allowed for X and Y sources
  // even though it violates requirement to be from different banks.
  // If \p VOPD3 is set to true both dst registers allowed to be either odd
  // or even and instruction may have real src2 as opposed to tied accumulator.
  std::optional<unsigned> getInvalidCompOperandIndex(
      std::function<MCRegister(unsigned, unsigned)> GetRegIdx,
      const MCRegisterInfo &MRI, bool SkipSrc = false,
      bool AllowSameVGPR = false, bool VOPD3 = false) const;

private:
  // Defined out of line.
  // NOTE(review): presumably collects, via GetRegIdx, the registers of all
  // operands of component ComponentIdx -- confirm against the definition.
  RegIndices
  getRegIndices(unsigned ComponentIdx,
                std::function<MCRegister(unsigned, unsigned)> GetRegIdx,
                bool VOPD3) const;
};


} // namespace VOPD


LLVM_READONLY

std::pair<unsigned, unsigned> getVOPDComponents(unsigned VOPDOpcode);


LLVM_READONLY

// Get properties of 2 single VOP1/VOP2 instructions

// used as components to create a VOPD instruction.

VOPD::InstInfo getVOPDInstInfo(const MCInstrDesc &OpX, const MCInstrDesc &OpY);


LLVM_READONLY

// Get properties of VOPD X and Y components.

VOPD::InstInfo getVOPDInstInfo(unsigned VOPDOpcode,

                               const MCInstrInfo *InstrInfo);


LLVM_READONLY

bool isAsyncStore(unsigned Opc);

LLVM_READONLY

bool isTensorStore(unsigned Opc);

LLVM_READONLY

unsigned getTemporalHintType(const MCInstrDesc TID);


LLVM_READONLY

bool isTrue16Inst(unsigned Opc);


LLVM_READONLY

FPType getFPDstSelType(unsigned Opc);


LLVM_READONLY

bool isInvalidSingleUseConsumerInst(unsigned Opc);


LLVM_READONLY

bool isInvalidSingleUseProducerInst(unsigned Opc);


bool isDPMACCInstruction(unsigned Opc);


LLVM_READONLY

unsigned mapWMMA2AddrTo3AddrOpcode(unsigned Opc);


LLVM_READONLY

unsigned mapWMMA3AddrTo2AddrOpcode(unsigned Opc);


void initDefaultAMDKernelCodeT(AMDGPUMCKernelCodeT &Header,

                               const MCSubtargetInfo *STI);


bool isGroupSegment(const GlobalValue *GV);

bool isGlobalSegment(const GlobalValue *GV);

bool isReadOnlySegment(const GlobalValue *GV);


/// \returns True if constants should be emitted to .text section for given

/// target triple \p TT, false otherwise.

bool shouldEmitConstantsToTextSection(const Triple &TT);


/// Returns a valid charcode or 0 in the first entry if this is a valid physical

/// register name. Followed by the start register number, and the register

/// width. Does not validate the number of registers exists in the class. Unlike

/// parseAsmConstraintPhysReg, this does not expect the name to be wrapped in

/// "{}".

std::tuple<char, unsigned, unsigned> parseAsmPhysRegName(StringRef TupleString);


/// Returns a valid charcode or 0 in the first entry if this is a valid physical

/// register constraint. Followed by the start register number, and the register

/// width. Does not validate the number of registers exists in the class.

std::tuple<char, unsigned, unsigned>

parseAsmConstraintPhysReg(StringRef Constraint);


/// \returns Integer value requested using \p F's \p Name attribute.

///

/// \returns \p Default if attribute is not present.

///

/// \returns \p Default and emits error if requested value cannot be converted

/// to integer.

int getIntegerAttribute(const Function &F, StringRef Name, int Default);


/// \returns A pair of integer values requested using \p F's \p Name attribute

/// in "first[,second]" format ("second" is optional unless \p OnlyFirstRequired

/// is false).

///

/// \returns \p Default if attribute is not present.

///

/// \returns \p Default and emits error if one of the requested values cannot be

/// converted to integer, or \p OnlyFirstRequired is false and "second" value is

/// not present.

std::pair<unsigned, unsigned>

getIntegerPairAttribute(const Function &F, StringRef Name,

                        std::pair<unsigned, unsigned> Default,

                        bool OnlyFirstRequired = false);


/// \returns A pair of integer values requested using \p F's \p Name attribute

/// in "first[,second]" format ("second" is optional unless \p OnlyFirstRequired

/// is false).

///

/// \returns \p std::nullopt if attribute is not present.

///

/// \returns \p std::nullopt and emits error if one of the requested values

/// cannot be converted to integer, or \p OnlyFirstRequired is false and

/// "second" value is not present.

std::optional<std::pair<unsigned, std::optional<unsigned>>>

getIntegerPairAttribute(const Function &F, StringRef Name,

                        bool OnlyFirstRequired = false);


/// \returns A vector of integer values requested using \p F's \p Name

/// attribute.

/// \returns A vector of size \p Size, with all elements set to \p DefaultVal,

/// if any error occurs. The corresponding error will also be emitted.

SmallVector<unsigned> getIntegerVecAttribute(const Function &F, StringRef Name,

                                             unsigned Size,

                                             unsigned DefaultVal);

/// Similar to the function above, but returns std::nullopt if any error occurs.

std::optional<SmallVector<unsigned>>

getIntegerVecAttribute(const Function &F, StringRef Name, unsigned Size);


/// Checks if \p Val is inside \p MD, a !range-like metadata.

bool hasValueInRangeLikeMetadata(const MDNode &MD, int64_t Val);


/// Holds the counter values an s_waitcnt instruction should wait for.
///
/// Every counter defaults to ~0u, which the has*() queries below treat as
/// "no wait requested". Large values (including the maximum possible integer)
/// can be used to represent "don't care" waits.
struct Waitcnt {
  unsigned LoadCnt = ~0u;   // Corresponds to Vmcnt prior to gfx12.
  unsigned ExpCnt = ~0u;
  unsigned DsCnt = ~0u;     // Corresponds to LGKMcnt prior to gfx12.
  unsigned StoreCnt = ~0u;  // Corresponds to VScnt on gfx10/gfx11.
  unsigned SampleCnt = ~0u; // gfx12+ only.
  unsigned BvhCnt = ~0u;    // gfx12+ only.
  unsigned KmCnt = ~0u;     // gfx12+ only.
  unsigned XCnt = ~0u;      // gfx1250.
  unsigned VaVdst = ~0u;    // gfx12+ expert scheduling mode only.
  unsigned VmVsrc = ~0u;    // gfx12+ expert scheduling mode only.

  /// Creates a Waitcnt with every counter left at ~0u.
  Waitcnt() = default;

  /// Pre-gfx12 constructor: sets only the four legacy counters; the remaining
  /// fields keep their ~0u defaults.
  Waitcnt(unsigned VmCnt, unsigned ExpCnt, unsigned LgkmCnt, unsigned VsCnt)
      : LoadCnt(VmCnt), ExpCnt(ExpCnt), DsCnt(LgkmCnt), StoreCnt(VsCnt) {}

  /// gfx12+ constructor: sets every counter explicitly.
  Waitcnt(unsigned LoadCnt, unsigned ExpCnt, unsigned DsCnt, unsigned StoreCnt,
          unsigned SampleCnt, unsigned BvhCnt, unsigned KmCnt, unsigned XCnt,
          unsigned VaVdst, unsigned VmVsrc)
      : LoadCnt(LoadCnt), ExpCnt(ExpCnt), DsCnt(DsCnt), StoreCnt(StoreCnt),
        SampleCnt(SampleCnt), BvhCnt(BvhCnt), KmCnt(KmCnt), XCnt(XCnt),
        VaVdst(VaVdst), VmVsrc(VmVsrc) {}

  /// \returns True if any counter differs from ~0u.
  bool hasWait() const { return hasWaitStoreCnt() || hasWaitExceptStoreCnt(); }

  /// \returns True if any counter other than StoreCnt differs from ~0u.
  bool hasWaitExceptStoreCnt() const {
    const unsigned NoWait = ~0u;
    if (LoadCnt != NoWait || ExpCnt != NoWait || DsCnt != NoWait)
      return true;
    if (SampleCnt != NoWait || BvhCnt != NoWait || KmCnt != NoWait ||
        XCnt != NoWait)
      return true;
    return hasWaitDepctr();
  }

  /// \returns True if StoreCnt differs from ~0u.
  bool hasWaitStoreCnt() const { return StoreCnt != ~0u; }

  /// \returns True if VaVdst or VmVsrc differs from ~0u.
  bool hasWaitDepctr() const {
    const unsigned NoWait = ~0u;
    return VaVdst != NoWait || VmVsrc != NoWait;
  }

  /// \returns A Waitcnt whose every counter is the minimum of the matching
  /// counters in this object and \p Other.
  Waitcnt combined(const Waitcnt &Other) const {
    // Does the right thing provided self and Other are either both pre-gfx12
    // or both gfx12+.
    Waitcnt Merged;
    Merged.LoadCnt = std::min(LoadCnt, Other.LoadCnt);
    Merged.ExpCnt = std::min(ExpCnt, Other.ExpCnt);
    Merged.DsCnt = std::min(DsCnt, Other.DsCnt);
    Merged.StoreCnt = std::min(StoreCnt, Other.StoreCnt);
    Merged.SampleCnt = std::min(SampleCnt, Other.SampleCnt);
    Merged.BvhCnt = std::min(BvhCnt, Other.BvhCnt);
    Merged.KmCnt = std::min(KmCnt, Other.KmCnt);
    Merged.XCnt = std::min(XCnt, Other.XCnt);
    Merged.VaVdst = std::min(VaVdst, Other.VaVdst);
    Merged.VmVsrc = std::min(VmVsrc, Other.VmVsrc);
    return Merged;
  }

  friend raw_ostream &operator<<(raw_ostream &OS, const AMDGPU::Waitcnt &Wait);
};


/// Represents the hardware counter limits for different wait count types.
///
/// Every limit carries a default member initializer of 0, so a
/// default-constructed object holds determinate values instead of
/// uninitialized memory.
struct HardwareLimits {
  unsigned LoadcntMax = 0;   // Corresponds to Vmcnt prior to gfx12.
  unsigned ExpcntMax = 0;
  unsigned DscntMax = 0;     // Corresponds to LGKMcnt prior to gfx12.
  unsigned StorecntMax = 0;  // Corresponds to VScnt in gfx10/gfx11.
  unsigned SamplecntMax = 0; // gfx12+ only.
  unsigned BvhcntMax = 0;    // gfx12+ only.
  unsigned KmcntMax = 0;     // gfx12+ only.
  unsigned XcntMax = 0;      // gfx1250.
  unsigned VaVdstMax = 0;    // gfx12+ expert mode only.
  unsigned VmVsrcMax = 0;    // gfx12+ expert mode only.

  /// Creates limits with every maximum set to 0.
  HardwareLimits() = default;

  /// Initializes hardware limits from ISA version.
  HardwareLimits(const IsaVersion &IV);
};


// The following methods are only meaningful on targets that support

// S_WAITCNT.


/// \returns Vmcnt bit mask for given isa \p Version.

unsigned getVmcntBitMask(const IsaVersion &Version);


/// \returns Expcnt bit mask for given isa \p Version.

unsigned getExpcntBitMask(const IsaVersion &Version);


/// \returns Lgkmcnt bit mask for given isa \p Version.

unsigned getLgkmcntBitMask(const IsaVersion &Version);


/// \returns Waitcnt bit mask for given isa \p Version.

unsigned getWaitcntBitMask(const IsaVersion &Version);


/// \returns Decoded Vmcnt from given \p Waitcnt for given isa \p Version.

unsigned decodeVmcnt(const IsaVersion &Version, unsigned Waitcnt);


/// \returns Decoded Expcnt from given \p Waitcnt for given isa \p Version.

unsigned decodeExpcnt(const IsaVersion &Version, unsigned Waitcnt);


/// \returns Decoded Lgkmcnt from given \p Waitcnt for given isa \p Version.

unsigned decodeLgkmcnt(const IsaVersion &Version, unsigned Waitcnt);


/// Decodes Vmcnt, Expcnt and Lgkmcnt from given \p Waitcnt for given isa

/// \p Version, and writes decoded values into \p Vmcnt, \p Expcnt and

/// \p Lgkmcnt respectively. Should not be used on gfx12+, the instruction

/// which needs it is deprecated

///

/// \details \p Vmcnt, \p Expcnt and \p Lgkmcnt are decoded as follows:

///     \p Vmcnt = \p Waitcnt[3:0]        (pre-gfx9)

///     \p Vmcnt = \p Waitcnt[15:14,3:0]  (gfx9,10)

///     \p Vmcnt = \p Waitcnt[15:10]      (gfx11)

///     \p Expcnt = \p Waitcnt[6:4]       (pre-gfx11)

///     \p Expcnt = \p Waitcnt[2:0]       (gfx11)

///     \p Lgkmcnt = \p Waitcnt[11:8]     (pre-gfx10)

///     \p Lgkmcnt = \p Waitcnt[13:8]     (gfx10)

///     \p Lgkmcnt = \p Waitcnt[9:4]      (gfx11)

///

void decodeWaitcnt(const IsaVersion &Version, unsigned Waitcnt, unsigned &Vmcnt,

                   unsigned &Expcnt, unsigned &Lgkmcnt);


Waitcnt decodeWaitcnt(const IsaVersion &Version, unsigned Encoded);


/// \returns \p Waitcnt with encoded \p Vmcnt for given isa \p Version.

unsigned encodeVmcnt(const IsaVersion &Version, unsigned Waitcnt,

                     unsigned Vmcnt);


/// \returns \p Waitcnt with encoded \p Expcnt for given isa \p Version.

unsigned encodeExpcnt(const IsaVersion &Version, unsigned Waitcnt,

                      unsigned Expcnt);


/// \returns \p Waitcnt with encoded \p Lgkmcnt for given isa \p Version.

unsigned encodeLgkmcnt(const IsaVersion &Version, unsigned Waitcnt,

                       unsigned Lgkmcnt);


/// Encodes \p Vmcnt, \p Expcnt and \p Lgkmcnt into Waitcnt for given isa

/// \p Version. Should not be used on gfx12+, the instruction which needs

/// it is deprecated

///

/// \details \p Vmcnt, \p Expcnt and \p Lgkmcnt are encoded as follows:

///     Waitcnt[2:0]   = \p Expcnt      (gfx11+)

///     Waitcnt[3:0]   = \p Vmcnt       (pre-gfx9)

///     Waitcnt[3:0]   = \p Vmcnt[3:0]  (gfx9,10)

///     Waitcnt[6:4]   = \p Expcnt      (pre-gfx11)

///     Waitcnt[9:4]   = \p Lgkmcnt     (gfx11)

///     Waitcnt[11:8]  = \p Lgkmcnt     (pre-gfx10)

///     Waitcnt[13:8]  = \p Lgkmcnt     (gfx10)

///     Waitcnt[15:10] = \p Vmcnt       (gfx11)

///     Waitcnt[15:14] = \p Vmcnt[5:4]  (gfx9,10)

///

/// \returns Waitcnt with encoded \p Vmcnt, \p Expcnt and \p Lgkmcnt for given

/// isa \p Version.

///

unsigned encodeWaitcnt(const IsaVersion &Version, unsigned Vmcnt,

                       unsigned Expcnt, unsigned Lgkmcnt);


unsigned encodeWaitcnt(const IsaVersion &Version, const Waitcnt &Decoded);


// The following methods are only meaningful on targets that support

// S_WAIT_*CNT, introduced with gfx12.


/// \returns Loadcnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support LOADcnt

unsigned getLoadcntBitMask(const IsaVersion &Version);


/// \returns Samplecnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support SAMPLEcnt

unsigned getSamplecntBitMask(const IsaVersion &Version);


/// \returns Bvhcnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support BVHcnt

unsigned getBvhcntBitMask(const IsaVersion &Version);


/// \returns Dscnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support DScnt

unsigned getDscntBitMask(const IsaVersion &Version);


/// \returns Kmcnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support KMcnt

unsigned getKmcntBitMask(const IsaVersion &Version);


/// \returns Xcnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support Xcnt.

unsigned getXcntBitMask(const IsaVersion &Version);


/// \return STOREcnt or VScnt bit mask for given isa \p Version.

/// returns 0 for versions that do not support STOREcnt or VScnt.

/// STOREcnt and VScnt are the same counter, the name used

/// depends on the ISA version.

unsigned getStorecntBitMask(const IsaVersion &Version);


// The following are only meaningful on targets that support

// S_WAIT_LOADCNT_DSCNT and S_WAIT_STORECNT_DSCNT.


/// \returns Decoded Waitcnt structure from given \p LoadcntDscnt for given

/// isa \p Version.

Waitcnt decodeLoadcntDscnt(const IsaVersion &Version, unsigned LoadcntDscnt);


/// \returns Decoded Waitcnt structure from given \p StorecntDscnt for given

/// isa \p Version.

Waitcnt decodeStorecntDscnt(const IsaVersion &Version, unsigned StorecntDscnt);


/// \returns \p Loadcnt and \p Dscnt components of \p Decoded  encoded as an

/// immediate that can be used with S_WAIT_LOADCNT_DSCNT for given isa

/// \p Version.

unsigned encodeLoadcntDscnt(const IsaVersion &Version, const Waitcnt &Decoded);


/// \returns \p Storecnt and \p Dscnt components of \p Decoded  encoded as an

/// immediate that can be used with S_WAIT_STORECNT_DSCNT for given isa

/// \p Version.

unsigned encodeStorecntDscnt(const IsaVersion &Version, const Waitcnt &Decoded);


// Field layout of a hwreg immediate, expressed with EncodingField.
// NOTE(review): the numeric template arguments are presumably
// <high bit, low bit[, default value]> - confirm against EncodingField.
namespace Hwreg {


// Hardware register id field.
using HwregId = EncodingField<5, 0>;

// Offset field.
using HwregOffset = EncodingField<10, 6>;


// Size field. The encoded form is biased by one: encode() yields Value - 1
// and decode() yields Encoded + 1.
struct HwregSize : EncodingField<15, 11, 32> {

  // Reuse the base class constructors.
  using EncodingField::EncodingField;

  // \returns The stored value minus one.
  constexpr uint64_t encode() const { return Value - 1; }

  // \returns \p Encoded plus one, undoing the bias applied by encode().
  static ValueType decode(uint64_t Encoded) { return Encoded + 1; }

};


// Id, offset and size fields combined into one encoding.
using HwregEncoding = EncodingFields<HwregId, HwregOffset, HwregSize>;


} // namespace Hwreg


namespace DepCtr {


int getDefaultDepCtrEncoding(const MCSubtargetInfo &STI);

int encodeDepCtr(const StringRef Name, int64_t Val, unsigned &UsedOprMask,

                 const MCSubtargetInfo &STI);

bool isSymbolicDepCtrEncoding(unsigned Code, bool &HasNonDefaultVal,

                              const MCSubtargetInfo &STI);

bool decodeDepCtr(unsigned Code, int &Id, StringRef &Name, unsigned &Val,

                  bool &IsDefault, const MCSubtargetInfo &STI);


/// \returns Maximum VaVdst value that can be encoded.

unsigned getVaVdstBitMask();


/// \returns Maximum VmVsrc value that can be encoded.

unsigned getVmVsrcBitMask();


/// \returns Decoded VaVdst from given immediate \p Encoded.

unsigned decodeFieldVaVdst(unsigned Encoded);


/// \returns Decoded VmVsrc from given immediate \p Encoded.

unsigned decodeFieldVmVsrc(unsigned Encoded);


/// \returns Decoded SaSdst from given immediate \p Encoded.

unsigned decodeFieldSaSdst(unsigned Encoded);


/// \returns Decoded VaSdst from given immediate \p Encoded.

unsigned decodeFieldVaSdst(unsigned Encoded);


/// \returns Decoded VaVcc from given immediate \p Encoded.

unsigned decodeFieldVaVcc(unsigned Encoded);


/// \returns Decoded VaSsrc from given immediate \p Encoded.

unsigned decodeFieldVaSsrc(unsigned Encoded);


/// \returns Decoded HoldCnt from given immediate \p Encoded.

unsigned decodeFieldHoldCnt(unsigned Encoded);


/// \returns \p VmVsrc as an encoded Depctr immediate.

unsigned encodeFieldVmVsrc(unsigned VmVsrc, const MCSubtargetInfo &STI);


/// \returns \p Encoded combined with encoded \p VmVsrc.

unsigned encodeFieldVmVsrc(unsigned Encoded, unsigned VmVsrc);


/// \returns \p VaVdst as an encoded Depctr immediate.

unsigned encodeFieldVaVdst(unsigned VaVdst, const MCSubtargetInfo &STI);


/// \returns \p Encoded combined with encoded \p VaVdst.

unsigned encodeFieldVaVdst(unsigned Encoded, unsigned VaVdst);


/// \returns \p SaSdst as an encoded Depctr immediate.

unsigned encodeFieldSaSdst(unsigned SaSdst, const MCSubtargetInfo &STI);


/// \returns \p Encoded combined with encoded \p SaSdst.

unsigned encodeFieldSaSdst(unsigned Encoded, unsigned SaSdst);


/// \returns \p VaSdst as an encoded Depctr immediate.

unsigned encodeFieldVaSdst(unsigned VaSdst, const MCSubtargetInfo &STI);


/// \returns \p Encoded combined with encoded \p VaSdst.

unsigned encodeFieldVaSdst(unsigned Encoded, unsigned VaSdst);


/// \returns \p VaVcc as an encoded Depctr immediate.

unsigned encodeFieldVaVcc(unsigned VaVcc, const MCSubtargetInfo &STI);


/// \returns \p Encoded combined with encoded \p VaVcc.

unsigned encodeFieldVaVcc(unsigned Encoded, unsigned VaVcc);


/// \returns \p HoldCnt as an encoded Depctr immediate.

unsigned encodeFieldHoldCnt(unsigned HoldCnt, const MCSubtargetInfo &STI);


/// \returns \p Encoded combined with encoded \p HoldCnt.

unsigned encodeFieldHoldCnt(unsigned Encoded, unsigned HoldCnt);


/// \returns \p VaSsrc as an encoded Depctr immediate.

unsigned encodeFieldVaSsrc(unsigned VaSsrc, const MCSubtargetInfo &STI);


/// \returns \p Encoded combined with encoded \p VaSsrc.

unsigned encodeFieldVaSsrc(unsigned Encoded, unsigned VaSsrc);


} // namespace DepCtr


namespace Exp {


bool getTgtName(unsigned Id, StringRef &Name, int &Index);


LLVM_READONLY

unsigned getTgtId(const StringRef Name);


LLVM_READNONE

bool isSupportedTgtId(unsigned Id, const MCSubtargetInfo &STI);


} // namespace Exp


namespace MTBUFFormat {


LLVM_READNONE

int64_t encodeDfmtNfmt(unsigned Dfmt, unsigned Nfmt);


void decodeDfmtNfmt(unsigned Format, unsigned &Dfmt, unsigned &Nfmt);


int64_t getDfmt(const StringRef Name);


StringRef getDfmtName(unsigned Id);


int64_t getNfmt(const StringRef Name, const MCSubtargetInfo &STI);


StringRef getNfmtName(unsigned Id, const MCSubtargetInfo &STI);


bool isValidDfmtNfmt(unsigned Val, const MCSubtargetInfo &STI);


bool isValidNfmt(unsigned Val, const MCSubtargetInfo &STI);


int64_t getUnifiedFormat(const StringRef Name, const MCSubtargetInfo &STI);


StringRef getUnifiedFormatName(unsigned Id, const MCSubtargetInfo &STI);


bool isValidUnifiedFormat(unsigned Val, const MCSubtargetInfo &STI);


int64_t convertDfmtNfmt2Ufmt(unsigned Dfmt, unsigned Nfmt,

                             const MCSubtargetInfo &STI);


bool isValidFormatEncoding(unsigned Val, const MCSubtargetInfo &STI);


unsigned getDefaultFormatEncoding(const MCSubtargetInfo &STI);


} // namespace MTBUFFormat


namespace SendMsg {


LLVM_READNONE

bool isValidMsgId(int64_t MsgId, const MCSubtargetInfo &STI);


LLVM_READNONE

bool isValidMsgOp(int64_t MsgId, int64_t OpId, const MCSubtargetInfo &STI,

                  bool Strict = true);


LLVM_READNONE

bool isValidMsgStream(int64_t MsgId, int64_t OpId, int64_t StreamId,

                      const MCSubtargetInfo &STI, bool Strict = true);


LLVM_READNONE

bool msgRequiresOp(int64_t MsgId, const MCSubtargetInfo &STI);


LLVM_READNONE

bool msgSupportsStream(int64_t MsgId, int64_t OpId, const MCSubtargetInfo &STI);


void decodeMsg(unsigned Val, uint16_t &MsgId, uint16_t &OpId,

               uint16_t &StreamId, const MCSubtargetInfo &STI);


LLVM_READNONE

uint64_t encodeMsg(uint64_t MsgId, uint64_t OpId, uint64_t StreamId);


} // namespace SendMsg


unsigned getInitialPSInputAddr(const Function &F);


bool getHasColorExport(const Function &F);


bool getHasDepthExport(const Function &F);


bool hasDynamicVGPR(const Function &F);


// Returns the value of the "amdgpu-dynamic-vgpr-block-size" attribute, or 0 if

// the attribute is missing or its value is invalid.

unsigned getDynamicVGPRBlockSize(const Function &F);


/// \returns True if \p CC is one of the AMDGPU shader calling conventions:
/// VS, LS, HS, ES, GS, PS, CS_Chain, CS_ChainPreserve or CS.
LLVM_READNONE
constexpr bool isShader(CallingConv::ID CC) {
  return CC == CallingConv::AMDGPU_VS || CC == CallingConv::AMDGPU_LS ||
         CC == CallingConv::AMDGPU_HS || CC == CallingConv::AMDGPU_ES ||
         CC == CallingConv::AMDGPU_GS || CC == CallingConv::AMDGPU_PS ||
         CC == CallingConv::AMDGPU_CS_Chain ||
         CC == CallingConv::AMDGPU_CS_ChainPreserve ||
         CC == CallingConv::AMDGPU_CS;
}


/// \returns True if \p CC is a shader calling convention (see isShader),
/// AMDGPU_Gfx or AMDGPU_Gfx_WholeWave.
LLVM_READNONE
constexpr bool isGraphics(CallingConv::ID CC) {
  if (isShader(CC))
    return true;
  return CC == CallingConv::AMDGPU_Gfx ||
         CC == CallingConv::AMDGPU_Gfx_WholeWave;
}


/// \returns True if \p CC is AMDGPU_CS or is not a graphics calling
/// convention (see isGraphics).
LLVM_READNONE
constexpr bool isCompute(CallingConv::ID CC) {
  // AMDGPU_CS counts as compute even though isGraphics() accepts it too.
  if (CC == CallingConv::AMDGPU_CS)
    return true;
  return !isGraphics(CC);
}


/// \returns True if \p CC is AMDGPU_KERNEL, SPIR_KERNEL or one of the
/// AMDGPU_VS/GS/PS/CS/ES/HS/LS calling conventions.
LLVM_READNONE
constexpr bool isEntryFunctionCC(CallingConv::ID CC) {
  return CC == CallingConv::AMDGPU_KERNEL || CC == CallingConv::SPIR_KERNEL ||
         CC == CallingConv::AMDGPU_VS || CC == CallingConv::AMDGPU_GS ||
         CC == CallingConv::AMDGPU_PS || CC == CallingConv::AMDGPU_CS ||
         CC == CallingConv::AMDGPU_ES || CC == CallingConv::AMDGPU_HS ||
         CC == CallingConv::AMDGPU_LS;
}


/// \returns True if \p CC is AMDGPU_CS_Chain or AMDGPU_CS_ChainPreserve.
LLVM_READNONE
constexpr bool isChainCC(CallingConv::ID CC) {
  return CC == CallingConv::AMDGPU_CS_Chain ||
         CC == CallingConv::AMDGPU_CS_ChainPreserve;
}


// Module entry points are functions that may be called from outside the
// current module. This differs from isEntryFunctionCC, which is only true for
// functions that are entered by the hardware. Module entry points include all
// entry functions but also functions that can be called from other functions
// inside or outside the current module. Module entry functions are allowed to
// allocate LDS.
//
// \returns True if \p CC is AMDGPU_Gfx, an entry function calling convention
// or a chain calling convention.
LLVM_READNONE
constexpr bool isModuleEntryFunctionCC(CallingConv::ID CC) {
  if (CC == CallingConv::AMDGPU_Gfx)
    return true;
  return isEntryFunctionCC(CC) || isChainCC(CC);
}


/// \returns True if \p CC is AMDGPU_KERNEL or SPIR_KERNEL.
LLVM_READNONE
constexpr inline bool isKernel(CallingConv::ID CC) {
  return CC == CallingConv::AMDGPU_KERNEL || CC == CallingConv::SPIR_KERNEL;
}


inline bool isKernel(const Function &F) { return isKernel(F.getCallingConv()); }


/// \returns True only if \p CC is CallingConv::Fast.
LLVM_READNONE
constexpr bool canGuaranteeTCO(CallingConv::ID CC) {
  return CallingConv::Fast == CC;
}


/// Return true if we might ever do TCO for calls with this calling convention.
/// That holds for C, AMDGPU_Gfx, AMDGPU_Gfx_WholeWave and any convention
/// accepted by canGuaranteeTCO.
LLVM_READNONE
constexpr bool mayTailCallThisCC(CallingConv::ID CC) {
  if (CC == CallingConv::C || CC == CallingConv::AMDGPU_Gfx ||
      CC == CallingConv::AMDGPU_Gfx_WholeWave)
    return true;
  return canGuaranteeTCO(CC);
}


bool hasXNACK(const MCSubtargetInfo &STI);

bool hasSRAMECC(const MCSubtargetInfo &STI);

bool hasMIMG_R128(const MCSubtargetInfo &STI);

bool hasA16(const MCSubtargetInfo &STI);

bool hasG16(const MCSubtargetInfo &STI);

bool hasPackedD16(const MCSubtargetInfo &STI);

bool hasGDS(const MCSubtargetInfo &STI);

unsigned getNSAMaxSize(const MCSubtargetInfo &STI, bool HasSampler = false);

unsigned getMaxNumUserSGPRs(const MCSubtargetInfo &STI);


bool isSI(const MCSubtargetInfo &STI);

bool isCI(const MCSubtargetInfo &STI);

bool isVI(const MCSubtargetInfo &STI);

bool isGFX9(const MCSubtargetInfo &STI);

bool isGFX9_GFX10(const MCSubtargetInfo &STI);

bool isGFX9_GFX10_GFX11(const MCSubtargetInfo &STI);

bool isGFX8_GFX9_GFX10(const MCSubtargetInfo &STI);

bool isGFX8Plus(const MCSubtargetInfo &STI);

bool isGFX9Plus(const MCSubtargetInfo &STI);

bool isNotGFX9Plus(const MCSubtargetInfo &STI);

bool isGFX10(const MCSubtargetInfo &STI);

bool isGFX10_GFX11(const MCSubtargetInfo &STI);

bool isGFX10Plus(const MCSubtargetInfo &STI);

bool isNotGFX10Plus(const MCSubtargetInfo &STI);

bool isGFX10Before1030(const MCSubtargetInfo &STI);

bool isGFX11(const MCSubtargetInfo &STI);

bool isGFX11Plus(const MCSubtargetInfo &STI);

bool isGFX12(const MCSubtargetInfo &STI);

bool isGFX12Plus(const MCSubtargetInfo &STI);

bool isGFX1250(const MCSubtargetInfo &STI);

bool supportsWGP(const MCSubtargetInfo &STI);

bool isNotGFX12Plus(const MCSubtargetInfo &STI);

bool isNotGFX11Plus(const MCSubtargetInfo &STI);

bool isGCN3Encoding(const MCSubtargetInfo &STI);

bool isGFX10_AEncoding(const MCSubtargetInfo &STI);

bool isGFX10_BEncoding(const MCSubtargetInfo &STI);

bool hasGFX10_3Insts(const MCSubtargetInfo &STI);

bool isGFX10_3_GFX11(const MCSubtargetInfo &STI);

bool isGFX90A(const MCSubtargetInfo &STI);

bool isGFX940(const MCSubtargetInfo &STI);

bool hasArchitectedFlatScratch(const MCSubtargetInfo &STI);

bool hasMAIInsts(const MCSubtargetInfo &STI);

bool hasVOPD(const MCSubtargetInfo &STI);

bool hasDPPSrc1SGPR(const MCSubtargetInfo &STI);


/// \returns True if \p STI is GFX10 or later according to isGFX10Plus and is
/// not GFX1250 according to isGFX1250.
inline bool supportsWave32(const MCSubtargetInfo &STI) {
  if (!AMDGPU::isGFX10Plus(STI))
    return false;
  return !AMDGPU::isGFX1250(STI);
}


int getTotalNumVGPRs(bool has90AInsts, int32_t ArgNumAGPR, int32_t ArgNumVGPR);

unsigned hasKernargPreload(const MCSubtargetInfo &STI);

bool hasSMRDSignedImmOffset(const MCSubtargetInfo &ST);


/// Is \p Reg a scalar register?

bool isSGPR(MCRegister Reg, const MCRegisterInfo *TRI);


/// \returns true if \p Reg occupies the high 16-bits of a 32-bit register.

bool isHi16Reg(MCRegister Reg, const MCRegisterInfo &MRI);


/// If \p Reg is a pseudo reg, return the correct hardware register given

/// \p STI otherwise return \p Reg.

MCRegister getMCReg(MCRegister Reg, const MCSubtargetInfo &STI);


/// Convert hardware register \p Reg to a pseudo register

LLVM_READNONE

MCRegister mc2PseudoReg(MCRegister Reg);


LLVM_READNONE

bool isInlineValue(MCRegister Reg);


/// Is this an AMDGPU specific source operand? These include registers,
/// inline constants, literals and mandatory literals (KImm).
///
/// \returns True if the operand type of \p OpInfo lies in the closed range
/// [OPERAND_SRC_FIRST, OPERAND_SRC_LAST].
constexpr bool isSISrcOperand(const MCOperandInfo &OpInfo) {
  return AMDGPU::OPERAND_SRC_FIRST <= OpInfo.OperandType &&
         AMDGPU::OPERAND_SRC_LAST >= OpInfo.OperandType;
}


inline bool isSISrcOperand(const MCInstrDesc &Desc, unsigned OpNo) {

  return isSISrcOperand(Desc.operands()[OpNo]);

}


/// Is this a KImm operand?

bool isKImmOperand(const MCInstrDesc &Desc, unsigned OpNo);


/// Is this a floating-point operand?

bool isSISrcFPOperand(const MCInstrDesc &Desc, unsigned OpNo);


/// Does this operand support only inlinable literals?

bool isSISrcInlinableOperand(const MCInstrDesc &Desc, unsigned OpNo);


/// Get the size in bits of a register from the register class ID \p RCID.

unsigned getRegBitWidth(unsigned RCID);


/// Get the size in bits of a register from the register class \p RC.

unsigned getRegBitWidth(const MCRegisterClass &RC);


/// \returns The size associated with the operand type of \p OpInfo: 2 for the
/// 16-bit and packed 16-bit types, 4 for the 32-bit types and 8 for the 64-bit
/// types (in bytes, judging by the 32-bit types mapping to 4). Any operand
/// type not listed below is treated as unreachable.
LLVM_READNONE
inline unsigned getOperandSize(const MCOperandInfo &OpInfo) {
  switch (OpInfo.OperandType) {
  // 16-bit scalar and packed 16-bit operand types.
  case AMDGPU::OPERAND_REG_IMM_INT16:
  case AMDGPU::OPERAND_REG_IMM_BF16:
  case AMDGPU::OPERAND_REG_IMM_FP16:
  case AMDGPU::OPERAND_REG_INLINE_C_INT16:
  case AMDGPU::OPERAND_REG_INLINE_C_BF16:
  case AMDGPU::OPERAND_REG_INLINE_C_FP16:
  case AMDGPU::OPERAND_REG_INLINE_C_V2INT16:
  case AMDGPU::OPERAND_REG_INLINE_C_V2BF16:
  case AMDGPU::OPERAND_REG_INLINE_C_V2FP16:
  case AMDGPU::OPERAND_REG_IMM_V2INT16:
  case AMDGPU::OPERAND_REG_IMM_V2BF16:
  case AMDGPU::OPERAND_REG_IMM_V2FP16:
  case AMDGPU::OPERAND_REG_IMM_NOINLINE_V2FP16:
    return 2;

  // 32-bit operand types.
  case AMDGPU::OPERAND_REG_IMM_INT32:
  case AMDGPU::OPERAND_REG_IMM_FP32:
  case AMDGPU::OPERAND_REG_INLINE_C_INT32:
  case AMDGPU::OPERAND_REG_INLINE_C_FP32:
  case AMDGPU::OPERAND_REG_INLINE_AC_INT32:
  case AMDGPU::OPERAND_REG_INLINE_AC_FP32:
  case AMDGPU::OPERAND_REG_IMM_V2INT32:
  case AMDGPU::OPERAND_REG_IMM_V2FP32:
  case AMDGPU::OPERAND_KIMM32:
  case AMDGPU::OPERAND_KIMM16: // mandatory literal is always size 4
  case AMDGPU::OPERAND_INLINE_SPLIT_BARRIER_INT32:
    return 4;

  // 64-bit operand types.
  case AMDGPU::OPERAND_REG_IMM_INT64:
  case AMDGPU::OPERAND_REG_IMM_FP64:
  case AMDGPU::OPERAND_REG_INLINE_C_INT64:
  case AMDGPU::OPERAND_REG_INLINE_C_FP64:
  case AMDGPU::OPERAND_REG_INLINE_AC_FP64:
  case AMDGPU::OPERAND_KIMM64:
    return 8;

  default:
    llvm_unreachable("unhandled operand type");
  }
}


/// Convenience overload: applies getOperandSize to operand number \p OpNo of
/// \p Desc.
LLVM_READNONE
inline unsigned getOperandSize(const MCInstrDesc &Desc, unsigned OpNo) {
  const MCOperandInfo &OpInfo = Desc.operands()[OpNo];
  return getOperandSize(OpInfo);
}


/// Is this literal inlinable, and not one of the values intended for floating

/// point values.

LLVM_READNONE


inline bool isInlinableIntLiteral(int64_t Literal) {
  // Accepted values form the closed interval [-16, 64].
  if (Literal < -16)
    return false;
  return Literal <= 64;
}


/// Is this literal inlinable

LLVM_READNONE

bool isInlinableLiteral64(int64_t Literal, bool HasInv2Pi);


LLVM_READNONE

bool isInlinableLiteral32(int32_t Literal, bool HasInv2Pi);


LLVM_READNONE

bool isInlinableLiteralBF16(int16_t Literal, bool HasInv2Pi);


LLVM_READNONE

bool isInlinableLiteralFP16(int16_t Literal, bool HasInv2Pi);


LLVM_READNONE

bool isInlinableLiteralI16(int32_t Literal, bool HasInv2Pi);


LLVM_READNONE

std::optional<unsigned> getInlineEncodingV2I16(uint32_t Literal);


LLVM_READNONE

std::optional<unsigned> getInlineEncodingV2BF16(uint32_t Literal);


LLVM_READNONE

std::optional<unsigned> getInlineEncodingV2F16(uint32_t Literal);


LLVM_READNONE

bool isInlinableLiteralV216(uint32_t Literal, uint8_t OpType);


LLVM_READNONE

bool isInlinableLiteralV2I16(uint32_t Literal);


LLVM_READNONE

bool isInlinableLiteralV2BF16(uint32_t Literal);


LLVM_READNONE

bool isInlinableLiteralV2F16(uint32_t Literal);


LLVM_READNONE

bool isValid32BitLiteral(uint64_t Val, bool IsFP64);


LLVM_READNONE

int64_t encode32BitLiteral(int64_t Imm, OperandType Type, bool IsLit);


bool isArgPassedInSGPR(const Argument *Arg);


bool isArgPassedInSGPR(const CallBase *CB, unsigned ArgNo);


LLVM_READONLY bool isPackedFP32Inst(unsigned Opc);


LLVM_READONLY

bool isLegalSMRDEncodedUnsignedOffset(const MCSubtargetInfo &ST,

                                      int64_t EncodedOffset);


LLVM_READONLY

bool isLegalSMRDEncodedSignedOffset(const MCSubtargetInfo &ST,

                                    int64_t EncodedOffset, bool IsBuffer);


/// Convert \p ByteOffset to dwords if the subtarget uses dword SMRD immediate

/// offsets.

uint64_t convertSMRDOffsetUnits(const MCSubtargetInfo &ST, uint64_t ByteOffset);


/// \returns The encoding that will be used for \p ByteOffset in the

/// SMRD offset field, or std::nullopt if it won't fit. On GFX9 and GFX10

/// S_LOAD instructions have a signed offset, on other subtargets it is

/// unsigned. S_BUFFER has an unsigned offset for all subtargets.

std::optional<int64_t> getSMRDEncodedOffset(const MCSubtargetInfo &ST,

                                            int64_t ByteOffset, bool IsBuffer,

                                            bool HasSOffset = false);


/// \return The encoding that can be used for a 32-bit literal offset in an SMRD

/// instruction. This is only useful on CI.

std::optional<int64_t> getSMRDEncodedLiteralOffset32(const MCSubtargetInfo &ST,

                                                     int64_t ByteOffset);


/// For pre-GFX12 FLAT instructions the offset must be positive;

/// MSB is ignored and forced to zero.

///

/// \return The number of bits available for the signed offset field in flat

/// instructions. Note that some forms of the instruction disallow negative

/// offsets.

unsigned getNumFlatOffsetBits(const MCSubtargetInfo &ST);


/// \returns true if this offset is small enough to fit in the SMRD

/// offset field.  \p ByteOffset should be the offset in bytes and

/// not the encoded offset.

bool isLegalSMRDImmOffset(const MCSubtargetInfo &ST, int64_t ByteOffset);


/// \returns True if \p DC is accepted for \p ST: on targets for which isGFX12
/// holds, \p DC must lie in [ROW_SHARE_FIRST, ROW_SHARE_LAST]; otherwise, on
/// targets for which isGFX90A holds, it must lie in
/// [ROW_NEWBCAST_FIRST, ROW_NEWBCAST_LAST]. Every other target yields false.
LLVM_READNONE
inline bool isLegalDPALU_DPPControl(const MCSubtargetInfo &ST, unsigned DC) {
  // The GFX12 check takes precedence over the GFX90A one.
  if (isGFX12(ST))
    return DPP::ROW_SHARE_FIRST <= DC && DPP::ROW_SHARE_LAST >= DC;
  return isGFX90A(ST) && DPP::ROW_NEWBCAST_FIRST <= DC &&
         DPP::ROW_NEWBCAST_LAST >= DC;
}


/// \returns true if an instruction may have a 64-bit VGPR operand.

bool hasAny64BitVGPROperands(const MCInstrDesc &OpDesc,

                             const MCSubtargetInfo &ST);


/// \returns true if an instruction is a DP ALU DPP without any 64-bit operands.

bool isDPALU_DPP32BitOpc(unsigned Opc);


/// \returns true if an instruction is a DP ALU DPP.

bool isDPALU_DPP(const MCInstrDesc &OpDesc, const MCInstrInfo &MII,

                 const MCSubtargetInfo &ST);


/// \returns true if the intrinsic is divergent

bool isIntrinsicSourceOfDivergence(unsigned IntrID);


/// \returns true if the intrinsic is uniform

bool isIntrinsicAlwaysUniform(unsigned IntrID);


/// \returns a register class for the physical register \p Reg if it is a VGPR

/// or nullptr otherwise.

const MCRegisterClass *getVGPRPhysRegClass(MCRegister Reg,

                                           const MCRegisterInfo &MRI);


/// \returns the MODE bits which have to be set by the S_SET_VGPR_MSB for the

/// physical register \p Reg.

unsigned getVGPREncodingMSBs(MCRegister Reg, const MCRegisterInfo &MRI);


/// If \p Reg is a low VGPR return a corresponding high VGPR with \p MSBs set.

MCRegister getVGPRWithMSBs(MCRegister Reg, unsigned MSBs,

                           const MCRegisterInfo &MRI);


/// \returns a table for the opcode with a given \p Desc to map the VGPR MSB

/// set by the S_SET_VGPR_MSB to one of 4 sources. In case of VOPD returns 2

/// maps, one for X and one for Y component.

std::pair<const AMDGPU::OpName *, const AMDGPU::OpName *>

getVGPRLoweringOperandTables(const MCInstrDesc &Desc);


/// \returns true if a memory instruction supports scale_offset modifier.

bool supportsScaleOffset(const MCInstrInfo &MII, unsigned Opcode);


/// \returns lds block size in terms of dwords.

/// This is used to calculate the lds size encoded for PAL metadata 3.0+ which

/// must be defined in terms of bytes.

unsigned getLdsDwGranularity(const MCSubtargetInfo &ST);


/// Value type that pairs a cluster-dimension kind with a triple of dimensions.
///
/// A default-constructed object has kind Kind::Unknown and dims {0, 0, 0}.
/// The set*() helpers switch to one of the dimension-less kinds and put the
/// stored dims back to zero.
class ClusterDimsAttr {
public:
  /// Discriminates what this attribute currently represents.
  enum class Kind { Unknown, NoCluster, VariableDims, FixedDims };

  ClusterDimsAttr() = default;

  /// \returns the kind currently stored.
  Kind getKind() const { return AttrKind; }

  // One predicate per Kind enumerator.
  bool isUnknown() const { return AttrKind == Kind::Unknown; }

  bool isNoCluster() const { return AttrKind == Kind::NoCluster; }

  bool isFixedDims() const { return AttrKind == Kind::FixedDims; }

  bool isVariableDims() const { return AttrKind == Kind::VariableDims; }

  /// Resets the object to kind Unknown with zeroed dims.
  void setUnknown() {
    Dims.fill(0);
    AttrKind = Kind::Unknown;
  }

  /// Resets the object to kind NoCluster with zeroed dims.
  void setNoCluster() {
    Dims.fill(0);
    AttrKind = Kind::NoCluster;
  }

  /// Resets the object to kind VariableDims with zeroed dims.
  void setVariableDims() {
    Dims.fill(0);
    AttrKind = Kind::VariableDims;
  }

  /// \returns the dims stored. Note that this function can only be called if
  /// the kind is Kind::FixedDims.
  const std::array<unsigned, 3> &getDims() const;

  /// Two attributes are equal when both the kind and all three dims match.
  bool operator==(const ClusterDimsAttr &RHS) const {
    if (AttrKind != RHS.AttrKind)
      return false;
    return Dims == RHS.Dims;
  }

  /// \returns a string form of this attribute (defined out of line).
  std::string to_string() const;

  /// Builds the attribute for \p F (defined out of line).
  static ClusterDimsAttr get(const Function &F);

private:
  // NOTE(review): presumably the raw values that stand for the NoCluster and
  // VariableDims kinds in the encoded form read by get() -- confirm against
  // the out-of-line definition.
  enum Encoding { EncoNoCluster = 0, EncoVariableDims = 1024 };

  /// Creates an attribute of kind \p K; dims keep their zero default.
  ClusterDimsAttr(Kind K) : AttrKind(K) {}

  std::array<unsigned, 3> Dims = {0, 0, 0};

  Kind AttrKind = Kind::Unknown;
};


} // end namespace AMDGPU


/// Stream-insertion overload for AMDGPU::IsaInfo::TargetIDSetting values.
/// NOTE(review): presumably writes a textual form of \p S and returns \p OS
/// for chaining -- only the declaration is visible here, confirm against the
/// definition.
raw_ostream &operator<<(raw_ostream &OS,

                        const AMDGPU::IsaInfo::TargetIDSetting S);


} // end namespace llvm


#endif // LLVM_LIB_TARGET_AMDGPU_UTILS_AMDGPUBASEINFO_H

MRI
unsigned const MachineRegisterInfo * MRI
Definition AArch64AdvSIMDScalarPass.cpp:103

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

AMDGPUSubtarget.h
Base class for AMDGPU specific classes of TargetSubtarget.

Alignment.h

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

CallingConv.h

LLVM_READNONE
#define LLVM_READNONE
Definition Compiler.h:315

LLVM_READONLY
#define LLVM_READONLY
Definition Compiler.h:322

Module.h
Module.h This file contains the declarations for the Module class.

InlinePriorityMode::Size
@ Size
Definition InlineOrder.cpp:25

InstrTypes.h

F
#define F(x, y, z)
Definition MD5.cpp:54

G
#define G(x, y, z)
Definition MD5.cpp:55

Reg
Register Reg
Definition MachineSink.cpp:2121

TRI
Register const TargetRegisterInfo * TRI
Definition MachineSink.cpp:2122

Opc
auto Opc
Definition RISCVRedundantCopyElimination.cpp:77

SIDefines.h

DefaultVal
unsigned unsigned DefaultVal
Definition SPIRVModuleAnalysis.cpp:61

RHS
Value * RHS
Definition X86PartialReduction.cpp:81

IV
static const uint32_t IV[8]
Definition blake3_impl.h:83

llvm::AMDGPUSubtarget::Generation
Generation
Definition AMDGPUSubtarget.h:32

llvm::AMDGPU::ClusterDimsAttr
Definition AMDGPUBaseInfo.h:1864

llvm::AMDGPU::ClusterDimsAttr::isNoCluster
bool isNoCluster() const
Definition AMDGPUBaseInfo.h:1874

llvm::AMDGPU::ClusterDimsAttr::setUnknown
void setUnknown()
Definition AMDGPUBaseInfo.h:1880

llvm::AMDGPU::ClusterDimsAttr::get
static ClusterDimsAttr get(const Function &F)
Definition AMDGPUBaseInfo.cpp:3694

llvm::AMDGPU::ClusterDimsAttr::isFixedDims
bool isFixedDims() const
Definition AMDGPUBaseInfo.h:1876

llvm::AMDGPU::ClusterDimsAttr::Kind
Kind
Definition AMDGPUBaseInfo.h:1866

llvm::AMDGPU::ClusterDimsAttr::Kind::FixedDims
@ FixedDims
Definition AMDGPUBaseInfo.h:1866

llvm::AMDGPU::ClusterDimsAttr::Kind::NoCluster
@ NoCluster
Definition AMDGPUBaseInfo.h:1866

llvm::AMDGPU::ClusterDimsAttr::Kind::Unknown
@ Unknown
Definition AMDGPUBaseInfo.h:1866

llvm::AMDGPU::ClusterDimsAttr::Kind::VariableDims
@ VariableDims
Definition AMDGPUBaseInfo.h:1866

llvm::AMDGPU::ClusterDimsAttr::getKind
Kind getKind() const
Definition AMDGPUBaseInfo.h:1870

llvm::AMDGPU::ClusterDimsAttr::ClusterDimsAttr
ClusterDimsAttr()=default

llvm::AMDGPU::ClusterDimsAttr::setNoCluster
void setNoCluster()
Definition AMDGPUBaseInfo.h:1882

llvm::AMDGPU::ClusterDimsAttr::isUnknown
bool isUnknown() const
Definition AMDGPUBaseInfo.h:1872

llvm::AMDGPU::ClusterDimsAttr::setVariableDims
void setVariableDims()
Definition AMDGPUBaseInfo.h:1884

llvm::AMDGPU::ClusterDimsAttr::operator==
bool operator==(const ClusterDimsAttr &RHS) const
Definition AMDGPUBaseInfo.h:1890

llvm::AMDGPU::ClusterDimsAttr::to_string
std::string to_string() const
Definition AMDGPUBaseInfo.cpp:3670

llvm::AMDGPU::ClusterDimsAttr::getDims
const std::array< unsigned, 3 > & getDims() const
Definition AMDGPUBaseInfo.cpp:3665

llvm::AMDGPU::ClusterDimsAttr::isVariableDims
bool isVariableDims() const
Definition AMDGPUBaseInfo.h:1878

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isSramEccSupported
bool isSramEccSupported() const
Definition AMDGPUBaseInfo.h:190

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::setTargetIDFromFeaturesString
void setTargetIDFromFeaturesString(StringRef FS)
Definition AMDGPUBaseInfo.cpp:1029

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::setXnackSetting
void setXnackSetting(TargetIDSetting NewXnackSetting)
Sets xnack setting to NewXnackSetting.
Definition AMDGPUBaseInfo.h:185

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isSramEccOnOrAny
bool isSramEccOnOrAny() const
Definition AMDGPUBaseInfo.h:195

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::getXnackSetting
TargetIDSetting getXnackSetting() const
Definition AMDGPUBaseInfo.h:182

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isXnackOnOrAny
bool isXnackOnOrAny() const
Definition AMDGPUBaseInfo.h:168

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::AMDGPUTargetID
AMDGPUTargetID(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:1020

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isXnackOnOrOff
bool isXnackOnOrOff() const
Definition AMDGPUBaseInfo.h:175

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isXnackSupported
bool isXnackSupported() const
Definition AMDGPUBaseInfo.h:163

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::setTargetIDFromTargetIDStream
void setTargetIDFromTargetIDStream(StringRef TargetID)
Definition AMDGPUBaseInfo.cpp:1097

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::~AMDGPUTargetID
~AMDGPUTargetID()=default

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::setSramEccSetting
void setSramEccSetting(TargetIDSetting NewSramEccSetting)
Sets sramecc setting to NewSramEccSetting.
Definition AMDGPUBaseInfo.h:212

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isSramEccOnOrOff
bool isSramEccOnOrOff() const
Definition AMDGPUBaseInfo.h:202

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::toString
std::string toString() const
Definition AMDGPUBaseInfo.cpp:1109

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::getSramEccSetting
TargetIDSetting getSramEccSetting() const
Definition AMDGPUBaseInfo.h:209

llvm::AMDGPU::VOPD::ComponentInfo
Definition AMDGPUBaseInfo.h:885

llvm::AMDGPU::VOPD::ComponentInfo::getIndexInParsedOperands
unsigned getIndexInParsedOperands(unsigned CompOprIdx) const
Definition AMDGPUBaseInfo.cpp:894

llvm::AMDGPU::VOPD::ComponentInfo::ComponentInfo
ComponentInfo(const MCInstrDesc &OpDesc, ComponentKind Kind=ComponentKind::SINGLE, bool VOP3Layout=false)
Definition AMDGPUBaseInfo.h:888

llvm::AMDGPU::VOPD::ComponentInfo::ComponentInfo
ComponentInfo(const MCInstrDesc &OpDesc, const ComponentProps &OpXProps, bool VOP3Layout=false)
Definition AMDGPUBaseInfo.h:895

llvm::AMDGPU::VOPD::ComponentLayout::getIndexOfDstInMCOperands
unsigned getIndexOfDstInMCOperands() const
Definition AMDGPUBaseInfo.h:843

llvm::AMDGPU::VOPD::ComponentLayout::getIndexOfDstInParsedOperands
unsigned getIndexOfDstInParsedOperands() const
Definition AMDGPUBaseInfo.h:862

llvm::AMDGPU::VOPD::ComponentLayout::getIndexOfSrcInMCOperands
unsigned getIndexOfSrcInMCOperands(unsigned CompSrcIdx, bool VOPD3) const
Definition AMDGPUBaseInfo.h:846

llvm::AMDGPU::VOPD::ComponentLayout::ComponentLayout
ComponentLayout(const ComponentProps &OpXProps, unsigned VOPD3ModsNum, int BitOp3Idx)
Definition AMDGPUBaseInfo.h:836

llvm::AMDGPU::VOPD::ComponentLayout::getIndexOfSrcInParsedOperands
unsigned getIndexOfSrcInParsedOperands(unsigned CompSrcIdx) const
Definition AMDGPUBaseInfo.h:867

llvm::AMDGPU::VOPD::ComponentLayout::ComponentLayout
ComponentLayout(ComponentKind Kind, unsigned VOPD3ModsNum, int BitOp3Idx)
Definition AMDGPUBaseInfo.h:830

llvm::AMDGPU::VOPD::ComponentProps
Definition AMDGPUBaseInfo.h:696

llvm::AMDGPU::VOPD::ComponentProps::hasMandatoryLiteral
bool hasMandatoryLiteral() const
Definition AMDGPUBaseInfo.h:718

llvm::AMDGPU::VOPD::ComponentProps::getBitOp3OperandIdx
int getBitOp3OperandIdx() const
Definition AMDGPUBaseInfo.cpp:890

llvm::AMDGPU::VOPD::ComponentProps::hasRegSrcOperand
bool hasRegSrcOperand(unsigned CompSrcIdx) const
Definition AMDGPUBaseInfo.h:729

llvm::AMDGPU::VOPD::ComponentProps::hasSrc2Acc
bool hasSrc2Acc() const
Definition AMDGPUBaseInfo.h:735

llvm::AMDGPU::VOPD::ComponentProps::ComponentProps
ComponentProps()=default

llvm::AMDGPU::VOPD::ComponentProps::getCompSrcOperandsNum
unsigned getCompSrcOperandsNum() const
Definition AMDGPUBaseInfo.h:710

llvm::AMDGPU::VOPD::ComponentProps::getMandatoryLiteralCompOperandIndex
unsigned getMandatoryLiteralCompOperandIndex() const
Definition AMDGPUBaseInfo.h:722

llvm::AMDGPU::VOPD::ComponentProps::isVOP3
unsigned isVOP3() const
Definition AMDGPUBaseInfo.h:744

llvm::AMDGPU::VOPD::ComponentProps::getOpcode
unsigned getOpcode() const
Definition AMDGPUBaseInfo.h:741

llvm::AMDGPU::VOPD::ComponentProps::getCompVOPD3ModsNum
unsigned getCompVOPD3ModsNum() const
Definition AMDGPUBaseInfo.h:738

llvm::AMDGPU::VOPD::ComponentProps::getCompParsedSrcOperandsNum
unsigned getCompParsedSrcOperandsNum() const
Definition AMDGPUBaseInfo.h:713

llvm::AMDGPU::VOPD::InstInfo::getInvalidCompOperandIndex
std::optional< unsigned > getInvalidCompOperandIndex(std::function< MCRegister(unsigned, unsigned)> GetRegIdx, const MCRegisterInfo &MRI, bool SkipSrc=false, bool AllowSameVGPR=false, bool VOPD3=false) const
Definition AMDGPUBaseInfo.cpp:908

llvm::AMDGPU::VOPD::InstInfo::InstInfo
InstInfo(const ComponentInfo &OprInfoX, const ComponentInfo &OprInfoY)
Definition AMDGPUBaseInfo.h:917

llvm::AMDGPU::VOPD::InstInfo::hasInvalidOperand
bool hasInvalidOperand(std::function< MCRegister(unsigned, unsigned)> GetRegIdx, const MCRegisterInfo &MRI, bool SkipSrc=false, bool AllowSameVGPR=false, bool VOPD3=false) const
Definition AMDGPUBaseInfo.h:936

llvm::AMDGPU::VOPD::InstInfo::operator[]
const ComponentInfo & operator[](size_t ComponentIdx) const
Definition AMDGPUBaseInfo.h:920

llvm::AMDGPU::VOPD::InstInfo::InstInfo
InstInfo(const MCInstrDesc &OpX, const MCInstrDesc &OpY)
Definition AMDGPUBaseInfo.h:914

llvm::AMDGPU::VOPD::InstInfo::RegIndices
std::array< MCRegister, Component::MAX_OPR_NUM > RegIndices
Definition AMDGPUBaseInfo.h:912

llvm::Argument
This class represents an incoming formal argument to a Function.
Definition Argument.h:32

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition InstrTypes.h:1114

llvm::Function
Definition Function.h:64

llvm::GlobalValue
Definition GlobalValue.h:49

llvm::MCInstrDesc
Describe properties that are true of each instruction in the target description file.
Definition MCInstrDesc.h:199

llvm::MCInstrInfo
Interface to description of machine instruction set.
Definition MCInstrInfo.h:27

llvm::MCOperandInfo
This holds information about one operand of a machine instruction, indicating the register class for ...
Definition MCInstrDesc.h:86

llvm::MCRegisterClass
MCRegisterClass - Base class of TargetRegisterClass.
Definition MCRegisterInfo.h:37

llvm::MCRegisterInfo
MCRegisterInfo base class - We assume that the target defines a static array of MCRegisterDesc object...
Definition MCRegisterInfo.h:151

llvm::MCRegister
Wrapper class representing physical registers. Should be passed by value.
Definition MCRegister.h:41

llvm::MCSubtargetInfo
Generic base class for all target subtargets.
Definition MCSubtargetInfo.h:77

llvm::MDNode
Metadata node.
Definition Metadata.h:1078

llvm::Module
A Module instance is used to store all the information related to an LLVM module.
Definition Module.h:67

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1205

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55

llvm::Triple
Triple - Helper class for working with autoconf configuration names.
Definition Triple.h:47

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition raw_ostream.h:53

uint16_t

uint32_t

uint64_t

uint8_t

unsigned

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

OpName
Definition R600Defines.h:62

llvm::AMDGPU::DPP::ROW_NEWBCAST_LAST
@ ROW_NEWBCAST_LAST
Definition SIDefines.h:990

llvm::AMDGPU::DPP::ROW_SHARE_FIRST
@ ROW_SHARE_FIRST
Definition SIDefines.h:992

llvm::AMDGPU::DPP::ROW_NEWBCAST_FIRST
@ ROW_NEWBCAST_FIRST
Definition SIDefines.h:989

llvm::AMDGPU::DPP::ROW_SHARE_LAST
@ ROW_SHARE_LAST
Definition SIDefines.h:993

llvm::AMDGPU::DepCtr
Definition AMDGPUAsmUtils.cpp:63

llvm::AMDGPU::DepCtr::decodeFieldVaVcc
unsigned decodeFieldVaVcc(unsigned Encoded)
Definition AMDGPUBaseInfo.cpp:2095

llvm::AMDGPU::DepCtr::encodeFieldVaVcc
unsigned encodeFieldVaVcc(unsigned Encoded, unsigned VaVcc)
Definition AMDGPUBaseInfo.cpp:2143

llvm::AMDGPU::DepCtr::encodeFieldHoldCnt
unsigned encodeFieldHoldCnt(unsigned Encoded, unsigned HoldCnt)
Definition AMDGPUBaseInfo.cpp:2161

llvm::AMDGPU::DepCtr::decodeDepCtr
bool decodeDepCtr(unsigned Code, int &Id, StringRef &Name, unsigned &Val, bool &IsDefault, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2063

llvm::AMDGPU::DepCtr::getVmVsrcBitMask
unsigned getVmVsrcBitMask()
Definition AMDGPUBaseInfo.cpp:2077

llvm::AMDGPU::DepCtr::encodeFieldVaSsrc
unsigned encodeFieldVaSsrc(unsigned Encoded, unsigned VaSsrc)
Definition AMDGPUBaseInfo.cpp:2152

llvm::AMDGPU::DepCtr::encodeFieldVaVdst
unsigned encodeFieldVaVdst(unsigned Encoded, unsigned VaVdst)
Definition AMDGPUBaseInfo.cpp:2116

llvm::AMDGPU::DepCtr::decodeFieldSaSdst
unsigned decodeFieldSaSdst(unsigned Encoded)
Definition AMDGPUBaseInfo.cpp:2087

llvm::AMDGPU::DepCtr::decodeFieldVaSdst
unsigned decodeFieldVaSdst(unsigned Encoded)
Definition AMDGPUBaseInfo.cpp:2091

llvm::AMDGPU::DepCtr::getVaVdstBitMask
unsigned getVaVdstBitMask()
Definition AMDGPUBaseInfo.cpp:2075

llvm::AMDGPU::DepCtr::encodeFieldVmVsrc
unsigned encodeFieldVmVsrc(unsigned Encoded, unsigned VmVsrc)
Definition AMDGPUBaseInfo.cpp:2107

llvm::AMDGPU::DepCtr::decodeFieldVaSsrc
unsigned decodeFieldVaSsrc(unsigned Encoded)
Definition AMDGPUBaseInfo.cpp:2099

llvm::AMDGPU::DepCtr::encodeDepCtr
int encodeDepCtr(const StringRef Name, int64_t Val, unsigned &UsedOprMask, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2069

llvm::AMDGPU::DepCtr::encodeFieldSaSdst
unsigned encodeFieldSaSdst(unsigned Encoded, unsigned SaSdst)
Definition AMDGPUBaseInfo.cpp:2125

llvm::AMDGPU::DepCtr::isSymbolicDepCtrEncoding
bool isSymbolicDepCtrEncoding(unsigned Code, bool &HasNonDefaultVal, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2057

llvm::AMDGPU::DepCtr::decodeFieldVaVdst
unsigned decodeFieldVaVdst(unsigned Encoded)
Definition AMDGPUBaseInfo.cpp:2083

llvm::AMDGPU::DepCtr::decodeFieldHoldCnt
unsigned decodeFieldHoldCnt(unsigned Encoded)
Definition AMDGPUBaseInfo.cpp:2103

llvm::AMDGPU::DepCtr::getDefaultDepCtrEncoding
int getDefaultDepCtrEncoding(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2050

llvm::AMDGPU::DepCtr::decodeFieldVmVsrc
unsigned decodeFieldVmVsrc(unsigned Encoded)
Definition AMDGPUBaseInfo.cpp:2079

llvm::AMDGPU::DepCtr::encodeFieldVaSdst
unsigned encodeFieldVaSdst(unsigned Encoded, unsigned VaSdst)
Definition AMDGPUBaseInfo.cpp:2134

llvm::AMDGPU::Exp::isSupportedTgtId
bool isSupportedTgtId(unsigned Id, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2230

llvm::AMDGPU::Exp::getTgtName
bool getTgtName(unsigned Id, StringRef &Name, int &Index)
Definition AMDGPUBaseInfo.cpp:2196

llvm::AMDGPU::Exp::getTgtId
unsigned getTgtId(const StringRef Name)
Definition AMDGPUBaseInfo.cpp:2207

llvm::AMDGPU::GenericVersion
Generic target versions emitted by this version of LLVM.
Definition AMDGPUBaseInfo.h:52

llvm::AMDGPU::GenericVersion::GFX9_4
static constexpr unsigned GFX9_4
Definition AMDGPUBaseInfo.h:54

llvm::AMDGPU::GenericVersion::GFX10_1
static constexpr unsigned GFX10_1
Definition AMDGPUBaseInfo.h:55

llvm::AMDGPU::GenericVersion::GFX10_3
static constexpr unsigned GFX10_3
Definition AMDGPUBaseInfo.h:56

llvm::AMDGPU::GenericVersion::GFX11
static constexpr unsigned GFX11
Definition AMDGPUBaseInfo.h:57

llvm::AMDGPU::GenericVersion::GFX9
static constexpr unsigned GFX9
Definition AMDGPUBaseInfo.h:53

llvm::AMDGPU::GenericVersion::GFX12
static constexpr unsigned GFX12
Definition AMDGPUBaseInfo.h:58

llvm::AMDGPU::Hwreg
Definition SIDefines.h:502

llvm::AMDGPU::Hwreg::HwregOffset
EncodingField< 10, 6 > HwregOffset
Definition AMDGPUBaseInfo.h:1289

llvm::AMDGPU::Hwreg::HwregId
EncodingField< 5, 0 > HwregId
Definition AMDGPUBaseInfo.h:1288

llvm::AMDGPU::Hwreg::HwregEncoding
EncodingFields< HwregId, HwregOffset, HwregSize > HwregEncoding
Definition AMDGPUBaseInfo.h:1297

llvm::AMDGPU::IsaInfo::getVGPREncodingGranule
unsigned getVGPREncodingGranule(const MCSubtargetInfo *STI, std::optional< bool > EnableWavefrontSize32)
Definition AMDGPUBaseInfo.cpp:1379

llvm::AMDGPU::IsaInfo::TRAP_NUM_SGPRS
@ TRAP_NUM_SGPRS
Definition AMDGPUBaseInfo.h:147

llvm::AMDGPU::IsaInfo::FIXED_NUM_SGPRS_FOR_INIT_BUG
@ FIXED_NUM_SGPRS_FOR_INIT_BUG
Definition AMDGPUBaseInfo.h:146

llvm::AMDGPU::IsaInfo::getTotalNumVGPRs
unsigned getTotalNumVGPRs(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1396

llvm::AMDGPU::IsaInfo::getArchVGPRAllocGranule
unsigned getArchVGPRAllocGranule()
For subtargets with a unified VGPR file and mixed ArchVGPR/AGPR usage, returns the allocation granule...
Definition AMDGPUBaseInfo.cpp:1394

llvm::AMDGPU::IsaInfo::getWavesPerEUForWorkGroup
unsigned getWavesPerEUForWorkGroup(const MCSubtargetInfo *STI, unsigned FlatWorkGroupSize)
Definition AMDGPUBaseInfo.cpp:1233

llvm::AMDGPU::IsaInfo::getWavefrontSize
unsigned getWavefrontSize(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1150

llvm::AMDGPU::IsaInfo::getNumWavesPerEUWithNumVGPRs
unsigned getNumWavesPerEUWithNumVGPRs(const MCSubtargetInfo *STI, unsigned NumVGPRs, unsigned DynamicVGPRBlockSize)
Definition AMDGPUBaseInfo.cpp:1426

llvm::AMDGPU::IsaInfo::getMaxWorkGroupsPerCU
unsigned getMaxWorkGroupsPerCU(const MCSubtargetInfo *STI, unsigned FlatWorkGroupSize)
Definition AMDGPUBaseInfo.cpp:1203

llvm::AMDGPU::IsaInfo::getMaxFlatWorkGroupSize
unsigned getMaxFlatWorkGroupSize(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1241

llvm::AMDGPU::IsaInfo::getMaxWavesPerEU
unsigned getMaxWavesPerEU(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1224

llvm::AMDGPU::IsaInfo::getWavesPerWorkGroup
unsigned getWavesPerWorkGroup(const MCSubtargetInfo *STI, unsigned FlatWorkGroupSize)
Definition AMDGPUBaseInfo.cpp:1246

llvm::AMDGPU::IsaInfo::getNumExtraSGPRs
unsigned getNumExtraSGPRs(const MCSubtargetInfo *STI, bool VCCUsed, bool FlatScrUsed, bool XNACKUsed)
Definition AMDGPUBaseInfo.cpp:1315

llvm::AMDGPU::IsaInfo::getSGPREncodingGranule
unsigned getSGPREncodingGranule(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1260

llvm::AMDGPU::IsaInfo::getLocalMemorySize
unsigned getLocalMemorySize(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1159

llvm::AMDGPU::IsaInfo::getAddressableLocalMemorySize
unsigned getAddressableLocalMemorySize(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1171

llvm::AMDGPU::IsaInfo::getEUsPerCU
unsigned getEUsPerCU(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1183

llvm::AMDGPU::IsaInfo::getAddressableNumSGPRs
unsigned getAddressableNumSGPRs(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1269

llvm::AMDGPU::IsaInfo::getMinNumSGPRs
unsigned getMinNumSGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU)
Definition AMDGPUBaseInfo.cpp:1281

llvm::AMDGPU::IsaInfo::getMinFlatWorkGroupSize
unsigned getMinFlatWorkGroupSize(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1239

llvm::AMDGPU::IsaInfo::getVGPRAllocGranule
unsigned getVGPRAllocGranule(const MCSubtargetInfo *STI, unsigned DynamicVGPRBlockSize, std::optional< bool > EnableWavefrontSize32)
Definition AMDGPUBaseInfo.cpp:1357

llvm::AMDGPU::IsaInfo::getMaxNumSGPRs
unsigned getMaxNumSGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU, bool Addressable)
Definition AMDGPUBaseInfo.cpp:1298

llvm::AMDGPU::IsaInfo::getNumSGPRBlocks
unsigned getNumSGPRBlocks(const MCSubtargetInfo *STI, unsigned NumSGPRs)
Definition AMDGPUBaseInfo.cpp:1351

llvm::AMDGPU::IsaInfo::getMinWavesPerEU
unsigned getMinWavesPerEU(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1222

llvm::AMDGPU::IsaInfo::getMaxNumVGPRs
unsigned getMaxNumVGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU, unsigned DynamicVGPRBlockSize)
Definition AMDGPUBaseInfo.cpp:1497

llvm::AMDGPU::IsaInfo::getSGPRAllocGranule
unsigned getSGPRAllocGranule(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1251

llvm::AMDGPU::IsaInfo::TargetIDSetting
TargetIDSetting
Definition AMDGPUBaseInfo.h:150

llvm::AMDGPU::IsaInfo::TargetIDSetting::On
@ On
Definition AMDGPUBaseInfo.h:150

llvm::AMDGPU::IsaInfo::TargetIDSetting::Unsupported
@ Unsupported
Definition AMDGPUBaseInfo.h:150

llvm::AMDGPU::IsaInfo::TargetIDSetting::Off
@ Off
Definition AMDGPUBaseInfo.h:150

llvm::AMDGPU::IsaInfo::TargetIDSetting::Any
@ Any
Definition AMDGPUBaseInfo.h:150

llvm::AMDGPU::IsaInfo::getMinNumVGPRs
unsigned getMinNumVGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU, unsigned DynamicVGPRBlockSize)
Definition AMDGPUBaseInfo.cpp:1470

llvm::AMDGPU::IsaInfo::getAllocatedNumVGPRBlocks
unsigned getAllocatedNumVGPRBlocks(const MCSubtargetInfo *STI, unsigned NumVGPRs, unsigned DynamicVGPRBlockSize, std::optional< bool > EnableWavefrontSize32)
Definition AMDGPUBaseInfo.cpp:1516

llvm::AMDGPU::IsaInfo::getEncodedNumVGPRBlocks
unsigned getEncodedNumVGPRBlocks(const MCSubtargetInfo *STI, unsigned NumVGPRs, std::optional< bool > EnableWavefrontSize32)
Definition AMDGPUBaseInfo.cpp:1509

llvm::AMDGPU::IsaInfo::getOccupancyWithNumSGPRs
unsigned getOccupancyWithNumSGPRs(unsigned SGPRs, unsigned MaxWaves, AMDGPUSubtarget::Generation Gen)
Definition AMDGPUBaseInfo.cpp:1443

llvm::AMDGPU::IsaInfo::getAddressableNumArchVGPRs
unsigned getAddressableNumArchVGPRs(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1407

llvm::AMDGPU::IsaInfo::getTotalNumSGPRs
unsigned getTotalNumSGPRs(const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1262

llvm::AMDGPU::IsaInfo::getAddressableNumVGPRs
unsigned getAddressableNumVGPRs(const MCSubtargetInfo *STI, unsigned DynamicVGPRBlockSize)
Definition AMDGPUBaseInfo.cpp:1414

llvm::AMDGPU::MTBUFFormat::isValidUnifiedFormat
bool isValidUnifiedFormat(unsigned Id, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2331

llvm::AMDGPU::MTBUFFormat::getDefaultFormatEncoding
unsigned getDefaultFormatEncoding(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2356

llvm::AMDGPU::MTBUFFormat::getUnifiedFormatName
StringRef getUnifiedFormatName(unsigned Id, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2325

llvm::AMDGPU::MTBUFFormat::isValidNfmt
bool isValidNfmt(unsigned Id, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2297

llvm::AMDGPU::MTBUFFormat::isValidDfmtNfmt
bool isValidDfmtNfmt(unsigned Id, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2290

llvm::AMDGPU::MTBUFFormat::convertDfmtNfmt2Ufmt
int64_t convertDfmtNfmt2Ufmt(unsigned Dfmt, unsigned Nfmt, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2335

llvm::AMDGPU::MTBUFFormat::getDfmtName
StringRef getDfmtName(unsigned Id)
Definition AMDGPUBaseInfo.cpp:2263

llvm::AMDGPU::MTBUFFormat::encodeDfmtNfmt
int64_t encodeDfmtNfmt(unsigned Dfmt, unsigned Nfmt)
Definition AMDGPUBaseInfo.cpp:2301

llvm::AMDGPU::MTBUFFormat::getUnifiedFormat
int64_t getUnifiedFormat(const StringRef Name, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2310

llvm::AMDGPU::MTBUFFormat::isValidFormatEncoding
bool isValidFormatEncoding(unsigned Val, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2352

llvm::AMDGPU::MTBUFFormat::getNfmtName
StringRef getNfmtName(unsigned Id, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2285

llvm::AMDGPU::MTBUFFormat::getNfmt
int64_t getNfmt(const StringRef Name, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2276

llvm::AMDGPU::MTBUFFormat::getDfmt
int64_t getDfmt(const StringRef Name)
Definition AMDGPUBaseInfo.cpp:2255

llvm::AMDGPU::MTBUFFormat::decodeDfmtNfmt
void decodeDfmtNfmt(unsigned Format, unsigned &Dfmt, unsigned &Nfmt)
Definition AMDGPUBaseInfo.cpp:2305

llvm::AMDGPU::SendMsg
Definition SIDefines.h:433

llvm::AMDGPU::SendMsg::encodeMsg
uint64_t encodeMsg(uint64_t MsgId, uint64_t OpId, uint64_t StreamId)
Definition AMDGPUBaseInfo.cpp:2440

llvm::AMDGPU::SendMsg::StreamId
StreamId
Definition SIDefines.h:490

llvm::AMDGPU::SendMsg::msgSupportsStream
bool msgSupportsStream(int64_t MsgId, int64_t OpId, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2421

llvm::AMDGPU::SendMsg::decodeMsg
void decodeMsg(unsigned Val, uint16_t &MsgId, uint16_t &OpId, uint16_t &StreamId, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2428

llvm::AMDGPU::SendMsg::isValidMsgId
bool isValidMsgId(int64_t MsgId, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2374

llvm::AMDGPU::SendMsg::isValidMsgStream
bool isValidMsgStream(int64_t MsgId, int64_t OpId, int64_t StreamId, const MCSubtargetInfo &STI, bool Strict)
Definition AMDGPUBaseInfo.cpp:2395

llvm::AMDGPU::SendMsg::msgRequiresOp
bool msgRequiresOp(int64_t MsgId, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2415

llvm::AMDGPU::SendMsg::isValidMsgOp
bool isValidMsgOp(int64_t MsgId, int64_t OpId, const MCSubtargetInfo &STI, bool Strict)
Definition AMDGPUBaseInfo.cpp:2378

llvm::AMDGPU::VOPD
Definition AMDGPUBaseInfo.cpp:842

llvm::AMDGPU::VOPD::VOPD_VGPR_BANK_MASKS
constexpr unsigned VOPD_VGPR_BANK_MASKS[]
Definition AMDGPUBaseInfo.h:688

llvm::AMDGPU::VOPD::COMPONENTS_NUM
constexpr unsigned COMPONENTS_NUM
Definition AMDGPUBaseInfo.h:693

llvm::AMDGPU::VOPD::VOPD3_VGPR_BANK_MASKS
constexpr unsigned VOPD3_VGPR_BANK_MASKS[]
Definition AMDGPUBaseInfo.h:689

llvm::AMDGPU::VOPD::ComponentIndex
ComponentIndex
Definition AMDGPUBaseInfo.h:691

llvm::AMDGPU::VOPD::X
@ X
Definition AMDGPUBaseInfo.h:691

llvm::AMDGPU::VOPD::Y
@ Y
Definition AMDGPUBaseInfo.h:691

llvm::AMDGPU::VOPD::ComponentKind
ComponentKind
Definition AMDGPUBaseInfo.h:756

llvm::AMDGPU::VOPD::COMPONENT_X
@ COMPONENT_X
Definition AMDGPUBaseInfo.h:758

llvm::AMDGPU::VOPD::SINGLE
@ SINGLE
Definition AMDGPUBaseInfo.h:757

llvm::AMDGPU::VOPD::MAX
@ MAX
Definition AMDGPUBaseInfo.h:760

llvm::AMDGPU::VOPD::COMPONENT_Y
@ COMPONENT_Y
Definition AMDGPUBaseInfo.h:759

llvm::AMDGPU::VOPD::COMPONENTS
constexpr unsigned COMPONENTS[]
Definition AMDGPUBaseInfo.h:692

llvm::AMDGPU::VOPD::Component
Component
Definition AMDGPUBaseInfo.h:675

llvm::AMDGPU::VOPD::MAX_SRC_NUM
@ MAX_SRC_NUM
Definition AMDGPUBaseInfo.h:682

llvm::AMDGPU::VOPD::MAX_OPR_NUM
@ MAX_OPR_NUM
Definition AMDGPUBaseInfo.h:683

llvm::AMDGPU::VOPD::DST
@ DST
Definition AMDGPUBaseInfo.h:676

llvm::AMDGPU::VOPD::SRC2
@ SRC2
Definition AMDGPUBaseInfo.h:679

llvm::AMDGPU::VOPD::DST_NUM
@ DST_NUM
Definition AMDGPUBaseInfo.h:681

llvm::AMDGPU::VOPD::SRC1
@ SRC1
Definition AMDGPUBaseInfo.h:678

llvm::AMDGPU::VOPD::SRC0
@ SRC0
Definition AMDGPUBaseInfo.h:677

llvm::AMDGPU::isPackedFP32Inst
bool isPackedFP32Inst(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:3651

llvm::AMDGPU::isGCN3Encoding
bool isGCN3Encoding(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2608

llvm::AMDGPU::isInlinableLiteralBF16
bool isInlinableLiteralBF16(int16_t Literal, bool HasInv2Pi)
Definition AMDGPUBaseInfo.cpp:3040

llvm::AMDGPU::isGFX10_BEncoding
bool isGFX10_BEncoding(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2616

llvm::AMDGPU::getMIMGG16MappingInfo
LLVM_READONLY const MIMGG16MappingInfo * getMIMGG16MappingInfo(unsigned G)

llvm::AMDGPU::isInlineValue
bool isInlineValue(MCRegister Reg)
Definition AMDGPUBaseInfo.cpp:2764

llvm::AMDGPU::isGFX10_GFX11
bool isGFX10_GFX11(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2564

llvm::AMDGPU::isInlinableLiteralV216
bool isInlinableLiteralV216(uint32_t Literal, uint8_t OpType)
Definition AMDGPUBaseInfo.cpp:3172

llvm::AMDGPU::EncodingBit
EncodingField< Bit, Bit, D > EncodingBit
Definition AMDGPUBaseInfo.h:399

llvm::AMDGPU::getMIMGInfo
LLVM_READONLY const MIMGInfo * getMIMGInfo(unsigned Opc)

llvm::AMDGPU::decodeWaitcnt
void decodeWaitcnt(const IsaVersion &Version, unsigned Waitcnt, unsigned &Vmcnt, unsigned &Expcnt, unsigned &Lgkmcnt)
Decodes Vmcnt, Expcnt and Lgkmcnt from given Waitcnt for given isa Version, and writes decoded values...
Definition AMDGPUBaseInfo.cpp:1837

llvm::AMDGPU::isInlinableLiteralFP16
bool isInlinableLiteralFP16(int16_t Literal, bool HasInv2Pi)
Definition AMDGPUBaseInfo.cpp:3061

llvm::AMDGPU::isSGPR
bool isSGPR(MCRegister Reg, const MCRegisterInfo *TRI)
Is Reg - scalar register.
Definition AMDGPUBaseInfo.cpp:2663

llvm::AMDGPU::convertSMRDOffsetUnits
uint64_t convertSMRDOffsetUnits(const MCSubtargetInfo &ST, uint64_t ByteOffset)
Convert ByteOffset to dwords if the subtarget uses dword SMRD immediate offsets.
Definition AMDGPUBaseInfo.cpp:3323

llvm::AMDGPU::getMCReg
MCRegister getMCReg(MCRegister Reg, const MCSubtargetInfo &STI)
If Reg is a pseudo reg, return the correct hardware register given STI otherwise return Reg.
Definition AMDGPUBaseInfo.cpp:2737

llvm::AMDGPU::getMIMGOffsetMappingInfo
LLVM_READONLY const MIMGOffsetMappingInfo * getMIMGOffsetMappingInfo(unsigned Offset)

llvm::AMDGPU::isVOPCAsmOnly
bool isVOPCAsmOnly(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:563

llvm::AMDGPU::getMIMGOpcode
int getMIMGOpcode(unsigned BaseOpcode, unsigned MIMGEncoding, unsigned VDataDwords, unsigned VAddrDwords)
Definition AMDGPUBaseInfo.cpp:303

llvm::AMDGPU::getMTBUFHasSrsrc
bool getMTBUFHasSrsrc(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:488

llvm::AMDGPU::getSMRDEncodedLiteralOffset32
std::optional< int64_t > getSMRDEncodedLiteralOffset32(const MCSubtargetInfo &ST, int64_t ByteOffset)
Definition AMDGPUBaseInfo.cpp:3361

llvm::AMDGPU::getWMMAIsXDL
bool getWMMAIsXDL(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:575

llvm::AMDGPU::wmmaScaleF8F6F4FormatToNumRegs
uint8_t wmmaScaleF8F6F4FormatToNumRegs(unsigned Fmt)
Definition AMDGPUBaseInfo.cpp:604

llvm::AMDGPU::isGFX10Before1030
bool isGFX10Before1030(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2604

llvm::AMDGPU::isShader
LLVM_READNONE constexpr bool isShader(CallingConv::ID CC)
Definition AMDGPUBaseInfo.h:1468

llvm::AMDGPU::isSISrcInlinableOperand
bool isSISrcInlinableOperand(const MCInstrDesc &Desc, unsigned OpNo)
Does this operand support only inlinable literals?
Definition AMDGPUBaseInfo.cpp:2824

llvm::AMDGPU::mapWMMA2AddrTo3AddrOpcode
unsigned mapWMMA2AddrTo3AddrOpcode(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:792

llvm::AMDGPU::shouldEmitConstantsToTextSection
bool shouldEmitConstantsToTextSection(const Triple &TT)
Definition AMDGPUBaseInfo.cpp:1574

llvm::AMDGPU::isInlinableLiteralV2I16
bool isInlinableLiteralV2I16(uint32_t Literal)
Definition AMDGPUBaseInfo.cpp:3191

llvm::AMDGPU::isDPMACCInstruction
bool isDPMACCInstruction(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:787

llvm::AMDGPU::getMTBUFElements
int getMTBUFElements(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:478

llvm::AMDGPU::isHi16Reg
bool isHi16Reg(MCRegister Reg, const MCRegisterInfo &MRI)
Definition AMDGPUBaseInfo.cpp:2670

llvm::AMDGPU::getTemporalHintType
unsigned getTemporalHintType(const MCInstrDesc TID)
Definition AMDGPUBaseInfo.cpp:755

llvm::AMDGPU::getTotalNumVGPRs
int32_t getTotalNumVGPRs(bool has90AInsts, int32_t ArgNumAGPR, int32_t ArgNumVGPR)
Definition AMDGPUBaseInfo.cpp:2656

llvm::AMDGPU::isGFX10
bool isGFX10(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2560

llvm::AMDGPU::isInlinableLiteralV2BF16
bool isInlinableLiteralV2BF16(uint32_t Literal)
Definition AMDGPUBaseInfo.cpp:3196

llvm::AMDGPU::getMaxNumUserSGPRs
unsigned getMaxNumUserSGPRs(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2516

llvm::AMDGPU::getFPDstSelType
FPType getFPDstSelType(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:775

llvm::AMDGPU::getNumFlatOffsetBits
unsigned getNumFlatOffsetBits(const MCSubtargetInfo &ST)
For pre-GFX12 FLAT instructions the offset must be positive; MSB is ignored and forced to zero.
Definition AMDGPUBaseInfo.cpp:3371

llvm::AMDGPU::AMDHSA_COV4
@ AMDHSA_COV4
Definition AMDGPUBaseInfo.h:61

llvm::AMDGPU::AMDHSA_COV5
@ AMDHSA_COV5
Definition AMDGPUBaseInfo.h:61

llvm::AMDGPU::AMDHSA_COV6
@ AMDHSA_COV6
Definition AMDGPUBaseInfo.h:61

llvm::AMDGPU::hasA16
bool hasA16(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2488

llvm::AMDGPU::isLegalSMRDEncodedSignedOffset
bool isLegalSMRDEncodedSignedOffset(const MCSubtargetInfo &ST, int64_t EncodedOffset, bool IsBuffer)
Definition AMDGPUBaseInfo.cpp:3308

llvm::AMDGPU::isGFX12Plus
bool isGFX12Plus(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2584

llvm::AMDGPU::getNSAMaxSize
unsigned getNSAMaxSize(const MCSubtargetInfo &STI, bool HasSampler)
Definition AMDGPUBaseInfo.cpp:2505

llvm::AMDGPU::getVGPRPhysRegClass
const MCRegisterClass * getVGPRPhysRegClass(MCRegister Reg, const MCRegisterInfo &MRI)
Definition AMDGPUBaseInfo.cpp:3428

llvm::AMDGPU::isModuleEntryFunctionCC
LLVM_READNONE constexpr bool isModuleEntryFunctionCC(CallingConv::ID CC)
Definition AMDGPUBaseInfo.h:1532

llvm::AMDGPU::getIntegerAttribute
int getIntegerAttribute(const Function &F, StringRef Name, int Default)

llvm::AMDGPU::hasPackedD16
bool hasPackedD16(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2496

llvm::AMDGPU::getStorecntBitMask
unsigned getStorecntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1784

llvm::AMDGPU::getLdsDwGranularity
unsigned getLdsDwGranularity(const MCSubtargetInfo &ST)
Definition AMDGPUBaseInfo.cpp:3639

llvm::AMDGPU::isGFX940
bool isGFX940(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2632

llvm::AMDGPU::isInlinableLiteralV2F16
bool isInlinableLiteralV2F16(uint32_t Literal)
Definition AMDGPUBaseInfo.cpp:3201

llvm::AMDGPU::isHsaAbi
bool isHsaAbi(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:198

llvm::AMDGPU::isGFX11
bool isGFX11(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2572

llvm::AMDGPU::getSMEMIsBuffer
bool getSMEMIsBuffer(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:539

llvm::AMDGPU::isGFX10_3_GFX11
bool isGFX10_3_GFX11(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2624

llvm::AMDGPU::hasValueInRangeLikeMetadata
bool hasValueInRangeLikeMetadata(const MDNode &MD, int64_t Val)
Checks if Val is inside MD, a !range-like metadata.
Definition AMDGPUBaseInfo.cpp:1699

llvm::AMDGPU::isInvalidSingleUseProducerInst
LLVM_READONLY bool isInvalidSingleUseProducerInst(unsigned Opc)

llvm::AMDGPU::None
@ None
Definition AMDGPURegBankLegalizeRules.h:131

llvm::AMDGPU::Imm
@ Imm
Definition AMDGPURegBankLegalizeRules.h:133

llvm::AMDGPU::mfmaScaleF8F6F4FormatToNumRegs
uint8_t mfmaScaleF8F6F4FormatToNumRegs(unsigned EncodingVal)
Definition AMDGPUBaseInfo.cpp:580

llvm::AMDGPU::isInvalidSingleUseConsumerInst
LLVM_READONLY bool isInvalidSingleUseConsumerInst(unsigned Opc)

llvm::AMDGPU::getVOPDOpcode
unsigned getVOPDOpcode(unsigned Opc, bool VOPD3)
Definition AMDGPUBaseInfo.cpp:655

llvm::AMDGPU::isGroupSegment
bool isGroupSegment(const GlobalValue *GV)
Definition AMDGPUBaseInfo.cpp:1560

llvm::AMDGPU::getMIMGMIPMappingInfo
LLVM_READONLY const MIMGMIPMappingInfo * getMIMGMIPMappingInfo(unsigned MIP)

llvm::AMDGPU::getMTBUFHasSoffset
bool getMTBUFHasSoffset(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:493

llvm::AMDGPU::hasXNACK
bool hasXNACK(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2475

llvm::AMDGPU::isValid32BitLiteral
bool isValid32BitLiteral(uint64_t Val, bool IsFP64)
Definition AMDGPUBaseInfo.cpp:3205

llvm::AMDGPU::getCanBeVOPD
CanBeVOPD getCanBeVOPD(unsigned Opc, unsigned EncodingFamily, bool VOPD3)
Definition AMDGPUBaseInfo.cpp:637

llvm::AMDGPU::encodeWaitcnt
unsigned encodeWaitcnt(const IsaVersion &Version, unsigned Vmcnt, unsigned Expcnt, unsigned Lgkmcnt)
Encodes Vmcnt, Expcnt and Lgkmcnt into Waitcnt for given isa Version.
Definition AMDGPUBaseInfo.cpp:1873

llvm::AMDGPU::isLegalDPALU_DPPControl
LLVM_READNONE bool isLegalDPALU_DPPControl(const MCSubtargetInfo &ST, unsigned DC)
Definition AMDGPUBaseInfo.h:1812

llvm::AMDGPU::isVOPC64DPP
bool isVOPC64DPP(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:559

llvm::AMDGPU::getMUBUFOpcode
int getMUBUFOpcode(unsigned BaseOpc, unsigned Elements)
Definition AMDGPUBaseInfo.cpp:503

llvm::AMDGPU::getMAIIsGFX940XDL
bool getMAIIsGFX940XDL(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:570

llvm::AMDGPU::isSI
bool isSI(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2522

llvm::AMDGPU::getDefaultAMDHSACodeObjectVersion
unsigned getDefaultAMDHSACodeObjectVersion()
Definition AMDGPUBaseInfo.cpp:211

llvm::AMDGPU::isReadOnlySegment
bool isReadOnlySegment(const GlobalValue *GV)
Definition AMDGPUBaseInfo.cpp:1568

llvm::AMDGPU::isArgPassedInSGPR
bool isArgPassedInSGPR(const Argument *A)
Definition AMDGPUBaseInfo.cpp:3240

llvm::AMDGPU::mayTailCallThisCC
LLVM_READNONE constexpr bool mayTailCallThisCC(CallingConv::ID CC)
Return true if we might ever do TCO for calls with this calling convention.
Definition AMDGPUBaseInfo.h:1561

llvm::AMDGPU::isIntrinsicAlwaysUniform
bool isIntrinsicAlwaysUniform(unsigned IntrID)
Definition AMDGPUBaseInfo.cpp:3406

llvm::AMDGPU::getMUBUFBaseOpcode
int getMUBUFBaseOpcode(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:498

llvm::AMDGPU::getAMDHSACodeObjectVersion
unsigned getAMDHSACodeObjectVersion(const Module &M)
Definition AMDGPUBaseInfo.cpp:202

llvm::AMDGPU::decodeLgkmcnt
unsigned decodeLgkmcnt(const IsaVersion &Version, unsigned Waitcnt)
Definition AMDGPUBaseInfo.cpp:1832

llvm::AMDGPU::getWaitcntBitMask
unsigned getWaitcntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1807

llvm::AMDGPU::hasNamedOperand
LLVM_READONLY bool hasNamedOperand(uint64_t Opcode, OpName NamedIdx)
Definition AMDGPUBaseInfo.h:414

llvm::AMDGPU::getVOP3IsSingle
bool getVOP3IsSingle(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:554

llvm::AMDGPU::isGFX9
bool isGFX9(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2534

llvm::AMDGPU::isDPALU_DPP32BitOpc
bool isDPALU_DPP32BitOpc(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:3608

llvm::AMDGPU::getVOP1IsSingle
bool getVOP1IsSingle(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:544

llvm::AMDGPU::getVOPDEncodingFamily
unsigned getVOPDEncodingFamily(const MCSubtargetInfo &ST)
Definition AMDGPUBaseInfo.cpp:627

llvm::AMDGPU::isGFX10_AEncoding
bool isGFX10_AEncoding(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2612

llvm::AMDGPU::isKImmOperand
bool isKImmOperand(const MCInstrDesc &Desc, unsigned OpNo)
Is this a KImm operand?
Definition AMDGPUBaseInfo.cpp:2795

llvm::AMDGPU::getHasColorExport
bool getHasColorExport(const Function &F)
Definition AMDGPUBaseInfo.cpp:2454

llvm::AMDGPU::getMTBUFBaseOpcode
int getMTBUFBaseOpcode(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:467

llvm::AMDGPU::isGFX90A
bool isGFX90A(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2628

llvm::AMDGPU::getSamplecntBitMask
unsigned getSamplecntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1756

llvm::AMDGPU::getDefaultQueueImplicitArgPosition
unsigned getDefaultQueueImplicitArgPosition(unsigned CodeObjectVersion)
Definition AMDGPUBaseInfo.cpp:269

llvm::AMDGPU::parseAsmPhysRegName
std::tuple< char, unsigned, unsigned > parseAsmPhysRegName(StringRef RegName)
Returns a valid charcode or 0 in the first entry if this is a valid physical register name.
Definition AMDGPUBaseInfo.cpp:1582

llvm::AMDGPU::hasSRAMECC
bool hasSRAMECC(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2479

llvm::AMDGPU::getHasDepthExport
bool getHasDepthExport(const Function &F)
Definition AMDGPUBaseInfo.cpp:2461

llvm::AMDGPU::isGFX8_GFX9_GFX10
bool isGFX8_GFX9_GFX10(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2546

llvm::AMDGPU::isKernel
LLVM_READNONE constexpr bool isKernel(CallingConv::ID CC)
Definition AMDGPUBaseInfo.h:1542

llvm::AMDGPU::getMUBUFHasVAddr
bool getMUBUFHasVAddr(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:514

llvm::AMDGPU::isTrue16Inst
bool isTrue16Inst(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:770

llvm::AMDGPU::isEntryFunctionCC
LLVM_READNONE constexpr bool isEntryFunctionCC(CallingConv::ID CC)
Definition AMDGPUBaseInfo.h:1497

llvm::AMDGPU::getVGPREncodingMSBs
unsigned getVGPREncodingMSBs(MCRegister Reg, const MCRegisterInfo &MRI)
Definition AMDGPUBaseInfo.cpp:3449

llvm::AMDGPU::getVOPDComponents
std::pair< unsigned, unsigned > getVOPDComponents(unsigned VOPDOpcode)
Definition AMDGPUBaseInfo.cpp:833

llvm::AMDGPU::getMIMGDimInfoByEncoding
LLVM_READONLY const MIMGDimInfo * getMIMGDimInfoByEncoding(uint8_t DimEnc)

llvm::AMDGPU::isInlinableLiteral32
bool isInlinableLiteral32(int32_t Literal, bool HasInv2Pi)
Definition AMDGPUBaseInfo.cpp:3014

llvm::AMDGPU::isCompute
LLVM_READNONE constexpr bool isCompute(CallingConv::ID CC)
Definition AMDGPUBaseInfo.h:1492

llvm::AMDGPU::isGFX12
bool isGFX12(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2580

llvm::AMDGPU::getInitialPSInputAddr
unsigned getInitialPSInputAddr(const Function &F)
Definition AMDGPUBaseInfo.cpp:2450

llvm::AMDGPU::encodeExpcnt
unsigned encodeExpcnt(const IsaVersion &Version, unsigned Waitcnt, unsigned Expcnt)
Definition AMDGPUBaseInfo.cpp:1861

llvm::AMDGPU::isAsyncStore
bool isAsyncStore(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:739

llvm::AMDGPU::getDynamicVGPRBlockSize
unsigned getDynamicVGPRBlockSize(const Function &F)
Definition AMDGPUBaseInfo.cpp:2465

llvm::AMDGPU::isLegalSMRDImmOffset
bool isLegalSMRDImmOffset(const MCSubtargetInfo &ST, int64_t ByteOffset)

llvm::AMDGPU::getKmcntBitMask
unsigned getKmcntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1776

llvm::AMDGPU::getVGPRWithMSBs
MCRegister getVGPRWithMSBs(MCRegister Reg, unsigned MSBs, const MCRegisterInfo &MRI)
If Reg is a low VGPR return a corresponding high VGPR with MSBs set.
Definition AMDGPUBaseInfo.cpp:3455

llvm::AMDGPU::getVmcntBitMask
unsigned getVmcntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1746

llvm::AMDGPU::FPType
FPType
Definition AMDGPUBaseInfo.h:63

llvm::AMDGPU::FPType::FP4
@ FP4
Definition AMDGPUBaseInfo.h:63

llvm::AMDGPU::FPType::FP8
@ FP8
Definition AMDGPUBaseInfo.h:63

llvm::AMDGPU::isNotGFX10Plus
bool isNotGFX10Plus(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2600

llvm::AMDGPU::hasMAIInsts
bool hasMAIInsts(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2640

llvm::AMDGPU::getBitOp2
unsigned getBitOp2(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:809

llvm::AMDGPU::isIntrinsicSourceOfDivergence
bool isIntrinsicSourceOfDivergence(unsigned IntrID)
Definition AMDGPUBaseInfo.cpp:3402

llvm::AMDGPU::isSISrcOperand
constexpr bool isSISrcOperand(const MCOperandInfo &OpInfo)
Is this an AMDGPU specific source operand?
Definition AMDGPUBaseInfo.h:1644

llvm::AMDGPU::getXcntBitMask
unsigned getXcntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1780

llvm::AMDGPU::isGenericAtomic
bool isGenericAtomic(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:717

llvm::AMDGPU::getWMMA_F8F6F4_WithFormatArgs
const MFMA_F8F6F4_Info * getWMMA_F8F6F4_WithFormatArgs(unsigned FmtA, unsigned FmtB, unsigned F8F8Opcode)
Definition AMDGPUBaseInfo.cpp:619

llvm::AMDGPU::decodeStorecntDscnt
Waitcnt decodeStorecntDscnt(const IsaVersion &Version, unsigned StorecntDscnt)
Definition AMDGPUBaseInfo.cpp:1910

llvm::AMDGPU::isGFX8Plus
bool isGFX8Plus(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2550

llvm::AMDGPU::isInlinableIntLiteral
LLVM_READNONE bool isInlinableIntLiteral(int64_t Literal)
Is this literal inlinable, and not one of the values intended for floating point values.
Definition AMDGPUBaseInfo.h:1720

llvm::AMDGPU::getLgkmcntBitMask
unsigned getLgkmcntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1768

llvm::AMDGPU::getMUBUFTfe
bool getMUBUFTfe(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:534

llvm::AMDGPU::getMIMGBiasMappingInfo
LLVM_READONLY const MIMGBiasMappingInfo * getMIMGBiasMappingInfo(unsigned Bias)

llvm::AMDGPU::getBvhcntBitMask
unsigned getBvhcntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1760

llvm::AMDGPU::hasSMRDSignedImmOffset
bool hasSMRDSignedImmOffset(const MCSubtargetInfo &ST)
Definition AMDGPUBaseInfo.cpp:193

llvm::AMDGPU::getMIMGDimInfoByAsmSuffix
LLVM_READONLY const MIMGDimInfo * getMIMGDimInfoByAsmSuffix(StringRef AsmSuffix)

llvm::AMDGPU::hasMIMG_R128
bool hasMIMG_R128(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2483

llvm::AMDGPU::hasGFX10_3Insts
bool hasGFX10_3Insts(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2620

llvm::AMDGPU::getVGPRLoweringOperandTables
std::pair< const AMDGPU::OpName *, const AMDGPU::OpName * > getVGPRLoweringOperandTables(const MCInstrDesc &Desc)
Definition AMDGPUBaseInfo.cpp:3478

llvm::AMDGPU::hasG16
bool hasG16(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2492

llvm::AMDGPU::getAddrSizeMIMGOp
unsigned getAddrSizeMIMGOp(const MIMGBaseOpcodeInfo *BaseOpcode, const MIMGDimInfo *Dim, bool IsA16, bool IsG16Supported)
Definition AMDGPUBaseInfo.cpp:323

llvm::AMDGPU::getMTBUFOpcode
int getMTBUFOpcode(unsigned BaseOpc, unsigned Elements)
Definition AMDGPUBaseInfo.cpp:472

llvm::AMDGPU::getExpcntBitMask
unsigned getExpcntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1764

llvm::AMDGPU::hasArchitectedFlatScratch
bool hasArchitectedFlatScratch(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2636

llvm::AMDGPU::getMUBUFHasSoffset
bool getMUBUFHasSoffset(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:524

llvm::AMDGPU::isNotGFX11Plus
bool isNotGFX11Plus(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2598

llvm::AMDGPU::isGFX11Plus
bool isGFX11Plus(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2576

llvm::AMDGPU::getInlineEncodingV2F16
std::optional< unsigned > getInlineEncodingV2F16(uint32_t Literal)
Definition AMDGPUBaseInfo.cpp:3167

llvm::AMDGPU::isSISrcFPOperand
bool isSISrcFPOperand(const MCInstrDesc &Desc, unsigned OpNo)
Is this a floating-point operand?
Definition AMDGPUBaseInfo.cpp:2802

llvm::AMDGPU::parseAsmConstraintPhysReg
std::tuple< char, unsigned, unsigned > parseAsmConstraintPhysReg(StringRef Constraint)
Returns a valid charcode or 0 in the first entry if this is a valid physical register constraint.
Definition AMDGPUBaseInfo.cpp:1610

llvm::AMDGPU::getHostcallImplicitArgPosition
unsigned getHostcallImplicitArgPosition(unsigned CodeObjectVersion)
Definition AMDGPUBaseInfo.cpp:258

llvm::AMDGPU::isGFX10Plus
bool isGFX10Plus(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2568

llvm::AMDGPU::getSMRDEncodedOffset
std::optional< int64_t > getSMRDEncodedOffset(const MCSubtargetInfo &ST, int64_t ByteOffset, bool IsBuffer, bool HasSOffset)
Definition AMDGPUBaseInfo.cpp:3332

llvm::AMDGPU::isGlobalSegment
bool isGlobalSegment(const GlobalValue *GV)
Definition AMDGPUBaseInfo.cpp:1564

llvm::AMDGPU::encode32BitLiteral
int64_t encode32BitLiteral(int64_t Imm, OperandType Type, bool IsLit)
Definition AMDGPUBaseInfo.cpp:3212

llvm::AMDGPU::OperandType
OperandType
Definition SIDefines.h:199

llvm::AMDGPU::OPERAND_KIMM32
@ OPERAND_KIMM32
Operand with 32-bit immediate that uses the constant bus.
Definition SIDefines.h:231

llvm::AMDGPU::OPERAND_REG_IMM_INT64
@ OPERAND_REG_IMM_INT64
Definition SIDefines.h:202

llvm::AMDGPU::OPERAND_REG_IMM_V2FP16
@ OPERAND_REG_IMM_V2FP16
Definition SIDefines.h:209

llvm::AMDGPU::OPERAND_REG_INLINE_C_FP64
@ OPERAND_REG_INLINE_C_FP64
Definition SIDefines.h:222

llvm::AMDGPU::OPERAND_REG_INLINE_C_BF16
@ OPERAND_REG_INLINE_C_BF16
Definition SIDefines.h:219

llvm::AMDGPU::OPERAND_REG_INLINE_C_V2BF16
@ OPERAND_REG_INLINE_C_V2BF16
Definition SIDefines.h:224

llvm::AMDGPU::OPERAND_REG_IMM_V2INT16
@ OPERAND_REG_IMM_V2INT16
Definition SIDefines.h:210

llvm::AMDGPU::OPERAND_REG_IMM_BF16
@ OPERAND_REG_IMM_BF16
Definition SIDefines.h:206

llvm::AMDGPU::OPERAND_REG_IMM_INT32
@ OPERAND_REG_IMM_INT32
Operands with register, 32-bit, or 64-bit immediate.
Definition SIDefines.h:201

llvm::AMDGPU::OPERAND_SRC_FIRST
@ OPERAND_SRC_FIRST
Definition SIDefines.h:259

llvm::AMDGPU::OPERAND_REG_IMM_V2BF16
@ OPERAND_REG_IMM_V2BF16
Definition SIDefines.h:208

llvm::AMDGPU::OPERAND_REG_IMM_FP16
@ OPERAND_REG_IMM_FP16
Definition SIDefines.h:207

llvm::AMDGPU::OPERAND_REG_INLINE_C_INT64
@ OPERAND_REG_INLINE_C_INT64
Definition SIDefines.h:218

llvm::AMDGPU::OPERAND_KIMM64
@ OPERAND_KIMM64
Definition SIDefines.h:233

llvm::AMDGPU::OPERAND_KIMM16
@ OPERAND_KIMM16
Definition SIDefines.h:232

llvm::AMDGPU::OPERAND_REG_INLINE_C_INT16
@ OPERAND_REG_INLINE_C_INT16
Operands with register or inline constant.
Definition SIDefines.h:216

llvm::AMDGPU::OPERAND_REG_IMM_NOINLINE_V2FP16
@ OPERAND_REG_IMM_NOINLINE_V2FP16
Definition SIDefines.h:211

llvm::AMDGPU::OPERAND_REG_IMM_FP64
@ OPERAND_REG_IMM_FP64
Definition SIDefines.h:205

llvm::AMDGPU::OPERAND_REG_INLINE_C_V2FP16
@ OPERAND_REG_INLINE_C_V2FP16
Definition SIDefines.h:225

llvm::AMDGPU::OPERAND_REG_INLINE_AC_INT32
@ OPERAND_REG_INLINE_AC_INT32
Operands with an AccVGPR register or inline constant.
Definition SIDefines.h:236

llvm::AMDGPU::OPERAND_REG_INLINE_AC_FP32
@ OPERAND_REG_INLINE_AC_FP32
Definition SIDefines.h:237

llvm::AMDGPU::OPERAND_REG_IMM_V2INT32
@ OPERAND_REG_IMM_V2INT32
Definition SIDefines.h:212

llvm::AMDGPU::OPERAND_REG_IMM_FP32
@ OPERAND_REG_IMM_FP32
Definition SIDefines.h:204

llvm::AMDGPU::OPERAND_REG_INLINE_C_FP32
@ OPERAND_REG_INLINE_C_FP32
Definition SIDefines.h:221

llvm::AMDGPU::OPERAND_REG_INLINE_C_INT32
@ OPERAND_REG_INLINE_C_INT32
Definition SIDefines.h:217

llvm::AMDGPU::OPERAND_REG_INLINE_C_V2INT16
@ OPERAND_REG_INLINE_C_V2INT16
Definition SIDefines.h:223

llvm::AMDGPU::OPERAND_REG_IMM_V2FP32
@ OPERAND_REG_IMM_V2FP32
Definition SIDefines.h:213

llvm::AMDGPU::OPERAND_REG_INLINE_AC_FP64
@ OPERAND_REG_INLINE_AC_FP64
Definition SIDefines.h:238

llvm::AMDGPU::OPERAND_REG_INLINE_C_FP16
@ OPERAND_REG_INLINE_C_FP16
Definition SIDefines.h:220

llvm::AMDGPU::OPERAND_REG_IMM_INT16
@ OPERAND_REG_IMM_INT16
Definition SIDefines.h:203

llvm::AMDGPU::OPERAND_INLINE_SPLIT_BARRIER_INT32
@ OPERAND_INLINE_SPLIT_BARRIER_INT32
Definition SIDefines.h:228

llvm::AMDGPU::OPERAND_SRC_LAST
@ OPERAND_SRC_LAST
Definition SIDefines.h:260

llvm::AMDGPU::initDefaultAMDKernelCodeT
void initDefaultAMDKernelCodeT(AMDGPUMCKernelCodeT &KernelCode, const MCSubtargetInfo *STI)
Definition AMDGPUBaseInfo.cpp:1526

llvm::AMDGPU::isNotGFX9Plus
bool isNotGFX9Plus(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2558

llvm::AMDGPU::getMIMGLZMappingInfo
LLVM_READONLY const MIMGLZMappingInfo * getMIMGLZMappingInfo(unsigned L)

llvm::AMDGPU::isDPALU_DPP
bool isDPALU_DPP(const MCInstrDesc &OpDesc, const MCInstrInfo &MII, const MCSubtargetInfo &ST)
Definition AMDGPUBaseInfo.cpp:3628

llvm::AMDGPU::hasGDS
bool hasGDS(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2501

llvm::AMDGPU::isLegalSMRDEncodedUnsignedOffset
bool isLegalSMRDEncodedUnsignedOffset(const MCSubtargetInfo &ST, int64_t EncodedOffset)
Definition AMDGPUBaseInfo.cpp:3299

llvm::AMDGPU::isGFX9Plus
bool isGFX9Plus(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2554

llvm::AMDGPU::hasDPPSrc1SGPR
bool hasDPPSrc1SGPR(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2648

llvm::AMDGPU::isVOPD
bool isVOPD(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:662

llvm::AMDGPU::getVOPDInstInfo
VOPD::InstInfo getVOPDInstInfo(const MCInstrDesc &OpX, const MCInstrDesc &OpY)
Definition AMDGPUBaseInfo.cpp:1003

llvm::AMDGPU::encodeVmcnt
unsigned encodeVmcnt(const IsaVersion &Version, unsigned Waitcnt, unsigned Vmcnt)
Definition AMDGPUBaseInfo.cpp:1852

llvm::AMDGPU::decodeExpcnt
unsigned decodeExpcnt(const IsaVersion &Version, unsigned Waitcnt)
Definition AMDGPUBaseInfo.cpp:1827

llvm::AMDGPU::isCvt_F32_Fp8_Bf8_e64
bool isCvt_F32_Fp8_Bf8_e64(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:704

llvm::AMDGPU::decodeLoadcntDscnt
Waitcnt decodeLoadcntDscnt(const IsaVersion &Version, unsigned LoadcntDscnt)
Definition AMDGPUBaseInfo.cpp:1900

llvm::AMDGPU::getInlineEncodingV2I16
std::optional< unsigned > getInlineEncodingV2I16(uint32_t Literal)
Definition AMDGPUBaseInfo.cpp:3133

llvm::AMDGPU::getRegBitWidth
unsigned getRegBitWidth(const TargetRegisterClass &RC)
Get the size in bits of a register from the register class RC.
Definition SIRegisterInfo.cpp:3327

llvm::AMDGPU::encodeStorecntDscnt
static unsigned encodeStorecntDscnt(const IsaVersion &Version, unsigned Storecnt, unsigned Dscnt)
Definition AMDGPUBaseInfo.cpp:1950

llvm::AMDGPU::isGFX1250
bool isGFX1250(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2588

llvm::AMDGPU::supportsWave32
bool supportsWave32(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.h:1617

llvm::AMDGPU::getMCOpcode
int getMCOpcode(uint16_t Opcode, unsigned Gen)
Definition AMDGPUBaseInfo.cpp:805

llvm::AMDGPU::getMIMGBaseOpcode
const MIMGBaseOpcodeInfo * getMIMGBaseOpcode(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:310

llvm::AMDGPU::isVI
bool isVI(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2530

llvm::AMDGPU::isTensorStore
bool isTensorStore(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:750

llvm::AMDGPU::getMIMGDimInfo
LLVM_READONLY const MIMGDimInfo * getMIMGDimInfo(unsigned DimEnum)

llvm::AMDGPU::getMUBUFIsBufferInv
bool getMUBUFIsBufferInv(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:529

llvm::AMDGPU::supportsScaleOffset
bool supportsScaleOffset(const MCInstrInfo &MII, unsigned Opcode)
Definition AMDGPUBaseInfo.cpp:3571

llvm::AMDGPU::mc2PseudoReg
MCRegister mc2PseudoReg(MCRegister Reg)
Convert hardware register Reg to a pseudo register.
Definition AMDGPUBaseInfo.cpp:2762

llvm::AMDGPU::getInlineEncodingV2BF16
std::optional< unsigned > getInlineEncodingV2BF16(uint32_t Literal)
Definition AMDGPUBaseInfo.cpp:3139

llvm::AMDGPU::hasKernargPreload
unsigned hasKernargPreload(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2652

llvm::AMDGPU::supportsWGP
bool supportsWGP(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2592

llvm::AMDGPU::hasDynamicVGPR
bool hasDynamicVGPR(const Function &F)

llvm::AMDGPU::isMAC
bool isMAC(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:666

llvm::AMDGPU::getOperandSize
LLVM_READNONE unsigned getOperandSize(const MCOperandInfo &OpInfo)
Definition AMDGPUBaseInfo.h:1669

llvm::AMDGPU::isCI
bool isCI(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2526

llvm::AMDGPU::encodeLgkmcnt
unsigned encodeLgkmcnt(const IsaVersion &Version, unsigned Waitcnt, unsigned Lgkmcnt)
Definition AMDGPUBaseInfo.cpp:1867

llvm::AMDGPU::getVOP2IsSingle
bool getVOP2IsSingle(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:549

llvm::AMDGPU::getMAIIsDGEMM
bool getMAIIsDGEMM(unsigned Opc)
Returns true if MAI operation is a double precision GEMM.
Definition AMDGPUBaseInfo.cpp:565

llvm::AMDGPU::getMIMGBaseOpcodeInfo
LLVM_READONLY const MIMGBaseOpcodeInfo * getMIMGBaseOpcodeInfo(unsigned BaseOpcode)

llvm::AMDGPU::getCompletionActionImplicitArgPosition
unsigned getCompletionActionImplicitArgPosition(unsigned CodeObjectVersion)
Definition AMDGPUBaseInfo.cpp:280

llvm::AMDGPU::getIntegerVecAttribute
SmallVector< unsigned > getIntegerVecAttribute(const Function &F, StringRef Name, unsigned Size, unsigned DefaultVal)
Definition AMDGPUBaseInfo.cpp:1653

llvm::AMDGPU::isChainCC
LLVM_READNONE constexpr bool isChainCC(CallingConv::ID CC)
Definition AMDGPUBaseInfo.h:1515

llvm::AMDGPU::getMaskedMIMGOp
int getMaskedMIMGOp(unsigned Opc, unsigned NewChannels)
Definition AMDGPUBaseInfo.cpp:315

llvm::AMDGPU::isNotGFX12Plus
bool isNotGFX12Plus(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2586

llvm::AMDGPU::getMTBUFHasVAddr
bool getMTBUFHasVAddr(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:483

llvm::AMDGPU::decodeVmcnt
unsigned decodeVmcnt(const IsaVersion &Version, unsigned Waitcnt)
Definition AMDGPUBaseInfo.cpp:1819

llvm::AMDGPU::getELFABIVersion
uint8_t getELFABIVersion(const Triple &T, unsigned CodeObjectVersion)
Definition AMDGPUBaseInfo.cpp:228

llvm::AMDGPU::getIntegerPairAttribute
std::pair< unsigned, unsigned > getIntegerPairAttribute(const Function &F, StringRef Name, std::pair< unsigned, unsigned > Default, bool OnlyFirstRequired)
Definition AMDGPUBaseInfo.cpp:1618

llvm::AMDGPU::getLoadcntBitMask
unsigned getLoadcntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1752

llvm::AMDGPU::isInlinableLiteralI16
bool isInlinableLiteralI16(int32_t Literal, bool HasInv2Pi)
Definition AMDGPUBaseInfo.cpp:3057

llvm::AMDGPU::hasVOPD
bool hasVOPD(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2644

llvm::AMDGPU::canGuaranteeTCO
LLVM_READNONE constexpr bool canGuaranteeTCO(CallingConv::ID CC)
Definition AMDGPUBaseInfo.h:1555

llvm::AMDGPU::isGraphics
LLVM_READNONE constexpr bool isGraphics(CallingConv::ID CC)
Definition AMDGPUBaseInfo.h:1486

llvm::AMDGPU::getVOPDFull
int getVOPDFull(unsigned OpX, unsigned OpY, unsigned EncodingFamily, bool VOPD3)
Definition AMDGPUBaseInfo.cpp:824

llvm::AMDGPU::isInlinableLiteral64
bool isInlinableLiteral64(int64_t Literal, bool HasInv2Pi)
Is this literal inlinable.
Definition AMDGPUBaseInfo.cpp:2997

llvm::AMDGPU::getMFMA_F8F6F4_WithFormatArgs
const MFMA_F8F6F4_Info * getMFMA_F8F6F4_WithFormatArgs(unsigned CBSZ, unsigned BLGP, unsigned F8F8Opcode)
Definition AMDGPUBaseInfo.cpp:596

llvm::AMDGPU::getMultigridSyncArgImplicitArgPosition
unsigned getMultigridSyncArgImplicitArgPosition(unsigned CodeObjectVersion)
Definition AMDGPUBaseInfo.cpp:245

llvm::AMDGPU::isGFX9_GFX10_GFX11
bool isGFX9_GFX10_GFX11(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2542

llvm::AMDGPU::isGFX9_GFX10
bool isGFX9_GFX10(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2538

llvm::AMDGPU::getMUBUFElements
int getMUBUFElements(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:509

llvm::AMDGPU::encodeLoadcntDscnt
static unsigned encodeLoadcntDscnt(const IsaVersion &Version, unsigned Loadcnt, unsigned Dscnt)
Definition AMDGPUBaseInfo.cpp:1938

llvm::AMDGPU::getGcnBufferFormatInfo
const GcnBufferFormatInfo * getGcnBufferFormatInfo(uint8_t BitsPerComp, uint8_t NumComponents, uint8_t NumFormat, const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:3410

llvm::AMDGPU::mapWMMA3AddrTo2AddrOpcode
unsigned mapWMMA3AddrTo2AddrOpcode(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:797

llvm::AMDGPU::isPermlane16
bool isPermlane16(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:693

llvm::AMDGPU::getSOPPWithRelaxation
LLVM_READONLY int getSOPPWithRelaxation(uint16_t Opcode)

llvm::AMDGPU::getMUBUFHasSrsrc
bool getMUBUFHasSrsrc(unsigned Opc)
Definition AMDGPUBaseInfo.cpp:519

llvm::AMDGPU::getDscntBitMask
unsigned getDscntBitMask(const IsaVersion &Version)
Definition AMDGPUBaseInfo.cpp:1772

llvm::AMDGPU::hasAny64BitVGPROperands
bool hasAny64BitVGPROperands(const MCInstrDesc &OpDesc, const MCInstrInfo &MII, const MCSubtargetInfo &ST)
Definition AMDGPUBaseInfo.cpp:3590

llvm::CallingConv::ID
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
Definition CallingConv.h:24

llvm::CallingConv::AMDGPU_CS
@ AMDGPU_CS
Used for Mesa/AMDPAL compute shaders.
Definition CallingConv.h:197

llvm::CallingConv::AMDGPU_VS
@ AMDGPU_VS
Used for Mesa vertex shaders, or AMDPAL last shader stage before rasterization (vertex shader if tess...
Definition CallingConv.h:188

llvm::CallingConv::AMDGPU_KERNEL
@ AMDGPU_KERNEL
Used for AMDGPU code object kernels.
Definition CallingConv.h:200

llvm::CallingConv::AMDGPU_Gfx
@ AMDGPU_Gfx
Used for AMD graphics targets.
Definition CallingConv.h:232

llvm::CallingConv::AMDGPU_CS_ChainPreserve
@ AMDGPU_CS_ChainPreserve
Used on AMDGPUs to give the middle-end more control over argument placement.
Definition CallingConv.h:249

llvm::CallingConv::AMDGPU_HS
@ AMDGPU_HS
Used for Mesa/AMDPAL hull shaders (= tessellation control shaders).
Definition CallingConv.h:206

llvm::CallingConv::AMDGPU_GS
@ AMDGPU_GS
Used for Mesa/AMDPAL geometry shaders.
Definition CallingConv.h:191

llvm::CallingConv::AMDGPU_CS_Chain
@ AMDGPU_CS_Chain
Used on AMDGPUs to give the middle-end more control over argument placement.
Definition CallingConv.h:245

llvm::CallingConv::AMDGPU_PS
@ AMDGPU_PS
Used for Mesa/AMDPAL pixel shaders.
Definition CallingConv.h:194

llvm::CallingConv::SPIR_KERNEL
@ SPIR_KERNEL
Used for SPIR kernel functions.
Definition CallingConv.h:144

llvm::CallingConv::Fast
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition CallingConv.h:41

llvm::CallingConv::AMDGPU_Gfx_WholeWave
@ AMDGPU_Gfx_WholeWave
Definition CallingConv.h:288

llvm::CallingConv::AMDGPU_ES
@ AMDGPU_ES
Used for AMDPAL shader stage before geometry shader if geometry is in use.
Definition CallingConv.h:218

llvm::CallingConv::AMDGPU_LS
@ AMDGPU_LS
Used for AMDPAL vertex shader if tessellation is in use.
Definition CallingConv.h:213

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition Types.h:26

llvm::Offset
@ Offset
Definition DWP.cpp:532

llvm::maxUIntN
constexpr uint64_t maxUIntN(uint64_t N)
Gets the maximum value for an N-bit unsigned integer.
Definition MathExtras.h:207

llvm::Wait
@ Wait
Definition Threading.h:60

llvm::Desc
Op::Description Desc
Definition DWARFExpressionPrinter.cpp:23

llvm::Version
FunctionAddr VTableAddr uintptr_t uintptr_t Version
Definition InstrProf.h:302

llvm::IRMemLocation::Other
@ Other
Any other memory.
Definition ModRef.h:68

llvm::ReplacementType::Format
@ Format
Definition FormatVariadic.h:46

llvm::ReplacementType::Literal
@ Literal
Definition FormatVariadic.h:46

llvm::operator<<
raw_ostream & operator<<(raw_ostream &OS, const APFixedPoint &FX)
Definition APFixedPoint.h:312

llvm::InstructionUniformity::Default
@ Default
The result values are uniform if and only if all operands are uniform.
Definition Uniformity.h:20

amd_kernel_code_t
AMD Kernel Code Object (amd_kernel_code_t).
Definition AMDKernelCodeT.h:526

llvm::AMDGPU::AMDGPUMCKernelCodeT
Definition AMDKernelCodeTUtils.h:33

llvm::AMDGPU::CanBeVOPD
Definition AMDGPUBaseInfo.h:611

llvm::AMDGPU::CanBeVOPD::X
bool X
Definition AMDGPUBaseInfo.h:612

llvm::AMDGPU::CanBeVOPD::Y
bool Y
Definition AMDGPUBaseInfo.h:613

llvm::AMDGPU::CvtScaleF32_F32F16ToF8F4_Info
Definition AMDGPUBaseInfo.h:113

llvm::AMDGPU::CvtScaleF32_F32F16ToF8F4_Info::Opcode
unsigned Opcode
Definition AMDGPUBaseInfo.h:114

llvm::AMDGPU::EncodingField
Definition AMDGPUBaseInfo.h:382

llvm::AMDGPU::EncodingField< Bit, Bit, D >::Width
static constexpr unsigned Width
Definition AMDGPUBaseInfo.h:385

llvm::AMDGPU::EncodingField::ValueType
unsigned ValueType
Definition AMDGPUBaseInfo.h:387

llvm::AMDGPU::EncodingField::EncodingField
constexpr EncodingField(ValueType Value)
Definition AMDGPUBaseInfo.h:391

llvm::AMDGPU::EncodingField< Bit, Bit, D >::Offset
static constexpr unsigned Offset
Definition AMDGPUBaseInfo.h:384

llvm::AMDGPU::EncodingField< Bit, Bit, D >::Value
ValueType Value
Definition AMDGPUBaseInfo.h:390

llvm::AMDGPU::EncodingField< Bit, Bit, D >::Default
static constexpr ValueType Default
Definition AMDGPUBaseInfo.h:388

llvm::AMDGPU::EncodingField::decode
static ValueType decode(uint64_t Encoded)
Definition AMDGPUBaseInfo.h:394

llvm::AMDGPU::EncodingField::encode
constexpr uint64_t encode() const
Definition AMDGPUBaseInfo.h:393

llvm::AMDGPU::EncodingFields
Definition AMDGPUBaseInfo.h:402

llvm::AMDGPU::EncodingFields::encode
static constexpr uint64_t encode(Fields... Values)
Definition AMDGPUBaseInfo.h:403

llvm::AMDGPU::EncodingFields::decode
static std::tuple< typename Fields::ValueType... > decode(uint64_t Encoded)
Definition AMDGPUBaseInfo.h:407

llvm::AMDGPU::GcnBufferFormatInfo
Definition AMDGPUBaseInfo.h:92

llvm::AMDGPU::GcnBufferFormatInfo::BitsPerComp
unsigned BitsPerComp
Definition AMDGPUBaseInfo.h:94

llvm::AMDGPU::GcnBufferFormatInfo::Format
unsigned Format
Definition AMDGPUBaseInfo.h:93

llvm::AMDGPU::GcnBufferFormatInfo::DataFormat
unsigned DataFormat
Definition AMDGPUBaseInfo.h:97

llvm::AMDGPU::GcnBufferFormatInfo::NumFormat
unsigned NumFormat
Definition AMDGPUBaseInfo.h:96

llvm::AMDGPU::GcnBufferFormatInfo::NumComponents
unsigned NumComponents
Definition AMDGPUBaseInfo.h:95

llvm::AMDGPU::HardwareLimits::ExpcntMax
unsigned ExpcntMax
Definition AMDGPUBaseInfo.h:1137

llvm::AMDGPU::HardwareLimits::VmVsrcMax
unsigned VmVsrcMax
Definition AMDGPUBaseInfo.h:1145

llvm::AMDGPU::HardwareLimits::SamplecntMax
unsigned SamplecntMax
Definition AMDGPUBaseInfo.h:1140

llvm::AMDGPU::HardwareLimits::BvhcntMax
unsigned BvhcntMax
Definition AMDGPUBaseInfo.h:1141

llvm::AMDGPU::HardwareLimits::LoadcntMax
unsigned LoadcntMax
Definition AMDGPUBaseInfo.h:1136

llvm::AMDGPU::HardwareLimits::XcntMax
unsigned XcntMax
Definition AMDGPUBaseInfo.h:1143

llvm::AMDGPU::HardwareLimits::HardwareLimits
HardwareLimits()=default

llvm::AMDGPU::HardwareLimits::KmcntMax
unsigned KmcntMax
Definition AMDGPUBaseInfo.h:1142

llvm::AMDGPU::HardwareLimits::DscntMax
unsigned DscntMax
Definition AMDGPUBaseInfo.h:1138

llvm::AMDGPU::HardwareLimits::VaVdstMax
unsigned VaVdstMax
Definition AMDGPUBaseInfo.h:1144

llvm::AMDGPU::HardwareLimits::StorecntMax
unsigned StorecntMax
Definition AMDGPUBaseInfo.h:1139

llvm::AMDGPU::Hwreg::HwregSize
Definition AMDGPUBaseInfo.h:1291

llvm::AMDGPU::Hwreg::HwregSize::EncodingField
constexpr EncodingField(ValueType Value)
Definition AMDGPUBaseInfo.h:391

llvm::AMDGPU::Hwreg::HwregSize::encode
constexpr uint64_t encode() const
Definition AMDGPUBaseInfo.h:1293

llvm::AMDGPU::Hwreg::HwregSize::decode
static ValueType decode(uint64_t Encoded)
Definition AMDGPUBaseInfo.h:1294

llvm::AMDGPU::IsaVersion
Instruction set architecture version.
Definition TargetParser.h:133

llvm::AMDGPU::MAIInstInfo
Definition AMDGPUBaseInfo.h:100

llvm::AMDGPU::MAIInstInfo::is_gfx940_xdl
bool is_gfx940_xdl
Definition AMDGPUBaseInfo.h:103

llvm::AMDGPU::MAIInstInfo::Opcode
uint16_t Opcode
Definition AMDGPUBaseInfo.h:101

llvm::AMDGPU::MAIInstInfo::is_dgemm
bool is_dgemm
Definition AMDGPUBaseInfo.h:102

llvm::AMDGPU::MFMA_F8F6F4_Info
Definition AMDGPUBaseInfo.h:106

llvm::AMDGPU::MFMA_F8F6F4_Info::F8F8Opcode
unsigned F8F8Opcode
Definition AMDGPUBaseInfo.h:108

llvm::AMDGPU::MFMA_F8F6F4_Info::NumRegsSrcB
uint8_t NumRegsSrcB
Definition AMDGPUBaseInfo.h:110

llvm::AMDGPU::MFMA_F8F6F4_Info::Opcode
unsigned Opcode
Definition AMDGPUBaseInfo.h:107

llvm::AMDGPU::MFMA_F8F6F4_Info::NumRegsSrcA
uint8_t NumRegsSrcA
Definition AMDGPUBaseInfo.h:109

llvm::AMDGPU::MIMGBaseOpcodeInfo
Definition AMDGPUBaseInfo.h:421

llvm::AMDGPU::MIMGBaseOpcodeInfo::Gather4
bool Gather4
Definition AMDGPUBaseInfo.h:427

llvm::AMDGPU::MIMGBaseOpcodeInfo::Gradients
bool Gradients
Definition AMDGPUBaseInfo.h:430

llvm::AMDGPU::MIMGBaseOpcodeInfo::G16
bool G16
Definition AMDGPUBaseInfo.h:431

llvm::AMDGPU::MIMGBaseOpcodeInfo::AtomicX2
bool AtomicX2
Definition AMDGPUBaseInfo.h:425

llvm::AMDGPU::MIMGBaseOpcodeInfo::Sampler
bool Sampler
Definition AMDGPUBaseInfo.h:426

llvm::AMDGPU::MIMGBaseOpcodeInfo::BaseOpcode
MIMGBaseOpcode BaseOpcode
Definition AMDGPUBaseInfo.h:422

llvm::AMDGPU::MIMGBaseOpcodeInfo::NoReturn
bool NoReturn
Definition AMDGPUBaseInfo.h:438

llvm::AMDGPU::MIMGBaseOpcodeInfo::HasD16
bool HasD16
Definition AMDGPUBaseInfo.h:434

llvm::AMDGPU::MIMGBaseOpcodeInfo::LodOrClampOrMip
bool LodOrClampOrMip
Definition AMDGPUBaseInfo.h:433

llvm::AMDGPU::MIMGBaseOpcodeInfo::Coordinates
bool Coordinates
Definition AMDGPUBaseInfo.h:432

llvm::AMDGPU::MIMGBaseOpcodeInfo::MSAA
bool MSAA
Definition AMDGPUBaseInfo.h:435

llvm::AMDGPU::MIMGBaseOpcodeInfo::Store
bool Store
Definition AMDGPUBaseInfo.h:423

llvm::AMDGPU::MIMGBaseOpcodeInfo::Atomic
bool Atomic
Definition AMDGPUBaseInfo.h:424

llvm::AMDGPU::MIMGBaseOpcodeInfo::A16
bool A16
Definition AMDGPUBaseInfo.h:437

llvm::AMDGPU::MIMGBaseOpcodeInfo::PointSampleAccel
bool PointSampleAccel
Definition AMDGPUBaseInfo.h:439

llvm::AMDGPU::MIMGBaseOpcodeInfo::BVH
bool BVH
Definition AMDGPUBaseInfo.h:436

llvm::AMDGPU::MIMGBaseOpcodeInfo::NumExtraArgs
uint8_t NumExtraArgs
Definition AMDGPUBaseInfo.h:429

llvm::AMDGPU::MIMGBiasMappingInfo
Definition AMDGPUBaseInfo.h:477

llvm::AMDGPU::MIMGBiasMappingInfo::NoBias
MIMGBaseOpcode NoBias
Definition AMDGPUBaseInfo.h:479

llvm::AMDGPU::MIMGBiasMappingInfo::Bias
MIMGBaseOpcode Bias
Definition AMDGPUBaseInfo.h:478

llvm::AMDGPU::MIMGDimInfo
Definition AMDGPUBaseInfo.h:448

llvm::AMDGPU::MIMGDimInfo::NumCoords
uint8_t NumCoords
Definition AMDGPUBaseInfo.h:450

llvm::AMDGPU::MIMGDimInfo::MSAA
bool MSAA
Definition AMDGPUBaseInfo.h:452

llvm::AMDGPU::MIMGDimInfo::AsmSuffix
const char * AsmSuffix
Definition AMDGPUBaseInfo.h:455

llvm::AMDGPU::MIMGDimInfo::Dim
MIMGDim Dim
Definition AMDGPUBaseInfo.h:449

llvm::AMDGPU::MIMGDimInfo::NumGradients
uint8_t NumGradients
Definition AMDGPUBaseInfo.h:451

llvm::AMDGPU::MIMGDimInfo::Encoding
uint8_t Encoding
Definition AMDGPUBaseInfo.h:454

llvm::AMDGPU::MIMGDimInfo::DA
bool DA
Definition AMDGPUBaseInfo.h:453

llvm::AMDGPU::MIMGG16MappingInfo
Definition AMDGPUBaseInfo.h:487

llvm::AMDGPU::MIMGG16MappingInfo::G
MIMGBaseOpcode G
Definition AMDGPUBaseInfo.h:488

llvm::AMDGPU::MIMGG16MappingInfo::G16
MIMGBaseOpcode G16
Definition AMDGPUBaseInfo.h:489

llvm::AMDGPU::MIMGInfo
Definition AMDGPUBaseInfo.h:524

llvm::AMDGPU::MIMGInfo::VDataDwords
uint8_t VDataDwords
Definition AMDGPUBaseInfo.h:528

llvm::AMDGPU::MIMGInfo::BaseOpcode
uint16_t BaseOpcode
Definition AMDGPUBaseInfo.h:526

llvm::AMDGPU::MIMGInfo::Opcode
uint16_t Opcode
Definition AMDGPUBaseInfo.h:525

llvm::AMDGPU::MIMGInfo::VAddrDwords
uint8_t VAddrDwords
Definition AMDGPUBaseInfo.h:529

llvm::AMDGPU::MIMGInfo::VAddrOperands
uint8_t VAddrOperands
Definition AMDGPUBaseInfo.h:530

llvm::AMDGPU::MIMGInfo::MIMGEncoding
uint8_t MIMGEncoding
Definition AMDGPUBaseInfo.h:527

llvm::AMDGPU::MIMGLZMappingInfo
Definition AMDGPUBaseInfo.h:467

llvm::AMDGPU::MIMGLZMappingInfo::LZ
MIMGBaseOpcode LZ
Definition AMDGPUBaseInfo.h:469

llvm::AMDGPU::MIMGLZMappingInfo::L
MIMGBaseOpcode L
Definition AMDGPUBaseInfo.h:468

llvm::AMDGPU::MIMGMIPMappingInfo
Definition AMDGPUBaseInfo.h:472

llvm::AMDGPU::MIMGMIPMappingInfo::NONMIP
MIMGBaseOpcode NONMIP
Definition AMDGPUBaseInfo.h:474

llvm::AMDGPU::MIMGMIPMappingInfo::MIP
MIMGBaseOpcode MIP
Definition AMDGPUBaseInfo.h:473

llvm::AMDGPU::MIMGOffsetMappingInfo
Definition AMDGPUBaseInfo.h:482

llvm::AMDGPU::MIMGOffsetMappingInfo::Offset
MIMGBaseOpcode Offset
Definition AMDGPUBaseInfo.h:483

llvm::AMDGPU::MIMGOffsetMappingInfo::NoOffset
MIMGBaseOpcode NoOffset
Definition AMDGPUBaseInfo.h:484

llvm::AMDGPU::True16D16Info
Definition AMDGPUBaseInfo.h:117

llvm::AMDGPU::True16D16Info::T16Op
unsigned T16Op
Definition AMDGPUBaseInfo.h:118

llvm::AMDGPU::True16D16Info::HiOp
unsigned HiOp
Definition AMDGPUBaseInfo.h:119

llvm::AMDGPU::True16D16Info::LoOp
unsigned LoOp
Definition AMDGPUBaseInfo.h:120

llvm::AMDGPU::WMMAInstInfo
Definition AMDGPUBaseInfo.h:123

llvm::AMDGPU::WMMAInstInfo::is_wmma_xdl
bool is_wmma_xdl
Definition AMDGPUBaseInfo.h:125

llvm::AMDGPU::WMMAInstInfo::Opcode
uint16_t Opcode
Definition AMDGPUBaseInfo.h:124

llvm::AMDGPU::WMMAOpcodeMappingInfo
Definition AMDGPUBaseInfo.h:495

llvm::AMDGPU::WMMAOpcodeMappingInfo::Opcode3Addr
unsigned Opcode3Addr
Definition AMDGPUBaseInfo.h:497

llvm::AMDGPU::WMMAOpcodeMappingInfo::Opcode2Addr
unsigned Opcode2Addr
Definition AMDGPUBaseInfo.h:496

llvm::AMDGPU::Waitcnt
Represents the counter values to wait for in an s_waitcnt instruction.
Definition AMDGPUBaseInfo.h:1083

llvm::AMDGPU::Waitcnt::Waitcnt
Waitcnt()=default

llvm::AMDGPU::Waitcnt::ExpCnt
unsigned ExpCnt
Definition AMDGPUBaseInfo.h:1085

llvm::AMDGPU::Waitcnt::XCnt
unsigned XCnt
Definition AMDGPUBaseInfo.h:1091

llvm::AMDGPU::Waitcnt::LoadCnt
unsigned LoadCnt
Definition AMDGPUBaseInfo.h:1084

llvm::AMDGPU::Waitcnt::VaVdst
unsigned VaVdst
Definition AMDGPUBaseInfo.h:1092

llvm::AMDGPU::Waitcnt::hasWait
bool hasWait() const
Definition AMDGPUBaseInfo.h:1108

llvm::AMDGPU::Waitcnt::BvhCnt
unsigned BvhCnt
Definition AMDGPUBaseInfo.h:1089

llvm::AMDGPU::Waitcnt::StoreCnt
unsigned StoreCnt
Definition AMDGPUBaseInfo.h:1087

llvm::AMDGPU::Waitcnt::SampleCnt
unsigned SampleCnt
Definition AMDGPUBaseInfo.h:1088

llvm::AMDGPU::Waitcnt::hasWaitDepctr
bool hasWaitDepctr() const
Definition AMDGPUBaseInfo.h:1118

llvm::AMDGPU::Waitcnt::Waitcnt
Waitcnt(unsigned LoadCnt, unsigned ExpCnt, unsigned DsCnt, unsigned StoreCnt, unsigned SampleCnt, unsigned BvhCnt, unsigned KmCnt, unsigned XCnt, unsigned VaVdst, unsigned VmVsrc)
Definition AMDGPUBaseInfo.h:1101

llvm::AMDGPU::Waitcnt::KmCnt
unsigned KmCnt
Definition AMDGPUBaseInfo.h:1090

llvm::AMDGPU::Waitcnt::hasWaitExceptStoreCnt
bool hasWaitExceptStoreCnt() const
Definition AMDGPUBaseInfo.h:1110

llvm::AMDGPU::Waitcnt::VmVsrc
unsigned VmVsrc
Definition AMDGPUBaseInfo.h:1093

llvm::AMDGPU::Waitcnt::hasWaitStoreCnt
bool hasWaitStoreCnt() const
Definition AMDGPUBaseInfo.h:1116

llvm::AMDGPU::Waitcnt::Waitcnt
Waitcnt(unsigned VmCnt, unsigned ExpCnt, unsigned LgkmCnt, unsigned VsCnt)
Definition AMDGPUBaseInfo.h:1097

llvm::AMDGPU::Waitcnt::combined
Waitcnt combined(const Waitcnt &Other) const
Definition AMDGPUBaseInfo.h:1120

llvm::AMDGPU::Waitcnt::DsCnt
unsigned DsCnt
Definition AMDGPUBaseInfo.h:1086

llvm::AMDGPU::Waitcnt::operator<<
friend raw_ostream & operator<<(raw_ostream &OS, const AMDGPU::Waitcnt &Wait)
Definition AMDGPUBaseInfo.cpp:1722