doxygen/AMDGPUBaseInfo_8h_source.html

//===- AMDGPUBaseInfo.h - Top level definitions for AMDGPU ------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_AMDGPU_UTILS_AMDGPUBASEINFO_H

#define LLVM_LIB_TARGET_AMDGPU_UTILS_AMDGPUBASEINFO_H


#include "AMDGPUSubtarget.h"

#include "SIDefines.h"

#include "llvm/IR/CallingConv.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Module.h"

#include "llvm/Support/Alignment.h"

#include <array>

#include <functional>

#include <utility>


struct amd_kernel_code_t;


namespace llvm {


struct Align;

class Argument;

class Function;

class GlobalValue;

class MCInstrInfo;

class MCRegisterClass;

class MCRegisterInfo;

class MCSubtargetInfo;

class StringRef;

class Triple;

class raw_ostream;


namespace AMDGPU {


struct AMDGPUMCKernelCodeT;

struct IsaVersion;


/// Generic target versions emitted by this version of LLVM.
///
/// These numbers are incremented every time a codegen breaking change occurs
/// within a generic family.
///
/// There is one constant per generic family; every family is currently at
/// version 1.
namespace GenericVersion {
static constexpr unsigned GFX9 = 1;
static constexpr unsigned GFX9_4 = 1;
static constexpr unsigned GFX10_1 = 1;
static constexpr unsigned GFX10_3 = 1;
static constexpr unsigned GFX11 = 1;
static constexpr unsigned GFX12 = 1;
} // namespace GenericVersion


/// AMDHSA code object version constants; each enumerator equals the version
/// number in its name.
/// NOTE(review): presumably these are the values exchanged with the
/// *AMDHSACodeObjectVersion() helpers declared below -- confirm.
enum { AMDHSA_COV4 = 4, AMDHSA_COV5 = 5, AMDHSA_COV6 = 6 };

/// Floating-point type tag; this is the result type of getFPDstSelType().
enum class FPType { None, FP4, FP8 };


/// \returns True if \p STI is AMDHSA.
bool isHsaAbi(const MCSubtargetInfo &STI);

/// \returns Code object version from the IR module flag.
unsigned getAMDHSACodeObjectVersion(const Module &M);

/// \returns Code object version from ELF's e_ident[EI_ABIVERSION].
unsigned getAMDHSACodeObjectVersion(unsigned ABIVersion);

/// \returns The default HSA code object version. This should only be used when
/// we lack a more accurate CodeObjectVersion value (e.g. from the IR module
/// flag or a .amdhsa_code_object_version directive).
unsigned getDefaultAMDHSACodeObjectVersion();

/// \returns ABIVersion suitable for use in ELF's e_ident[EI_ABIVERSION].
/// \param OS The target triple.
/// \param CodeObjectVersion A value returned by getAMDHSACodeObjectVersion().
uint8_t getELFABIVersion(const Triple &OS, unsigned CodeObjectVersion);

/// \returns The offset of the multigrid_sync_arg argument from implicitarg_ptr
/// for \p COV (presumably the code object version -- confirm).
unsigned getMultigridSyncArgImplicitArgPosition(unsigned COV);

/// \returns The offset of the hostcall pointer argument from implicitarg_ptr
/// for \p COV (presumably the code object version -- confirm).
unsigned getHostcallImplicitArgPosition(unsigned COV);

/// NOTE(review): undocumented. Presumably the offset of the default queue
/// argument from implicitarg_ptr for \p COV, analogous to
/// getHostcallImplicitArgPosition() -- confirm against the definition.
unsigned getDefaultQueueImplicitArgPosition(unsigned COV);
/// NOTE(review): undocumented. Presumably the offset of the completion action
/// argument from implicitarg_ptr for \p COV, analogous to
/// getHostcallImplicitArgPosition() -- confirm against the definition.
unsigned getCompletionActionImplicitArgPosition(unsigned COV);


/// Describes one buffer format: the combined \c Format value together with
/// its bits-per-component, component count, numeric format and data format.
/// Pointers to this type are returned by getGcnBufferFormatInfo().
/// NOTE(review): presumably a row of a generated lookup table, in which case
/// the member order must not change -- confirm before reordering.
struct GcnBufferFormatInfo {
  unsigned Format;
  unsigned BitsPerComp;
  unsigned NumComponents;
  unsigned NumFormat;
  unsigned DataFormat;
};


/// Per-opcode flags for MAI instructions.
/// NOTE(review): presumably the data behind getMAIIsDGEMM() and
/// getMAIIsGFX940XDL(), stored as a row of a generated lookup table --
/// confirm before reordering members.
struct MAIInstInfo {
  uint16_t Opcode;
  bool is_dgemm;      // See getMAIIsDGEMM(): double precision GEMM.
  bool is_gfx940_xdl;
};


/// Entry type returned by getMFMA_F8F6F4_WithFormatArgs(): an opcode, the
/// related F8F8 opcode, and the register counts of source operands A and B.
/// NOTE(review): presumably a row of a generated lookup table -- confirm
/// before reordering members.
struct MFMA_F8F6F4_Info {
  unsigned Opcode;
  unsigned F8F8Opcode;
  uint8_t NumRegsSrcA;
  uint8_t NumRegsSrcB;
};


/// Single-field entry that only records an opcode.
/// NOTE(review): presumably a membership table of the CvtScaleF32
/// F32/F16-to-F8/F4 conversion opcodes (see the matching
/// GET_isCvtScaleF32_F32F16ToF8F4Table_DECL request below) -- confirm.
struct CvtScaleF32_F32F16ToF8F4_Info {
  unsigned Opcode;
};


// Select which declaration sections of the TableGen-generated
// AMDGPUGenSearchableTables.inc are pulled in by the #include below.
// Each macro is listed exactly once; a repeated, identical #define has no
// effect and only obscures the list.
// NOTE(review): "GET_MIMGBiASMapping_DECL" is spelled with a capital "AS",
// unlike MIMGBiasMappingInfo elsewhere in this header. It is left untouched
// because the guard names used inside the generated file are not visible
// here -- confirm the intended spelling against the .inc file.
#define GET_MIMGBaseOpcode_DECL
#define GET_MIMGDim_DECL
#define GET_MIMGEncoding_DECL
#define GET_MIMGLZMapping_DECL
#define GET_MIMGMIPMapping_DECL
#define GET_MIMGBiASMapping_DECL
#define GET_MAIInstInfoTable_DECL
#define GET_isMFMA_F8F6F4Table_DECL
#define GET_isCvtScaleF32_F32F16ToF8F4Table_DECL
#include "AMDGPUGenSearchableTables.inc"


namespace IsaInfo {


/// Fixed SGPR counts.
enum {
  // The closed Vulkan driver sets 96, which limits the wave count to 8 but
  // doesn't spill SGPRs as much as when 80 is set.
  FIXED_NUM_SGPRS_FOR_INIT_BUG = 96,
  // NOTE(review): presumably the number of SGPRs reserved for the trap
  // handler -- confirm against the users of this constant.
  TRAP_NUM_SGPRS = 16
};


/// State of one target-ID feature. AMDGPUTargetID keeps one value of this
/// type for xnack and one for sramecc.
enum class TargetIDSetting {
  Unsupported,
  Any,
  Off,
  On
};


class AMDGPUTargetID {

private:

  const MCSubtargetInfo &STI;

  TargetIDSetting XnackSetting;

  TargetIDSetting SramEccSetting;


public:

  explicit AMDGPUTargetID(const MCSubtargetInfo &STI);

  ~AMDGPUTargetID() = default;


  /// \return True if the current xnack setting is not "Unsupported".

  bool isXnackSupported() const {

    return XnackSetting != TargetIDSetting::Unsupported;

  }


  /// \returns True if the current xnack setting is "On" or "Any".

  bool isXnackOnOrAny() const {

    return XnackSetting == TargetIDSetting::On ||

        XnackSetting == TargetIDSetting::Any;

  }


  /// \returns True if current xnack setting is "On" or "Off",

  /// false otherwise.

  bool isXnackOnOrOff() const {

    return getXnackSetting() == TargetIDSetting::On ||

        getXnackSetting() == TargetIDSetting::Off;

  }


  /// \returns The current xnack TargetIDSetting, possible options are

  /// "Unsupported", "Any", "Off", and "On".

  TargetIDSetting getXnackSetting() const {

    return XnackSetting;

  }


  /// Sets xnack setting to \p NewXnackSetting.

  void setXnackSetting(TargetIDSetting NewXnackSetting) {

    XnackSetting = NewXnackSetting;

  }


  /// \return True if the current sramecc setting is not "Unsupported".

  bool isSramEccSupported() const {

    return SramEccSetting != TargetIDSetting::Unsupported;

  }


  /// \returns True if the current sramecc setting is "On" or "Any".

  bool isSramEccOnOrAny() const {

  return SramEccSetting == TargetIDSetting::On ||

      SramEccSetting == TargetIDSetting::Any;

  }


  /// \returns True if current sramecc setting is "On" or "Off",

  /// false otherwise.

  bool isSramEccOnOrOff() const {

    return getSramEccSetting() == TargetIDSetting::On ||

        getSramEccSetting() == TargetIDSetting::Off;

  }


  /// \returns The current sramecc TargetIDSetting, possible options are

  /// "Unsupported", "Any", "Off", and "On".

  TargetIDSetting getSramEccSetting() const {

    return SramEccSetting;

  }


  /// Sets sramecc setting to \p NewSramEccSetting.

  void setSramEccSetting(TargetIDSetting NewSramEccSetting) {

    SramEccSetting = NewSramEccSetting;

  }


  void setTargetIDFromFeaturesString(StringRef FS);

  void setTargetIDFromTargetIDStream(StringRef TargetID);


  /// \returns String representation of an object.

  std::string toString() const;

};


// Wavefront, local memory, and work-group queries. Every function takes the
// subtarget \p STI by pointer.

/// \returns Wavefront size for given subtarget \p STI.
unsigned getWavefrontSize(const MCSubtargetInfo *STI);

/// \returns Local memory size in bytes for given subtarget \p STI.
unsigned getLocalMemorySize(const MCSubtargetInfo *STI);

/// \returns Maximum addressable local memory size in bytes for given subtarget
/// \p STI.
unsigned getAddressableLocalMemorySize(const MCSubtargetInfo *STI);

/// \returns Number of execution units per compute unit for given subtarget \p
/// STI.
unsigned getEUsPerCU(const MCSubtargetInfo *STI);

/// \returns Maximum number of work groups per compute unit for given subtarget
/// \p STI and limited by given \p FlatWorkGroupSize.
unsigned getMaxWorkGroupsPerCU(const MCSubtargetInfo *STI,
                               unsigned FlatWorkGroupSize);

/// \returns Minimum number of waves per execution unit for given subtarget \p
/// STI.
unsigned getMinWavesPerEU(const MCSubtargetInfo *STI);

/// \returns Maximum number of waves per execution unit for given subtarget \p
/// STI without any kind of limitation.
unsigned getMaxWavesPerEU(const MCSubtargetInfo *STI);

/// \returns Number of waves per execution unit required to support the given \p
/// FlatWorkGroupSize on subtarget \p STI.
unsigned getWavesPerEUForWorkGroup(const MCSubtargetInfo *STI,
                                   unsigned FlatWorkGroupSize);

/// \returns Minimum flat work group size for given subtarget \p STI.
unsigned getMinFlatWorkGroupSize(const MCSubtargetInfo *STI);

/// \returns Maximum flat work group size for given subtarget \p STI.
unsigned getMaxFlatWorkGroupSize(const MCSubtargetInfo *STI);

/// \returns Number of waves per work group for given subtarget \p STI and
/// \p FlatWorkGroupSize.
unsigned getWavesPerWorkGroup(const MCSubtargetInfo *STI,
                              unsigned FlatWorkGroupSize);


// SGPR queries.

/// \returns SGPR allocation granularity for given subtarget \p STI.
unsigned getSGPRAllocGranule(const MCSubtargetInfo *STI);

/// \returns SGPR encoding granularity for given subtarget \p STI.
unsigned getSGPREncodingGranule(const MCSubtargetInfo *STI);

/// \returns Total number of SGPRs for given subtarget \p STI.
unsigned getTotalNumSGPRs(const MCSubtargetInfo *STI);

/// \returns Addressable number of SGPRs for given subtarget \p STI.
unsigned getAddressableNumSGPRs(const MCSubtargetInfo *STI);

/// \returns Minimum number of SGPRs that meets the given number of waves per
/// execution unit requirement for given subtarget \p STI.
unsigned getMinNumSGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU);

/// \returns Maximum number of SGPRs that meets the given number of waves per
/// execution unit requirement for given subtarget \p STI.
/// NOTE(review): \p Addressable is undocumented; presumably it limits the
/// result to the addressable SGPRs (see getAddressableNumSGPRs()) -- confirm.
unsigned getMaxNumSGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU,
                        bool Addressable);

/// \returns Number of extra SGPRs implicitly required by given subtarget \p
/// STI when the given special registers are used.
unsigned getNumExtraSGPRs(const MCSubtargetInfo *STI, bool VCCUsed,
                          bool FlatScrUsed, bool XNACKUsed);

/// \returns Number of extra SGPRs implicitly required by given subtarget \p
/// STI when the given special registers are used. XNACK is inferred from
/// \p STI.
unsigned getNumExtraSGPRs(const MCSubtargetInfo *STI, bool VCCUsed,
                          bool FlatScrUsed);

/// \returns Number of SGPR blocks needed for given subtarget \p STI when
/// \p NumSGPRs are used. \p NumSGPRs should already include any special
/// register counts.
unsigned getNumSGPRBlocks(const MCSubtargetInfo *STI, unsigned NumSGPRs);


// VGPR queries. Where present, \p EnableWavefrontSize32 defaults to
// std::nullopt.

/// \returns VGPR allocation granularity for given subtarget \p STI.
///
/// For subtargets which support it, \p EnableWavefrontSize32 should match
/// the ENABLE_WAVEFRONT_SIZE32 kernel descriptor field.
unsigned
getVGPRAllocGranule(const MCSubtargetInfo *STI,
                    std::optional<bool> EnableWavefrontSize32 = std::nullopt);

/// \returns VGPR encoding granularity for given subtarget \p STI.
///
/// For subtargets which support it, \p EnableWavefrontSize32 should match
/// the ENABLE_WAVEFRONT_SIZE32 kernel descriptor field.
unsigned getVGPREncodingGranule(
    const MCSubtargetInfo *STI,
    std::optional<bool> EnableWavefrontSize32 = std::nullopt);

/// \returns Total number of VGPRs for given subtarget \p STI.
unsigned getTotalNumVGPRs(const MCSubtargetInfo *STI);

/// \returns Addressable number of architectural VGPRs for a given subtarget \p
/// STI.
unsigned getAddressableNumArchVGPRs(const MCSubtargetInfo *STI);

/// \returns Addressable number of VGPRs for given subtarget \p STI.
unsigned getAddressableNumVGPRs(const MCSubtargetInfo *STI);

/// \returns Minimum number of VGPRs that meets given number of waves per
/// execution unit requirement for given subtarget \p STI.
unsigned getMinNumVGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU);

/// \returns Maximum number of VGPRs that meets given number of waves per
/// execution unit requirement for given subtarget \p STI.
unsigned getMaxNumVGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU);

/// \returns Number of waves reachable for a given \p NumVGPRs usage for given
/// subtarget \p STI.
unsigned getNumWavesPerEUWithNumVGPRs(const MCSubtargetInfo *STI,
                                      unsigned NumVGPRs);

/// \returns Number of waves reachable for a given \p NumVGPRs usage, \p Granule
/// size, \p MaxWaves possible, and \p TotalNumVGPRs available.
unsigned getNumWavesPerEUWithNumVGPRs(unsigned NumVGPRs, unsigned Granule,
                                      unsigned MaxWaves,
                                      unsigned TotalNumVGPRs);

/// \returns Occupancy for a given \p SGPRs usage, \p MaxWaves possible, and \p
/// Gen.
unsigned getOccupancyWithNumSGPRs(unsigned SGPRs, unsigned MaxWaves,
                                  AMDGPUSubtarget::Generation Gen);

/// \returns Number of VGPR blocks needed for given subtarget \p STI when
/// \p NumVGPRs are used. We actually return the number of blocks -1, since
/// that's what we encode.
///
/// For subtargets which support it, \p EnableWavefrontSize32 should match the
/// ENABLE_WAVEFRONT_SIZE32 kernel descriptor field.
unsigned getEncodedNumVGPRBlocks(
    const MCSubtargetInfo *STI, unsigned NumVGPRs,
    std::optional<bool> EnableWavefrontSize32 = std::nullopt);

/// \returns Number of VGPR blocks that need to be allocated for the given
/// subtarget \p STI when \p NumVGPRs are used.
///
/// NOTE(review): \p EnableWavefrontSize32 is undocumented here; presumably it
/// has the same meaning as for getEncodedNumVGPRBlocks() -- confirm.
unsigned getAllocatedNumVGPRBlocks(
    const MCSubtargetInfo *STI, unsigned NumVGPRs,
    std::optional<bool> EnableWavefrontSize32 = std::nullopt);

} // end namespace IsaInfo


// Represents a field in an encoded value.
//
// The field occupies bits [LowBit, HighBit] (both inclusive) of the encoded
// word, so it starts at bit Offset == LowBit and is Width bits wide. D is the
// field's default value, exposed as Default.
template <unsigned HighBit, unsigned LowBit, unsigned D = 0>
struct EncodingField {
  static_assert(HighBit >= LowBit, "Invalid bit range!");
  static constexpr unsigned Offset = LowBit;
  static constexpr unsigned Width = HighBit - LowBit + 1;

  using ValueType = unsigned;
  static constexpr ValueType Default = D;

  ValueType Value;
  // Intentionally implicit, so a plain value can be passed where a field is
  // expected.
  constexpr EncodingField(ValueType Value) : Value(Value) {}

  // Returns the stored value widened to 64 bits. The value is NOT shifted to
  // the field's offset here.
  constexpr uint64_t encode() const { return Value; }

  // Converts \p Encoded back to ValueType. No shifting or masking is done
  // here; bits that do not fit into ValueType are dropped. constexpr so that
  // decoding is usable in constant expressions, just like encode().
  static constexpr ValueType decode(uint64_t Encoded) {
    return static_cast<ValueType>(Encoded);
  }
};


// Represents a single bit in an encoded value: an EncodingField whose high
// and low bit are both Bit, with default value D.
template <unsigned Bit, unsigned D = 0>
using EncodingBit = EncodingField<Bit, Bit, D>;


// A helper for encoding and decoding multiple fields at once.
template <typename... Fields> struct EncodingFields {
  // Shifts every field's encoded value to that field's Offset and ORs the
  // results into a single 64-bit word.
  static constexpr uint64_t encode(Fields... Values) {
    return (... | (Values.encode() << Values.Offset));
  }

  // Extracts every field from \p Encoded: the word is shifted down by the
  // field's Offset, masked with maxUIntN(Width), and handed to the field's
  // own decode(). The results are returned in the order of \p Fields.
  static std::tuple<typename Fields::ValueType...> decode(uint64_t Encoded) {
    return std::tuple<typename Fields::ValueType...>{Fields::decode(
        (Encoded >> Fields::Offset) & maxUIntN(Fields::Width))...};
  }
};


/// NOTE(review): undocumented. Presumably returns the operand index of the
/// named operand \p NamedIdx in instruction \p Opcode; hasNamedOperand()
/// treats a result of -1 as "not present" -- confirm against the definition.
LLVM_READONLY
int16_t getNamedOperandIdx(uint16_t Opcode, uint16_t NamedIdx);


/// \returns True if getNamedOperandIdx() reports an index other than -1 for
/// \p Opcode and \p NamedIdx.
///
/// Both arguments are narrowed to uint16_t before the lookup, because that is
/// the parameter type of getNamedOperandIdx().
LLVM_READONLY
inline bool hasNamedOperand(uint64_t Opcode, uint64_t NamedIdx) {
  const int16_t OperandIdx = getNamedOperandIdx(
      static_cast<uint16_t>(Opcode), static_cast<uint16_t>(NamedIdx));
  return OperandIdx != -1;
}


/// NOTE(review): undocumented. Presumably maps the SOPP opcode \p Opcode to
/// its variant with relaxation; the meaning of the int result for unmapped
/// opcodes is not visible here -- confirm against the definition.
LLVM_READONLY
int getSOPPWithRelaxation(uint16_t Opcode);


/// Properties of one MIMG base opcode, returned by getMIMGBaseOpcode() and
/// getMIMGBaseOpcodeInfo().
/// NOTE(review): presumably a row of a generated lookup table, in which case
/// the member order must not change -- confirm before reordering.
struct MIMGBaseOpcodeInfo {
  MIMGBaseOpcode BaseOpcode;
  bool Store;
  bool Atomic;
  bool AtomicX2;
  bool Sampler;
  bool Gather4;

  uint8_t NumExtraArgs;
  bool Gradients;
  bool G16;
  bool Coordinates;
  bool LodOrClampOrMip;
  bool HasD16;
  bool MSAA;
  bool BVH;
  bool A16;
  bool NoReturn;
};


/// NOTE(review): undocumented. Presumably looks up the base opcode info that
/// belongs to the instruction opcode \p Opc -- confirm.
LLVM_READONLY
const MIMGBaseOpcodeInfo *getMIMGBaseOpcode(unsigned Opc);

/// NOTE(review): undocumented. Presumably looks up the info by the base
/// opcode value \p BaseOpcode itself -- confirm.
LLVM_READONLY
const MIMGBaseOpcodeInfo *getMIMGBaseOpcodeInfo(unsigned BaseOpcode);


/// Properties of one MIMG dimension, returned by the getMIMGDimInfo*()
/// lookups, which key on the enum value, the encoding, or the asm suffix.
/// NOTE(review): presumably a row of a generated lookup table, in which case
/// the member order must not change -- confirm before reordering.
struct MIMGDimInfo {
  MIMGDim Dim;
  uint8_t NumCoords;
  uint8_t NumGradients;
  bool MSAA;
  bool DA;
  uint8_t Encoding;
  const char *AsmSuffix;
};


// MIMGDimInfo lookups; one per key type.
// NOTE(review): the result for an unknown key is not visible here
// (presumably a null pointer) -- confirm.

/// Looks up dimension info by the dimension enum value \p DimEnum.
LLVM_READONLY
const MIMGDimInfo *getMIMGDimInfo(unsigned DimEnum);

/// Looks up dimension info by the encoding \p DimEnc.
LLVM_READONLY
const MIMGDimInfo *getMIMGDimInfoByEncoding(uint8_t DimEnc);

/// Looks up dimension info by the assembler suffix \p AsmSuffix.
LLVM_READONLY
const MIMGDimInfo *getMIMGDimInfoByAsmSuffix(StringRef AsmSuffix);


// Pairs of MIMG base opcodes. Each struct has a matching getMIMG*MappingInfo()
// lookup declared in this header.
// NOTE(review): presumably each row relates the first member (the lookup key)
// to its counterpart in the second member, and the rows come from generated
// tables -- confirm before reordering members.

/// Pair of an L base opcode and an LZ base opcode.
struct MIMGLZMappingInfo {
  MIMGBaseOpcode L;
  MIMGBaseOpcode LZ;
};

/// Pair of a MIP base opcode and a NONMIP base opcode.
struct MIMGMIPMappingInfo {
  MIMGBaseOpcode MIP;
  MIMGBaseOpcode NONMIP;
};

/// Pair of a Bias base opcode and a NoBias base opcode.
struct MIMGBiasMappingInfo {
  MIMGBaseOpcode Bias;
  MIMGBaseOpcode NoBias;
};

/// Pair of an Offset base opcode and a NoOffset base opcode.
struct MIMGOffsetMappingInfo {
  MIMGBaseOpcode Offset;
  MIMGBaseOpcode NoOffset;
};

/// Pair of a G base opcode and a G16 base opcode.
struct MIMGG16MappingInfo {
  MIMGBaseOpcode G;
  MIMGBaseOpcode G16;
};


/// NOTE(review): undocumented. Presumably looks up the MIMGLZMappingInfo row
/// whose L member equals \p L -- confirm.
LLVM_READONLY
const MIMGLZMappingInfo *getMIMGLZMappingInfo(unsigned L);


/// Pair of a 2-address and a 3-address WMMA opcode.
/// NOTE(review): presumably the data behind mapWMMA2AddrTo3AddrOpcode() and
/// mapWMMA3AddrTo2AddrOpcode() -- confirm.
struct WMMAOpcodeMappingInfo {
  unsigned Opcode2Addr;
  unsigned Opcode3Addr;
};


// Remaining MIMG mapping lookups and opcode helpers.
// NOTE(review): all undocumented; the remarks below are inferred from the
// names and signatures only -- confirm against the definitions.

/// Presumably looks up the mapping row keyed by the MIP base opcode \p MIP.
LLVM_READONLY
const MIMGMIPMappingInfo *getMIMGMIPMappingInfo(unsigned MIP);

/// Presumably looks up the mapping row keyed by the Bias base opcode \p Bias.
LLVM_READONLY
const MIMGBiasMappingInfo *getMIMGBiasMappingInfo(unsigned Bias);

/// Presumably looks up the mapping row keyed by the Offset base opcode
/// \p Offset.
LLVM_READONLY
const MIMGOffsetMappingInfo *getMIMGOffsetMappingInfo(unsigned Offset);

/// Presumably looks up the mapping row keyed by the G base opcode \p G.
LLVM_READONLY
const MIMGG16MappingInfo *getMIMGG16MappingInfo(unsigned G);

/// Presumably selects the MIMG opcode matching the given base opcode,
/// encoding, and vdata/vaddr dword counts; these parameters mirror the
/// members of MIMGInfo.
LLVM_READONLY
int getMIMGOpcode(unsigned BaseOpcode, unsigned MIMGEncoding,
                  unsigned VDataDwords, unsigned VAddrDwords);

/// Presumably returns the variant of \p Opc that uses \p NewChannels channels.
LLVM_READONLY
int getMaskedMIMGOp(unsigned Opc, unsigned NewChannels);

/// Presumably computes the address size for the given base opcode and
/// dimension, taking the A16/G16 settings into account.
LLVM_READONLY
unsigned getAddrSizeMIMGOp(const MIMGBaseOpcodeInfo *BaseOpcode,
                           const MIMGDimInfo *Dim, bool IsA16,
                           bool IsG16Supported);


/// Per-opcode MIMG properties, returned by getMIMGInfo(): the opcode, its
/// base opcode and encoding, and the vdata/vaddr sizes.
/// NOTE(review): presumably a row of a generated lookup table, in which case
/// the member order must not change -- confirm before reordering.
struct MIMGInfo {
  uint16_t Opcode;
  uint16_t BaseOpcode;
  uint8_t MIMGEncoding;
  uint8_t VDataDwords;
  uint8_t VAddrDwords;
  uint8_t VAddrOperands;
};


/// NOTE(review): undocumented. Presumably looks up the MIMGInfo row for the
/// opcode \p Opc; the result for a non-MIMG opcode is not visible here
/// (presumably a null pointer) -- confirm.
LLVM_READONLY
const MIMGInfo *getMIMGInfo(unsigned Opc);


// MTBUF opcode queries.
// NOTE(review): all undocumented. Judging by the names only, they report the
// base opcode, the opcode for a given element count, the element count, and
// whether the vaddr / srsrc / soffset operands exist -- confirm against the
// definitions, including the results for non-MTBUF opcodes.

LLVM_READONLY
int getMTBUFBaseOpcode(unsigned Opc);

LLVM_READONLY
int getMTBUFOpcode(unsigned BaseOpc, unsigned Elements);

LLVM_READONLY
int getMTBUFElements(unsigned Opc);

LLVM_READONLY
bool getMTBUFHasVAddr(unsigned Opc);

LLVM_READONLY
bool getMTBUFHasSrsrc(unsigned Opc);

LLVM_READONLY
bool getMTBUFHasSoffset(unsigned Opc);


// MUBUF opcode queries; the first six have the same signatures as their MTBUF
// counterparts.
// NOTE(review): all undocumented. Judging by the names only, they report the
// base opcode, the opcode for a given element count, the element count,
// whether the vaddr / srsrc / soffset operands exist, whether the opcode is a
// buffer invalidate, and its tfe property -- confirm against the definitions.

LLVM_READONLY
int getMUBUFBaseOpcode(unsigned Opc);

LLVM_READONLY
int getMUBUFOpcode(unsigned BaseOpc, unsigned Elements);

LLVM_READONLY
int getMUBUFElements(unsigned Opc);

LLVM_READONLY
bool getMUBUFHasVAddr(unsigned Opc);

LLVM_READONLY
bool getMUBUFHasSrsrc(unsigned Opc);

LLVM_READONLY
bool getMUBUFHasSoffset(unsigned Opc);

LLVM_READONLY
bool getMUBUFIsBufferInv(unsigned Opc);

LLVM_READONLY
bool getMUBUFTfe(unsigned Opc);


// Per-opcode boolean properties.
// NOTE(review): apart from getMAIIsDGEMM() these are undocumented; their
// meaning is only suggested by their names -- confirm against the
// definitions.

LLVM_READONLY
bool getSMEMIsBuffer(unsigned Opc);

LLVM_READONLY
bool getVOP1IsSingle(unsigned Opc);

LLVM_READONLY
bool getVOP2IsSingle(unsigned Opc);

LLVM_READONLY
bool getVOP3IsSingle(unsigned Opc);

LLVM_READONLY
bool isVOPC64DPP(unsigned Opc);

LLVM_READONLY
bool isVOPCAsmOnly(unsigned Opc);

/// Returns true if MAI operation is a double precision GEMM.
LLVM_READONLY
bool getMAIIsDGEMM(unsigned Opc);

/// NOTE(review): presumably reports the is_gfx940_xdl flag of MAIInstInfo for
/// \p Opc -- confirm.
LLVM_READONLY
bool getMAIIsGFX940XDL(unsigned Opc);


/// Result of getCanBeVOPD(): one flag per VOPD component.
/// NOTE(review): presumably X / Y tell whether the queried opcode may be used
/// as the X / Y component of a VOPD instruction -- confirm.
struct CanBeVOPD {
  bool X;
  bool Y;
};


/// \returns SIEncodingFamily used for VOPD encoding on a \p ST.
LLVM_READONLY
unsigned getVOPDEncodingFamily(const MCSubtargetInfo &ST);

/// \returns The CanBeVOPD flags for opcode \p Opc.
LLVM_READONLY
CanBeVOPD getCanBeVOPD(unsigned Opc);

/// NOTE(review): undocumented. Presumably maps an MFMA scale F8F6F4 format
/// encoding \p EncodingVal to the number of registers it occupies -- confirm.
LLVM_READNONE
uint8_t mfmaScaleF8F6F4FormatToNumRegs(unsigned EncodingVal);

/// NOTE(review): undocumented. Presumably selects the MFMA_F8F6F4_Info row
/// matching the format arguments \p CBSZ and \p BLGP for \p F8F8Opcode --
/// confirm.
LLVM_READONLY
const MFMA_F8F6F4_Info *getMFMA_F8F6F4_WithFormatArgs(unsigned CBSZ,
                                                      unsigned BLGP,
                                                      unsigned F8F8Opcode);

/// Looks up a buffer format by its components (bits per component, number of
/// components, numeric format) for subtarget \p STI.
/// NOTE(review): the result when nothing matches is not visible here
/// (presumably a null pointer) -- confirm.
LLVM_READONLY
const GcnBufferFormatInfo *getGcnBufferFormatInfo(uint8_t BitsPerComp,
                                                  uint8_t NumComponents,
                                                  uint8_t NumFormat,
                                                  const MCSubtargetInfo &STI);
/// Looks up a buffer format by its combined \p Format value for subtarget
/// \p STI.
LLVM_READONLY
const GcnBufferFormatInfo *getGcnBufferFormatInfo(uint8_t Format,
                                                  const MCSubtargetInfo &STI);

// NOTE(review): the remaining declarations of this group are undocumented;
// their meaning is only suggested by their names -- confirm against the
// definitions.

LLVM_READONLY
int getMCOpcode(uint16_t Opcode, unsigned Gen);

LLVM_READONLY
unsigned getVOPDOpcode(unsigned Opc);

LLVM_READONLY
int getVOPDFull(unsigned OpX, unsigned OpY, unsigned EncodingFamily);

LLVM_READONLY
bool isVOPD(unsigned Opc);

LLVM_READNONE
bool isMAC(unsigned Opc);

LLVM_READNONE
bool isPermlane16(unsigned Opc);

LLVM_READNONE
bool isGenericAtomic(unsigned Opc);

LLVM_READNONE
bool isCvt_F32_Fp8_Bf8_e64(unsigned Opc);


namespace VOPD {


// Operand indices within a single VOPD component, followed by operand counts.
// The first four enumerators number the operands (DST == 0, SRC0 == 1,
// SRC1 == 2, SRC2 == 3); the last three are counts, not indices, so
// MAX_OPR_NUM evaluates to 4.
enum Component : unsigned {
  DST = 0,
  SRC0,
  SRC1,
  SRC2,

  DST_NUM = 1,
  MAX_SRC_NUM = 3,
  MAX_OPR_NUM = DST_NUM + MAX_SRC_NUM
};


// LSB masks selecting the VGPR bank, one entry per VOPD component operand.
// A mask of 3 keeps the 2 low bits (4 banks); a mask of 1 keeps 1 bit.
// NOTE(review): the four entries are presumably indexed by Component
// (DST, SRC0, SRC1, SRC2) -- confirm.
constexpr unsigned VOPD_VGPR_BANK_MASKS[] = {1, 3, 3, 1};

// Index of a component within a VOPD instruction.
enum ComponentIndex : unsigned { X, Y };

// All component indices, in order, plus their count (derived from the list
// so that the two cannot drift apart).
constexpr unsigned COMPONENTS[] = {ComponentIndex::X, ComponentIndex::Y};
constexpr unsigned COMPONENTS_NUM = sizeof(COMPONENTS) / sizeof(COMPONENTS[0]);


// Properties of VOPD components.
//
// A default-constructed object describes a component without src operands,
// without a mandatory literal and without a tied src2.
class ComponentProps {
private:
  unsigned SrcOperandsNum = 0;
  // Component operand index of the mandatory literal; ~0u means "none".
  unsigned MandatoryLiteralIdx = ~0u;
  bool HasSrc2Acc = false;

public:
  ComponentProps() = default;
  ComponentProps(const MCInstrDesc &OpDesc);

  // Return the total number of src operands this component has.
  unsigned getCompSrcOperandsNum() const { return SrcOperandsNum; }

  // Return the number of src operands of this component visible to the
  // parser, i.e. the total number minus the tied src2, if there is one.
  unsigned getCompParsedSrcOperandsNum() const {
    return HasSrc2Acc ? SrcOperandsNum - 1 : SrcOperandsNum;
  }

  // Return true iff this component has a mandatory literal.
  bool hasMandatoryLiteral() const { return !(MandatoryLiteralIdx == ~0u); }

  // If this component has a mandatory literal, return component operand
  // index of this literal (i.e. either Component::SRC1 or Component::SRC2).
  // Must not be called otherwise.
  unsigned getMandatoryLiteralCompOperandIndex() const {
    assert(hasMandatoryLiteral());
    return MandatoryLiteralIdx;
  }

  // Return true iff this component has an operand with component src index
  // CompSrcIdx and this operand may be a register, i.e. it is not the
  // mandatory literal.
  bool hasRegSrcOperand(unsigned CompSrcIdx) const {
    assert(CompSrcIdx < Component::MAX_SRC_NUM);
    if (CompSrcIdx >= SrcOperandsNum)
      return false;
    return !hasMandatoryLiteralAt(CompSrcIdx);
  }

  // Return true iff this component has tied src2.
  bool hasSrc2Acc() const { return HasSrc2Acc; }

private:
  // Return true iff the mandatory literal is the src operand CompSrcIdx.
  // MandatoryLiteralIdx counts the dst operand too, hence the DST_NUM bias.
  bool hasMandatoryLiteralAt(unsigned CompSrcIdx) const {
    assert(CompSrcIdx < Component::MAX_SRC_NUM);
    const unsigned CompOprIdx = Component::DST_NUM + CompSrcIdx;
    return MandatoryLiteralIdx == CompOprIdx;
  }
};


// Role of a component. The numeric values are used by ComponentLayout as
// indices into its per-kind tables, so they must stay 0, 1, 2.
enum ComponentKind : unsigned {
  SINGLE = 0,  // A single VOP1 or VOP2 instruction which may be used in VOPD.
  COMPONENT_X, // A VOPD instruction, X component.
  COMPONENT_Y, // A VOPD instruction, Y component.
  MAX = COMPONENT_Y // Largest valid kind.
};


// Maps VOPD component operand indices to indices of operands in a
// MachineInstr/MCInst or in the parsed operands array.
//
// Three kinds of indices are involved:
// - VOPD component operand indices (Component::DST, Component::SRC0, etc.);
// - MC operand indices (they refer to operands in a MachineInstr/MCInst);
// - parsed operand indices (they refer to operands in the parsed operands
//   array).
//
// For SINGLE components the mapping between these indices is trivial.
// COMPONENT_X and COMPONENT_Y are more involved because both components
// share one MachineInstr/MCInst and one parsed operands array.
// Below is an example of the component operand to parsed operand
// mapping for the following instruction:
//
//   v_dual_add_f32 v255, v4, v5 :: v_dual_mov_b32 v6, v1
//
//                          PARSED        COMPONENT         PARSED
// COMPONENT               OPERANDS     OPERAND INDEX    OPERAND INDEX
// -------------------------------------------------------------------
//                     "v_dual_add_f32"                        0
// v_dual_add_f32            v255          0 (DST)    -->      1
//                           v4            1 (SRC0)   -->      2
//                           v5            2 (SRC1)   -->      3
//                          "::"                               4
//                     "v_dual_mov_b32"                        5
// v_dual_mov_b32            v6            0 (DST)    -->      6
//                           v1            1 (SRC0)   -->      7
// -------------------------------------------------------------------
//
class ComponentLayout {
private:
  // All tables below are indexed by ComponentKind.

  // Regular MachineInstr/MCInst operands are ordered as follows:
  //   dst, src0 [, other src operands]
  // VOPD MachineInstr/MCInst operands are ordered as follows:
  //   dstX, dstY, src0X [, other OpX operands], src0Y [, other OpY operands]
  static constexpr unsigned MC_DST_IDX[] = {0, 0, 1};
  static constexpr unsigned FIRST_MC_SRC_IDX[] = {1, 2, 2 /* + OpX.MCSrcNum */};

  // Parsed operands of regular instructions are ordered as follows:
  //   Mnemo dst src0 [vsrc1 ...]
  // Parsed VOPD operands are ordered as follows:
  //   OpXMnemo dstX src0X [vsrc1X|imm vsrc1X|vsrc1X imm] '::'
  //   OpYMnemo dstY src0Y [vsrc1Y|imm vsrc1Y|vsrc1Y imm]
  static constexpr unsigned PARSED_DST_IDX[] = {1, 1,
                                                4 /* + OpX.ParsedSrcNum */};
  static constexpr unsigned FIRST_PARSED_SRC_IDX[] = {
      2, 2, 5 /* + OpX.ParsedSrcNum */};

  const ComponentKind Kind;
  // Properties of the preceding component. This stays default-constructed
  // (zero src operands) unless the layout is built for COMPONENT_Y.
  const ComponentProps PrevComp;

public:
  // Create layout for COMPONENT_X or SINGLE component.
  ComponentLayout(ComponentKind Kind) : Kind(Kind) {
    assert(Kind == ComponentKind::SINGLE || Kind == ComponentKind::COMPONENT_X);
  }

  // Create layout for COMPONENT_Y which depends on COMPONENT_X layout.
  ComponentLayout(const ComponentProps &OpXProps)
      : Kind(ComponentKind::COMPONENT_Y), PrevComp(OpXProps) {}

  // Return the index of dst operand in MCInst operands.
  unsigned getIndexOfDstInMCOperands() const { return MC_DST_IDX[Kind]; }

  // Return the index of the specified src operand in MCInst operands.
  unsigned getIndexOfSrcInMCOperands(unsigned CompSrcIdx) const {
    assert(CompSrcIdx < Component::MAX_SRC_NUM);
    // Skip the src operands of the preceding component, if any.
    const unsigned FirstSrcIdx =
        FIRST_MC_SRC_IDX[Kind] + PrevComp.getCompSrcOperandsNum();
    return FirstSrcIdx + CompSrcIdx;
  }

  // Return the index of dst operand in the parsed operands array.
  unsigned getIndexOfDstInParsedOperands() const {
    const unsigned PrevParsedSrcNum = PrevComp.getCompParsedSrcOperandsNum();
    return PARSED_DST_IDX[Kind] + PrevParsedSrcNum;
  }

  // Return the index of the specified src operand in the parsed operands array.
  unsigned getIndexOfSrcInParsedOperands(unsigned CompSrcIdx) const {
    assert(CompSrcIdx < Component::MAX_SRC_NUM);
    // Skip the parsed src operands of the preceding component, if any.
    const unsigned FirstSrcIdx =
        FIRST_PARSED_SRC_IDX[Kind] + PrevComp.getCompParsedSrcOperandsNum();
    return FirstSrcIdx + CompSrcIdx;
  }
};


// Layout and properties of VOPD components, combined in one object.
class ComponentInfo : public ComponentLayout, public ComponentProps {
public:
  // Create ComponentInfo for COMPONENT_X or SINGLE component. The properties
  // are taken from OpDesc; Kind selects the layout and defaults to SINGLE.
  // This constructor is intentionally implicit.
  ComponentInfo(const MCInstrDesc &OpDesc,
                ComponentKind Kind = ComponentKind::SINGLE)
      : ComponentLayout{Kind}, ComponentProps{OpDesc} {}

  // Create ComponentInfo for COMPONENT_Y. Its layout depends on the
  // properties of COMPONENT_X, passed as OpXProps.
  ComponentInfo(const MCInstrDesc &OpDesc, const ComponentProps &OpXProps)
      : ComponentLayout{OpXProps}, ComponentProps{OpDesc} {}

  // Map component operand index to parsed operand index.
  // Return 0 if the specified operand does not exist.
  unsigned getIndexInParsedOperands(unsigned CompOprIdx) const;
};


// Properties of VOPD instructions.
//
// Holds one ComponentInfo per component; slot 0 is filled from the X
// argument and slot 1 from the Y argument of the constructors.
class InstInfo {
private:
  const ComponentInfo CompInfo[COMPONENTS_NUM];

public:
  using RegIndices = std::array<unsigned, Component::MAX_OPR_NUM>;

  // Build from two instruction descriptions. Each description is converted
  // implicitly by ComponentInfo's constructor, whose Kind argument then takes
  // its default value ComponentKind::SINGLE.
  InstInfo(const MCInstrDesc &OpX, const MCInstrDesc &OpY)
      : CompInfo{OpX, OpY} {}

  // Build from two ready-made component descriptions.
  InstInfo(const ComponentInfo &OprInfoX, const ComponentInfo &OprInfoY)
      : CompInfo{OprInfoX, OprInfoY} {}

  // Return the description of component ComponentIdx, which must be less
  // than COMPONENTS_NUM.
  const ComponentInfo &operator[](size_t ComponentIdx) const {
    assert(ComponentIdx < COMPONENTS_NUM);
    return CompInfo[ComponentIdx];
  }

  // Check VOPD operands constraints.
  // GetRegIdx(Component, MCOperandIdx) must return a VGPR register index
  // for the specified component and MC operand. The callback must return 0
  // if the operand is not a register or not a VGPR.
  // If \p SkipSrc is set to true then constraints for source operands are not
  // checked.
  bool hasInvalidOperand(std::function<unsigned(unsigned, unsigned)> GetRegIdx,
                         bool SkipSrc = false) const {
    // GetRegIdx is a by-value parameter that is not used again here, so hand
    // it on by move instead of copying the std::function a second time.
    return getInvalidCompOperandIndex(std::move(GetRegIdx), SkipSrc)
        .has_value();
  }

  // Check VOPD operands constraints.
  // Return the index of an invalid component operand, if any.
  // If \p SkipSrc is set to true then constraints for source operands are not
  // checked.
  std::optional<unsigned> getInvalidCompOperandIndex(
      std::function<unsigned(unsigned, unsigned)> GetRegIdx,
      bool SkipSrc = false) const;

private:
  // NOTE(review): defined out of line; presumably collects the register
  // indices of all operands of component ComponentIdx by calling GetRegIdx
  // -- confirm.
  RegIndices
  getRegIndices(unsigned ComponentIdx,
                std::function<unsigned(unsigned, unsigned)> GetRegIdx) const;
};


} // namespace VOPD


/// NOTE(review): undocumented. Presumably returns the opcodes of the X and Y
/// components of \p VOPDOpcode as a pair -- confirm.
LLVM_READONLY
std::pair<unsigned, unsigned> getVOPDComponents(unsigned VOPDOpcode);

LLVM_READONLY
// Get properties of 2 single VOP1/VOP2 instructions
// used as components to create a VOPD instruction.
VOPD::InstInfo getVOPDInstInfo(const MCInstrDesc &OpX, const MCInstrDesc &OpY);

LLVM_READONLY
// Get properties of VOPD X and Y components.
VOPD::InstInfo
getVOPDInstInfo(unsigned VOPDOpcode, const MCInstrInfo *InstrInfo);

// NOTE(review): the predicates and mappings below are undocumented; their
// meaning is only suggested by their names -- confirm against the
// definitions.

LLVM_READONLY
bool isTrue16Inst(unsigned Opc);

/// \returns The FPType associated with \p Opc.
/// NOTE(review): which opcodes yield FPType::None is not visible here --
/// confirm.
LLVM_READONLY
FPType getFPDstSelType(unsigned Opc);

LLVM_READONLY
bool isInvalidSingleUseConsumerInst(unsigned Opc);

LLVM_READONLY
bool isInvalidSingleUseProducerInst(unsigned Opc);

// NOTE(review): unlike its neighbours, this predicate carries no
// LLVM_READONLY annotation; check whether that is intentional.
bool isDPMACCInstruction(unsigned Opc);

LLVM_READONLY
unsigned mapWMMA2AddrTo3AddrOpcode(unsigned Opc);

LLVM_READONLY
unsigned mapWMMA3AddrTo2AddrOpcode(unsigned Opc);

/// Initializes \p Header for the subtarget \p STI.
/// NOTE(review): presumably fills in default kernel code header values --
/// confirm against the definition.
void initDefaultAMDKernelCodeT(AMDGPUMCKernelCodeT &Header,
                               const MCSubtargetInfo *STI);


// Segment predicates for a global value.
// NOTE(review): undocumented. Presumably each one tests whether \p GV lives in
// the group / global / read-only segment respectively -- confirm against the
// definitions.
bool isGroupSegment(const GlobalValue *GV);
bool isGlobalSegment(const GlobalValue *GV);
bool isReadOnlySegment(const GlobalValue *GV);

/// \returns True if constants should be emitted to .text section for given
/// target triple \p TT, false otherwise.
bool shouldEmitConstantsToTextSection(const Triple &TT);


/// \returns Integer value requested using \p F's \p Name attribute.
///
/// \returns \p Default if attribute is not present.
///
/// \returns \p Default and emits error if requested value cannot be converted
/// to integer.
int getIntegerAttribute(const Function &F, StringRef Name, int Default);

/// \returns A pair of integer values requested using \p F's \p Name attribute
/// in "first[,second]" format ("second" is optional unless \p OnlyFirstRequired
/// is false).
///
/// \returns \p Default if attribute is not present.
///
/// \returns \p Default and emits error if one of the requested values cannot be
/// converted to integer, or \p OnlyFirstRequired is false and "second" value is
/// not present.
std::pair<unsigned, unsigned>
getIntegerPairAttribute(const Function &F, StringRef Name,
                        std::pair<unsigned, unsigned> Default,
                        bool OnlyFirstRequired = false);

/// \returns A pair of integer values requested using \p F's \p Name attribute
/// in "first[,second]" format ("second" is optional unless \p OnlyFirstRequired
/// is false). The second element of the pair is itself optional.
///
/// \returns \p std::nullopt if attribute is not present.
///
/// \returns \p std::nullopt and emits error if one of the requested values
/// cannot be converted to integer, or \p OnlyFirstRequired is false and
/// "second" value is not present.
std::optional<std::pair<unsigned, std::optional<unsigned>>>
getIntegerPairAttribute(const Function &F, StringRef Name,
                        bool OnlyFirstRequired = false);

/// \returns A vector of integer values requested using \p F's \p Name
/// attribute.
///
/// NOTE(review): the previous wording of this comment described a boolean
/// result ("true if exactly Size (>2) number of integers are found in the
/// attribute", "false if any error occurs"), which does not match the
/// SmallVector return type. Presumably the result holds \p Size (> 2)
/// integers, and \p DefaultVal (0 unless specified) is used when the attribute
/// is absent or cannot be parsed -- confirm against the definition.
SmallVector<unsigned> getIntegerVecAttribute(const Function &F, StringRef Name,
                                             unsigned Size,
                                             unsigned DefaultVal = 0);


/// Set of counter thresholds to wait for in an s_waitcnt-style instruction.
///
/// Every counter defaults to ~0u. Large values (including the maximum possible
/// integer) can be used to represent "don't care" waits.
struct Waitcnt {
  unsigned LoadCnt = ~0u;   // Corresponds to Vmcnt prior to gfx12.
  unsigned ExpCnt = ~0u;
  unsigned DsCnt = ~0u;     // Corresponds to LGKMcnt prior to gfx12.
  unsigned StoreCnt = ~0u;  // Corresponds to VScnt on gfx10/gfx11.
  unsigned SampleCnt = ~0u; // gfx12+ only.
  unsigned BvhCnt = ~0u;    // gfx12+ only.
  unsigned KmCnt = ~0u;     // gfx12+ only.

  Waitcnt() = default;

  // Pre-gfx12 constructor. The gfx12+-only counters keep their ~0u default
  // member initializers.
  Waitcnt(unsigned VmCnt, unsigned ExpCnt, unsigned LgkmCnt, unsigned VsCnt)
      : LoadCnt(VmCnt), ExpCnt(ExpCnt), DsCnt(LgkmCnt), StoreCnt(VsCnt) {}

  // gfx12+ constructor.
  Waitcnt(unsigned LoadCnt, unsigned ExpCnt, unsigned DsCnt, unsigned StoreCnt,
          unsigned SampleCnt, unsigned BvhCnt, unsigned KmCnt)
      : LoadCnt(LoadCnt), ExpCnt(ExpCnt), DsCnt(DsCnt), StoreCnt(StoreCnt),
        SampleCnt(SampleCnt), BvhCnt(BvhCnt), KmCnt(KmCnt) {}

  /// \returns true if any counter differs from ~0u.
  bool hasWait() const { return hasWaitStoreCnt() || hasWaitExceptStoreCnt(); }

  /// \returns true if any counter other than StoreCnt differs from ~0u.
  bool hasWaitExceptStoreCnt() const {
    constexpr unsigned NoWait = ~0u;
    const bool AllUnset = LoadCnt == NoWait && ExpCnt == NoWait &&
                          DsCnt == NoWait && SampleCnt == NoWait &&
                          BvhCnt == NoWait && KmCnt == NoWait;
    return !AllUnset;
  }

  /// \returns true if StoreCnt differs from ~0u.
  bool hasWaitStoreCnt() const { return StoreCnt != ~0u; }

  /// \returns A Waitcnt whose every counter is the minimum of this object's
  /// counter and the matching counter of \p Other.
  Waitcnt combined(const Waitcnt &Other) const {
    // Does the right thing provided self and Other are either both pre-gfx12
    // or both gfx12+.
    Waitcnt Merged;
    Merged.LoadCnt = std::min(LoadCnt, Other.LoadCnt);
    Merged.ExpCnt = std::min(ExpCnt, Other.ExpCnt);
    Merged.DsCnt = std::min(DsCnt, Other.DsCnt);
    Merged.StoreCnt = std::min(StoreCnt, Other.StoreCnt);
    Merged.SampleCnt = std::min(SampleCnt, Other.SampleCnt);
    Merged.BvhCnt = std::min(BvhCnt, Other.BvhCnt);
    Merged.KmCnt = std::min(KmCnt, Other.KmCnt);
    return Merged;
  }
};


// The following methods are only meaningful on targets that support

// S_WAITCNT.


/// \returns Vmcnt bit mask for given isa \p Version.

unsigned getVmcntBitMask(const IsaVersion &Version);


/// \returns Expcnt bit mask for given isa \p Version.

unsigned getExpcntBitMask(const IsaVersion &Version);


/// \returns Lgkmcnt bit mask for given isa \p Version.

unsigned getLgkmcntBitMask(const IsaVersion &Version);


/// \returns Waitcnt bit mask for given isa \p Version.

unsigned getWaitcntBitMask(const IsaVersion &Version);


/// \returns Decoded Vmcnt from given \p Waitcnt for given isa \p Version.

unsigned decodeVmcnt(const IsaVersion &Version, unsigned Waitcnt);


/// \returns Decoded Expcnt from given \p Waitcnt for given isa \p Version.

unsigned decodeExpcnt(const IsaVersion &Version, unsigned Waitcnt);


/// \returns Decoded Lgkmcnt from given \p Waitcnt for given isa \p Version.

unsigned decodeLgkmcnt(const IsaVersion &Version, unsigned Waitcnt);


/// Decodes Vmcnt, Expcnt and Lgkmcnt from given \p Waitcnt for given isa

/// \p Version, and writes decoded values into \p Vmcnt, \p Expcnt and

/// \p Lgkmcnt respectively. Should not be used on gfx12+, the instruction

/// which needs it is deprecated.

///

/// \details \p Vmcnt, \p Expcnt and \p Lgkmcnt are decoded as follows:

///     \p Vmcnt = \p Waitcnt[3:0]        (pre-gfx9)

///     \p Vmcnt = \p Waitcnt[15:14,3:0]  (gfx9,10)

///     \p Vmcnt = \p Waitcnt[15:10]      (gfx11)

///     \p Expcnt = \p Waitcnt[6:4]       (pre-gfx11)

///     \p Expcnt = \p Waitcnt[2:0]       (gfx11)

///     \p Lgkmcnt = \p Waitcnt[11:8]     (pre-gfx10)

///     \p Lgkmcnt = \p Waitcnt[13:8]     (gfx10)

///     \p Lgkmcnt = \p Waitcnt[9:4]      (gfx11)

///

void decodeWaitcnt(const IsaVersion &Version, unsigned Waitcnt,

                   unsigned &Vmcnt, unsigned &Expcnt, unsigned &Lgkmcnt);


Waitcnt decodeWaitcnt(const IsaVersion &Version, unsigned Encoded);


/// \returns \p Waitcnt with encoded \p Vmcnt for given isa \p Version.

unsigned encodeVmcnt(const IsaVersion &Version, unsigned Waitcnt,

                     unsigned Vmcnt);


/// \returns \p Waitcnt with encoded \p Expcnt for given isa \p Version.

unsigned encodeExpcnt(const IsaVersion &Version, unsigned Waitcnt,

                      unsigned Expcnt);


/// \returns \p Waitcnt with encoded \p Lgkmcnt for given isa \p Version.

unsigned encodeLgkmcnt(const IsaVersion &Version, unsigned Waitcnt,

                       unsigned Lgkmcnt);


/// Encodes \p Vmcnt, \p Expcnt and \p Lgkmcnt into Waitcnt for given isa

/// \p Version. Should not be used on gfx12+, the instruction which needs

/// it is deprecated.

///

/// \details \p Vmcnt, \p Expcnt and \p Lgkmcnt are encoded as follows:

///     Waitcnt[2:0]   = \p Expcnt      (gfx11)

///     Waitcnt[3:0]   = \p Vmcnt       (pre-gfx9)

///     Waitcnt[3:0]   = \p Vmcnt[3:0]  (gfx9,10)

///     Waitcnt[6:4]   = \p Expcnt      (pre-gfx11)

///     Waitcnt[9:4]   = \p Lgkmcnt     (gfx11)

///     Waitcnt[11:8]  = \p Lgkmcnt     (pre-gfx10)

///     Waitcnt[13:8]  = \p Lgkmcnt     (gfx10)

///     Waitcnt[15:10] = \p Vmcnt       (gfx11)

///     Waitcnt[15:14] = \p Vmcnt[5:4]  (gfx9,10)

///

/// \returns Waitcnt with encoded \p Vmcnt, \p Expcnt and \p Lgkmcnt for given

/// isa \p Version.

///

unsigned encodeWaitcnt(const IsaVersion &Version,

                       unsigned Vmcnt, unsigned Expcnt, unsigned Lgkmcnt);


unsigned encodeWaitcnt(const IsaVersion &Version, const Waitcnt &Decoded);


// The following methods are only meaningful on targets that support

// S_WAIT_*CNT, introduced with gfx12.


/// \returns Loadcnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support LOADcnt

unsigned getLoadcntBitMask(const IsaVersion &Version);


/// \returns Samplecnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support SAMPLEcnt

unsigned getSamplecntBitMask(const IsaVersion &Version);


/// \returns Bvhcnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support BVHcnt

unsigned getBvhcntBitMask(const IsaVersion &Version);


/// \returns Dscnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support DScnt

unsigned getDscntBitMask(const IsaVersion &Version);


/// \returns Kmcnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support KMcnt

unsigned getKmcntBitMask(const IsaVersion &Version);


/// \returns STOREcnt or VScnt bit mask for given isa \p Version.

/// Returns 0 for versions that do not support STOREcnt or VScnt.

/// STOREcnt and VScnt are the same counter, the name used

/// depends on the ISA version.

unsigned getStorecntBitMask(const IsaVersion &Version);


// The following are only meaningful on targets that support

// S_WAIT_LOADCNT_DSCNT and S_WAIT_STORECNT_DSCNT.


/// \returns Decoded Waitcnt structure from given \p LoadcntDscnt for given

/// isa \p Version.

Waitcnt decodeLoadcntDscnt(const IsaVersion &Version, unsigned LoadcntDscnt);


/// \returns Decoded Waitcnt structure from given \p StorecntDscnt for given

/// isa \p Version.

Waitcnt decodeStorecntDscnt(const IsaVersion &Version, unsigned StorecntDscnt);


/// \returns \p Loadcnt and \p Dscnt components of \p Decoded encoded as an

/// immediate that can be used with S_WAIT_LOADCNT_DSCNT for given isa

/// \p Version.

unsigned encodeLoadcntDscnt(const IsaVersion &Version, const Waitcnt &Decoded);


/// \returns \p Storecnt and \p Dscnt components of \p Decoded encoded as an

/// immediate that can be used with S_WAIT_STORECNT_DSCNT for given isa

/// \p Version.

unsigned encodeStorecntDscnt(const IsaVersion &Version, const Waitcnt &Decoded);


namespace Hwreg {


using HwregId = EncodingField<5, 0>;

using HwregOffset = EncodingField<10, 6>;


// Size field of the Hwreg encoding. The field is stored with a bias of one:
// encode() yields Value - 1 and decode() yields Encoded + 1.
// NOTE(review): the template arguments <15, 11, 32> presumably select bits
// [15:11] with a default value of 32 -- confirm against EncodingField.
struct HwregSize : EncodingField<15, 11, 32> {

  // Reuse the base class constructors unchanged.
  using EncodingField::EncodingField;

  // Encoded form is the held value minus one.
  constexpr uint64_t encode() const { return Value - 1; }

  // Inverse of encode(): adds the bias of one back to the encoded field.
  static ValueType decode(uint64_t Encoded) { return Encoded + 1; }

};


using HwregEncoding = EncodingFields<HwregId, HwregOffset, HwregSize>;


} // namespace Hwreg


namespace DepCtr {


int getDefaultDepCtrEncoding(const MCSubtargetInfo &STI);

int encodeDepCtr(const StringRef Name, int64_t Val, unsigned &UsedOprMask,

                 const MCSubtargetInfo &STI);

bool isSymbolicDepCtrEncoding(unsigned Code, bool &HasNonDefaultVal,

                              const MCSubtargetInfo &STI);

bool decodeDepCtr(unsigned Code, int &Id, StringRef &Name, unsigned &Val,

                  bool &IsDefault, const MCSubtargetInfo &STI);


/// \returns Decoded VaVdst from given immediate \p Encoded.

unsigned decodeFieldVaVdst(unsigned Encoded);


/// \returns Decoded VmVsrc from given immediate \p Encoded.

unsigned decodeFieldVmVsrc(unsigned Encoded);


/// \returns Decoded SaSdst from given immediate \p Encoded.

unsigned decodeFieldSaSdst(unsigned Encoded);


/// \returns \p VmVsrc as an encoded Depctr immediate.

unsigned encodeFieldVmVsrc(unsigned VmVsrc);


/// \returns \p Encoded combined with encoded \p VmVsrc.

unsigned encodeFieldVmVsrc(unsigned Encoded, unsigned VmVsrc);


/// \returns \p VaVdst as an encoded Depctr immediate.

unsigned encodeFieldVaVdst(unsigned VaVdst);


/// \returns \p Encoded combined with encoded \p VaVdst.

unsigned encodeFieldVaVdst(unsigned Encoded, unsigned VaVdst);


/// \returns \p SaSdst as an encoded Depctr immediate.

unsigned encodeFieldSaSdst(unsigned SaSdst);


/// \returns \p Encoded combined with encoded \p SaSdst.

unsigned encodeFieldSaSdst(unsigned Encoded, unsigned SaSdst);


} // namespace DepCtr


namespace Exp {


bool getTgtName(unsigned Id, StringRef &Name, int &Index);


LLVM_READONLY

unsigned getTgtId(const StringRef Name);


LLVM_READNONE

bool isSupportedTgtId(unsigned Id, const MCSubtargetInfo &STI);


} // namespace Exp


namespace MTBUFFormat {


LLVM_READNONE

int64_t encodeDfmtNfmt(unsigned Dfmt, unsigned Nfmt);


void decodeDfmtNfmt(unsigned Format, unsigned &Dfmt, unsigned &Nfmt);


int64_t getDfmt(const StringRef Name);


StringRef getDfmtName(unsigned Id);


int64_t getNfmt(const StringRef Name, const MCSubtargetInfo &STI);


StringRef getNfmtName(unsigned Id, const MCSubtargetInfo &STI);


bool isValidDfmtNfmt(unsigned Val, const MCSubtargetInfo &STI);


bool isValidNfmt(unsigned Val, const MCSubtargetInfo &STI);


int64_t getUnifiedFormat(const StringRef Name, const MCSubtargetInfo &STI);


StringRef getUnifiedFormatName(unsigned Id, const MCSubtargetInfo &STI);


bool isValidUnifiedFormat(unsigned Val, const MCSubtargetInfo &STI);


int64_t convertDfmtNfmt2Ufmt(unsigned Dfmt, unsigned Nfmt,

                             const MCSubtargetInfo &STI);


bool isValidFormatEncoding(unsigned Val, const MCSubtargetInfo &STI);


unsigned getDefaultFormatEncoding(const MCSubtargetInfo &STI);


} // namespace MTBUFFormat


namespace SendMsg {


LLVM_READNONE

bool isValidMsgId(int64_t MsgId, const MCSubtargetInfo &STI);


LLVM_READNONE

bool isValidMsgOp(int64_t MsgId, int64_t OpId, const MCSubtargetInfo &STI,

                  bool Strict = true);


LLVM_READNONE

bool isValidMsgStream(int64_t MsgId, int64_t OpId, int64_t StreamId,

                      const MCSubtargetInfo &STI, bool Strict = true);


LLVM_READNONE

bool msgRequiresOp(int64_t MsgId, const MCSubtargetInfo &STI);


LLVM_READNONE

bool msgSupportsStream(int64_t MsgId, int64_t OpId, const MCSubtargetInfo &STI);


void decodeMsg(unsigned Val, uint16_t &MsgId, uint16_t &OpId,

               uint16_t &StreamId, const MCSubtargetInfo &STI);


LLVM_READNONE

uint64_t encodeMsg(uint64_t MsgId,

                   uint64_t OpId,

                   uint64_t StreamId);


} // namespace SendMsg


unsigned getInitialPSInputAddr(const Function &F);


bool getHasColorExport(const Function &F);


bool getHasDepthExport(const Function &F);


LLVM_READNONE

bool isShader(CallingConv::ID CC);


LLVM_READNONE

bool isGraphics(CallingConv::ID CC);


LLVM_READNONE

bool isCompute(CallingConv::ID CC);


LLVM_READNONE

bool isEntryFunctionCC(CallingConv::ID CC);


// These functions are considered entrypoints into the current module, i.e. they

// are allowed to be called from outside the current module. This is different

// from isEntryFunctionCC, which is only true for functions that are entered by

// the hardware. Module entry points include all entry functions but also

// include functions that can be called from other functions inside or outside

// the current module. Module entry functions are allowed to allocate LDS.

LLVM_READNONE

bool isModuleEntryFunctionCC(CallingConv::ID CC);


LLVM_READNONE

bool isChainCC(CallingConv::ID CC);


bool isKernelCC(const Function *Func);


// FIXME: Remove this when calling conventions cleaned up
/// \returns true if \p CC is CallingConv::AMDGPU_KERNEL or
/// CallingConv::SPIR_KERNEL, false for every other calling convention.
LLVM_READNONE
inline bool isKernel(CallingConv::ID CC) {
  return CC == CallingConv::AMDGPU_KERNEL || CC == CallingConv::SPIR_KERNEL;
}


bool hasXNACK(const MCSubtargetInfo &STI);

bool hasSRAMECC(const MCSubtargetInfo &STI);

bool hasMIMG_R128(const MCSubtargetInfo &STI);

bool hasA16(const MCSubtargetInfo &STI);

bool hasG16(const MCSubtargetInfo &STI);

bool hasPackedD16(const MCSubtargetInfo &STI);

bool hasGDS(const MCSubtargetInfo &STI);

unsigned getNSAMaxSize(const MCSubtargetInfo &STI, bool HasSampler = false);

unsigned getMaxNumUserSGPRs(const MCSubtargetInfo &STI);


bool isSI(const MCSubtargetInfo &STI);

bool isCI(const MCSubtargetInfo &STI);

bool isVI(const MCSubtargetInfo &STI);

bool isGFX9(const MCSubtargetInfo &STI);

bool isGFX9_GFX10(const MCSubtargetInfo &STI);

bool isGFX9_GFX10_GFX11(const MCSubtargetInfo &STI);

bool isGFX8_GFX9_GFX10(const MCSubtargetInfo &STI);

bool isGFX8Plus(const MCSubtargetInfo &STI);

bool isGFX9Plus(const MCSubtargetInfo &STI);

bool isNotGFX9Plus(const MCSubtargetInfo &STI);

bool isGFX10(const MCSubtargetInfo &STI);

bool isGFX10_GFX11(const MCSubtargetInfo &STI);

bool isGFX10Plus(const MCSubtargetInfo &STI);

bool isNotGFX10Plus(const MCSubtargetInfo &STI);

bool isGFX10Before1030(const MCSubtargetInfo &STI);

bool isGFX11(const MCSubtargetInfo &STI);

bool isGFX11Plus(const MCSubtargetInfo &STI);

bool isGFX12(const MCSubtargetInfo &STI);

bool isGFX12Plus(const MCSubtargetInfo &STI);

bool isNotGFX12Plus(const MCSubtargetInfo &STI);

bool isNotGFX11Plus(const MCSubtargetInfo &STI);

bool isGCN3Encoding(const MCSubtargetInfo &STI);

bool isGFX10_AEncoding(const MCSubtargetInfo &STI);

bool isGFX10_BEncoding(const MCSubtargetInfo &STI);

bool hasGFX10_3Insts(const MCSubtargetInfo &STI);

bool isGFX10_3_GFX11(const MCSubtargetInfo &STI);

bool isGFX90A(const MCSubtargetInfo &STI);

bool isGFX940(const MCSubtargetInfo &STI);

bool hasArchitectedFlatScratch(const MCSubtargetInfo &STI);

bool hasMAIInsts(const MCSubtargetInfo &STI);

bool hasVOPD(const MCSubtargetInfo &STI);

bool hasDPPSrc1SGPR(const MCSubtargetInfo &STI);

int getTotalNumVGPRs(bool has90AInsts, int32_t ArgNumAGPR, int32_t ArgNumVGPR);

unsigned hasKernargPreload(const MCSubtargetInfo &STI);

bool hasSMRDSignedImmOffset(const MCSubtargetInfo &ST);


/// Is \p Reg a scalar register?

bool isSGPR(MCRegister Reg, const MCRegisterInfo *TRI);


/// \returns true if \p Reg occupies the high 16-bits of a 32-bit register.

bool isHi16Reg(MCRegister Reg, const MCRegisterInfo &MRI);


/// If \p Reg is a pseudo reg, return the correct hardware register given

/// \p STI otherwise return \p Reg.

MCRegister getMCReg(MCRegister Reg, const MCSubtargetInfo &STI);


/// Convert hardware register \p Reg to a pseudo register

LLVM_READNONE

MCRegister mc2PseudoReg(MCRegister Reg);


LLVM_READNONE

bool isInlineValue(unsigned Reg);


/// Is this an AMDGPU specific source operand? These include registers,

/// inline constants, literals and mandatory literals (KImm).

bool isSISrcOperand(const MCInstrDesc &Desc, unsigned OpNo);


/// Is this a KImm operand?

bool isKImmOperand(const MCInstrDesc &Desc, unsigned OpNo);


/// Is this a floating-point operand?

bool isSISrcFPOperand(const MCInstrDesc &Desc, unsigned OpNo);


/// Does this operand support only inlinable literals?

bool isSISrcInlinableOperand(const MCInstrDesc &Desc, unsigned OpNo);


/// Get the size in bits of a register from the register class with ID \p RCID.

unsigned getRegBitWidth(unsigned RCID);


/// Get the size in bits of a register from the register class \p RC.

unsigned getRegBitWidth(const MCRegisterClass &RC);


/// Get size of register operand

unsigned getRegOperandSize(const MCRegisterInfo *MRI, const MCInstrDesc &Desc,

                           unsigned OpNo);


/// \returns The size (2, 4 or 8) associated with the operand type recorded in
/// \p OpInfo. Operand types not listed below are treated as unreachable.
LLVM_READNONE
inline unsigned getOperandSize(const MCOperandInfo &OpInfo) {
  switch (OpInfo.OperandType) {
  // 16-bit scalar and packed 2x16 operand types.
  case AMDGPU::OPERAND_REG_IMM_INT16:
  case AMDGPU::OPERAND_REG_IMM_BF16:
  case AMDGPU::OPERAND_REG_IMM_FP16:
  case AMDGPU::OPERAND_REG_IMM_BF16_DEFERRED:
  case AMDGPU::OPERAND_REG_IMM_FP16_DEFERRED:
  case AMDGPU::OPERAND_REG_IMM_V2INT16:
  case AMDGPU::OPERAND_REG_IMM_V2BF16:
  case AMDGPU::OPERAND_REG_IMM_V2FP16:
  case AMDGPU::OPERAND_REG_INLINE_C_INT16:
  case AMDGPU::OPERAND_REG_INLINE_C_BF16:
  case AMDGPU::OPERAND_REG_INLINE_C_FP16:
  case AMDGPU::OPERAND_REG_INLINE_C_V2INT16:
  case AMDGPU::OPERAND_REG_INLINE_C_V2BF16:
  case AMDGPU::OPERAND_REG_INLINE_C_V2FP16:
  case AMDGPU::OPERAND_REG_INLINE_AC_INT16:
  case AMDGPU::OPERAND_REG_INLINE_AC_BF16:
  case AMDGPU::OPERAND_REG_INLINE_AC_FP16:
  case AMDGPU::OPERAND_REG_INLINE_AC_V2INT16:
  case AMDGPU::OPERAND_REG_INLINE_AC_V2BF16:
  case AMDGPU::OPERAND_REG_INLINE_AC_V2FP16:
    return 2;

  // 32-bit operand types, the 2x32 types, KImm literals and split barrier.
  case AMDGPU::OPERAND_REG_IMM_INT32:
  case AMDGPU::OPERAND_REG_IMM_FP32:
  case AMDGPU::OPERAND_REG_IMM_FP32_DEFERRED:
  case AMDGPU::OPERAND_REG_IMM_V2INT32:
  case AMDGPU::OPERAND_REG_IMM_V2FP32:
  case AMDGPU::OPERAND_REG_INLINE_C_INT32:
  case AMDGPU::OPERAND_REG_INLINE_C_FP32:
  case AMDGPU::OPERAND_REG_INLINE_C_V2INT32:
  case AMDGPU::OPERAND_REG_INLINE_C_V2FP32:
  case AMDGPU::OPERAND_REG_INLINE_AC_INT32:
  case AMDGPU::OPERAND_REG_INLINE_AC_FP32:
  case AMDGPU::OPERAND_KIMM32:
  case AMDGPU::OPERAND_KIMM16: // mandatory literal is always size 4
  case AMDGPU::OPERAND_INLINE_SPLIT_BARRIER_INT32:
    return 4;

  // 64-bit operand types.
  case AMDGPU::OPERAND_REG_IMM_INT64:
  case AMDGPU::OPERAND_REG_IMM_FP64:
  case AMDGPU::OPERAND_REG_INLINE_C_INT64:
  case AMDGPU::OPERAND_REG_INLINE_C_FP64:
  case AMDGPU::OPERAND_REG_INLINE_AC_FP64:
    return 8;

  default:
    llvm_unreachable("unhandled operand type");
  }
}


/// \returns The operand size of operand number \p OpNo of \p Desc, as computed
/// by the MCOperandInfo overload of getOperandSize.
LLVM_READNONE
inline unsigned getOperandSize(const MCInstrDesc &Desc, unsigned OpNo) {
  const MCOperandInfo &SelectedOperand = Desc.operands()[OpNo];
  return getOperandSize(SelectedOperand);
}


/// Is this literal inlinable, and not one of the values intended for floating

/// point values.

LLVM_READNONE

inline bool isInlinableIntLiteral(int64_t Literal) {
  // Accepted values form the closed interval [-16, 64].
  constexpr int64_t LowestInlinable = -16;
  constexpr int64_t HighestInlinable = 64;
  return LowestInlinable <= Literal && Literal <= HighestInlinable;
}


/// Is this literal inlinable

LLVM_READNONE

bool isInlinableLiteral64(int64_t Literal, bool HasInv2Pi);


LLVM_READNONE

bool isInlinableLiteral32(int32_t Literal, bool HasInv2Pi);


LLVM_READNONE

bool isInlinableLiteralBF16(int16_t Literal, bool HasInv2Pi);


LLVM_READNONE

bool isInlinableLiteralFP16(int16_t Literal, bool HasInv2Pi);


LLVM_READNONE

bool isInlinableLiteralBF16(int16_t Literal, bool HasInv2Pi);


LLVM_READNONE

bool isInlinableLiteralI16(int32_t Literal, bool HasInv2Pi);


LLVM_READNONE

std::optional<unsigned> getInlineEncodingV2I16(uint32_t Literal);


LLVM_READNONE

std::optional<unsigned> getInlineEncodingV2BF16(uint32_t Literal);


LLVM_READNONE

std::optional<unsigned> getInlineEncodingV2F16(uint32_t Literal);


LLVM_READNONE

bool isInlinableLiteralV216(uint32_t Literal, uint8_t OpType);


LLVM_READNONE

bool isInlinableLiteralV2I16(uint32_t Literal);


LLVM_READNONE

bool isInlinableLiteralV2BF16(uint32_t Literal);


LLVM_READNONE

bool isInlinableLiteralV2F16(uint32_t Literal);


LLVM_READNONE

bool isValid32BitLiteral(uint64_t Val, bool IsFP64);


bool isArgPassedInSGPR(const Argument *Arg);


bool isArgPassedInSGPR(const CallBase *CB, unsigned ArgNo);


LLVM_READONLY

bool isLegalSMRDEncodedUnsignedOffset(const MCSubtargetInfo &ST,

                                      int64_t EncodedOffset);


LLVM_READONLY

bool isLegalSMRDEncodedSignedOffset(const MCSubtargetInfo &ST,

                                    int64_t EncodedOffset,

                                    bool IsBuffer);


/// Convert \p ByteOffset to dwords if the subtarget uses dword SMRD immediate

/// offsets.

uint64_t convertSMRDOffsetUnits(const MCSubtargetInfo &ST, uint64_t ByteOffset);


/// \returns The encoding that will be used for \p ByteOffset in the

/// SMRD offset field, or std::nullopt if it won't fit. On GFX9 and GFX10

/// S_LOAD instructions have a signed offset, on other subtargets it is

/// unsigned. S_BUFFER has an unsigned offset for all subtargets.

std::optional<int64_t> getSMRDEncodedOffset(const MCSubtargetInfo &ST,

                                            int64_t ByteOffset, bool IsBuffer,

                                            bool HasSOffset = false);


/// \return The encoding that can be used for a 32-bit literal offset in an SMRD

/// instruction. This is only useful on CI.

std::optional<int64_t> getSMRDEncodedLiteralOffset32(const MCSubtargetInfo &ST,

                                                     int64_t ByteOffset);


/// For pre-GFX12 FLAT instructions the offset must be positive;

/// MSB is ignored and forced to zero.

///

/// \return The number of bits available for the signed offset field in flat

/// instructions. Note that some forms of the instruction disallow negative

/// offsets.

unsigned getNumFlatOffsetBits(const MCSubtargetInfo &ST);


/// \returns true if this offset is small enough to fit in the SMRD

/// offset field.  \p ByteOffset should be the offset in bytes and

/// not the encoded offset.

bool isLegalSMRDImmOffset(const MCSubtargetInfo &ST, int64_t ByteOffset);


/// \returns true if \p DC lies in the inclusive range
/// [DPP::ROW_NEWBCAST_FIRST, DPP::ROW_NEWBCAST_LAST].
LLVM_READNONE
inline bool isLegalDPALU_DPPControl(unsigned DC) {
  const bool BelowRange = DC < DPP::ROW_NEWBCAST_FIRST;
  const bool AboveRange = DC > DPP::ROW_NEWBCAST_LAST;
  return !BelowRange && !AboveRange;
}


/// \returns true if an instruction may have a 64-bit VGPR operand.

bool hasAny64BitVGPROperands(const MCInstrDesc &OpDesc);


/// \returns true if an instruction is a DP ALU DPP.

bool isDPALU_DPP(const MCInstrDesc &OpDesc);


/// \returns true if the intrinsic is divergent

bool isIntrinsicSourceOfDivergence(unsigned IntrID);


/// \returns true if the intrinsic is uniform

bool isIntrinsicAlwaysUniform(unsigned IntrID);


/// \returns lds block size in terms of dwords.

/// This is used to calculate the lds size encoded for PAL metadata 3.0+ which

/// must be defined in terms of bytes.

unsigned getLdsDwGranularity(const MCSubtargetInfo &ST);


} // end namespace AMDGPU


raw_ostream &operator<<(raw_ostream &OS,

                        const AMDGPU::IsaInfo::TargetIDSetting S);


} // end namespace llvm


#endif // LLVM_LIB_TARGET_AMDGPU_UTILS_AMDGPUBASEINFO_H

MRI
unsigned const MachineRegisterInfo * MRI
Definition: AArch64AdvSIMDScalarPass.cpp:105

AMDGPUSubtarget.h
Base class for AMDGPU specific classes of TargetSubtarget.

Alignment.h

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

CallingConv.h

LLVM_READNONE
#define LLVM_READNONE
Definition: Compiler.h:299

LLVM_READONLY
#define LLVM_READONLY
Definition: Compiler.h:306

Align
uint64_t Align
Definition: ELFObjHandler.cpp:82

Name
std::string Name
Definition: ELFObjHandler.cpp:77

Index
uint32_t Index
Definition: ELFObjHandler.cpp:83

Size
uint64_t Size
Definition: ELFObjHandler.cpp:81

Module.h
Module.h This file contains the declarations for the Module class.

InstrTypes.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

G
#define G(x, y, z)
Definition: MD5.cpp:56

TRI
unsigned const TargetRegisterInfo * TRI
Definition: MachineSink.cpp:2029

Reg
unsigned Reg
Definition: MachineSink.cpp:2028

CC
auto CC
Definition: RISCVRedundantCopyElimination.cpp:79

SIDefines.h

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

DefaultVal
unsigned unsigned DefaultVal
Definition: SPIRVModuleAnalysis.cpp:64

OS
raw_pwrite_stream & OS
Definition: SampleProfWriter.cpp:51

llvm::AMDGPUSubtarget::Generation
Generation
Definition: AMDGPUSubtarget.h:31

llvm::AMDGPU::IsaInfo::AMDGPUTargetID
Definition: AMDGPUBaseInfo.h:140

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isSramEccSupported
bool isSramEccSupported() const
Definition: AMDGPUBaseInfo.h:180

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::setTargetIDFromFeaturesString
void setTargetIDFromFeaturesString(StringRef FS)
Definition: AMDGPUBaseInfo.cpp:815

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::setXnackSetting
void setXnackSetting(TargetIDSetting NewXnackSetting)
Sets xnack setting to NewXnackSetting.
Definition: AMDGPUBaseInfo.h:175

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isSramEccOnOrAny
bool isSramEccOnOrAny() const
Definition: AMDGPUBaseInfo.h:185

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::getXnackSetting
TargetIDSetting getXnackSetting() const
Definition: AMDGPUBaseInfo.h:170

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isXnackOnOrAny
bool isXnackOnOrAny() const
Definition: AMDGPUBaseInfo.h:156

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isXnackOnOrOff
bool isXnackOnOrOff() const
Definition: AMDGPUBaseInfo.h:163

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isXnackSupported
bool isXnackSupported() const
Definition: AMDGPUBaseInfo.h:151

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::setTargetIDFromTargetIDStream
void setTargetIDFromTargetIDStream(StringRef TargetID)
Definition: AMDGPUBaseInfo.cpp:883

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::~AMDGPUTargetID
~AMDGPUTargetID()=default

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::setSramEccSetting
void setSramEccSetting(TargetIDSetting NewSramEccSetting)
Sets sramecc setting to NewSramEccSetting.
Definition: AMDGPUBaseInfo.h:204

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::isSramEccOnOrOff
bool isSramEccOnOrOff() const
Definition: AMDGPUBaseInfo.h:192

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::toString
std::string toString() const
Definition: AMDGPUBaseInfo.cpp:895

llvm::AMDGPU::IsaInfo::AMDGPUTargetID::getSramEccSetting
TargetIDSetting getSramEccSetting() const
Definition: AMDGPUBaseInfo.h:199

llvm::AMDGPU::VOPD::ComponentInfo
Definition: AMDGPUBaseInfo.h:811

llvm::AMDGPU::VOPD::ComponentInfo::getIndexInParsedOperands
unsigned getIndexInParsedOperands(unsigned CompOprIdx) const
Definition: AMDGPUBaseInfo.cpp:727

llvm::AMDGPU::VOPD::ComponentInfo::ComponentInfo
ComponentInfo(const MCInstrDesc &OpDesc, ComponentKind Kind=ComponentKind::SINGLE)
Definition: AMDGPUBaseInfo.h:814

llvm::AMDGPU::VOPD::ComponentInfo::ComponentInfo
ComponentInfo(const MCInstrDesc &OpDesc, const ComponentProps &OpXProps)
Definition: AMDGPUBaseInfo.h:819

llvm::AMDGPU::VOPD::ComponentLayout
Definition: AMDGPUBaseInfo.h:745

llvm::AMDGPU::VOPD::ComponentLayout::getIndexOfDstInMCOperands
unsigned getIndexOfDstInMCOperands() const
Definition: AMDGPUBaseInfo.h:782

llvm::AMDGPU::VOPD::ComponentLayout::getIndexOfSrcInMCOperands
unsigned getIndexOfSrcInMCOperands(unsigned CompSrcIdx) const
Definition: AMDGPUBaseInfo.h:785

llvm::AMDGPU::VOPD::ComponentLayout::getIndexOfDstInParsedOperands
unsigned getIndexOfDstInParsedOperands() const
Definition: AMDGPUBaseInfo.h:791

llvm::AMDGPU::VOPD::ComponentLayout::ComponentLayout
ComponentLayout(const ComponentProps &OpXProps)
Definition: AMDGPUBaseInfo.h:777

llvm::AMDGPU::VOPD::ComponentLayout::getIndexOfSrcInParsedOperands
unsigned getIndexOfSrcInParsedOperands(unsigned CompSrcIdx) const
Definition: AMDGPUBaseInfo.h:796

llvm::AMDGPU::VOPD::ComponentLayout::ComponentLayout
ComponentLayout(ComponentKind Kind)
Definition: AMDGPUBaseInfo.h:772

llvm::AMDGPU::VOPD::ComponentProps
Definition: AMDGPUBaseInfo.h:663

llvm::AMDGPU::VOPD::ComponentProps::hasMandatoryLiteral
bool hasMandatoryLiteral() const
Definition: AMDGPUBaseInfo.h:682

llvm::AMDGPU::VOPD::ComponentProps::hasRegSrcOperand
bool hasRegSrcOperand(unsigned CompSrcIdx) const
Definition: AMDGPUBaseInfo.h:693

llvm::AMDGPU::VOPD::ComponentProps::hasSrc2Acc
bool hasSrc2Acc() const
Definition: AMDGPUBaseInfo.h:699

llvm::AMDGPU::VOPD::ComponentProps::ComponentProps
ComponentProps()=default

llvm::AMDGPU::VOPD::ComponentProps::getCompSrcOperandsNum
unsigned getCompSrcOperandsNum() const
Definition: AMDGPUBaseInfo.h:674

llvm::AMDGPU::VOPD::ComponentProps::getMandatoryLiteralCompOperandIndex
unsigned getMandatoryLiteralCompOperandIndex() const
Definition: AMDGPUBaseInfo.h:686

llvm::AMDGPU::VOPD::ComponentProps::getCompParsedSrcOperandsNum
unsigned getCompParsedSrcOperandsNum() const
Definition: AMDGPUBaseInfo.h:677

llvm::AMDGPU::VOPD::InstInfo
Definition: AMDGPUBaseInfo.h:828

llvm::AMDGPU::VOPD::InstInfo::InstInfo
InstInfo(const ComponentInfo &OprInfoX, const ComponentInfo &OprInfoY)
Definition: AMDGPUBaseInfo.h:838

llvm::AMDGPU::VOPD::InstInfo::hasInvalidOperand
bool hasInvalidOperand(std::function< unsigned(unsigned, unsigned)> GetRegIdx, bool SkipSrc=false) const
Definition: AMDGPUBaseInfo.h:852

llvm::AMDGPU::VOPD::InstInfo::operator[]
const ComponentInfo & operator[](size_t ComponentIdx) const
Definition: AMDGPUBaseInfo.h:841

llvm::AMDGPU::VOPD::InstInfo::InstInfo
InstInfo(const MCInstrDesc &OpX, const MCInstrDesc &OpY)
Definition: AMDGPUBaseInfo.h:835

llvm::AMDGPU::VOPD::InstInfo::getInvalidCompOperandIndex
std::optional< unsigned > getInvalidCompOperandIndex(std::function< unsigned(unsigned, unsigned)> GetRegIdx, bool SkipSrc=false) const
Definition: AMDGPUBaseInfo.cpp:741

llvm::AMDGPU::VOPD::InstInfo::RegIndices
std::array< unsigned, Component::MAX_OPR_NUM > RegIndices
Definition: AMDGPUBaseInfo.h:833

llvm::Argument
This class represents an incoming formal argument to a Function.
Definition: Argument.h:31

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition: InstrTypes.h:1112

llvm::Function
Definition: Function.h:63

llvm::GlobalValue
Definition: GlobalValue.h:48

llvm::MCInstrDesc
Describe properties that are true of each instruction in the target description file.
Definition: MCInstrDesc.h:198

llvm::MCInstrInfo
Interface to description of machine instruction set.
Definition: MCInstrInfo.h:26

llvm::MCOperandInfo
This holds information about one operand of a machine instruction, indicating the register class for ...
Definition: MCInstrDesc.h:85

llvm::MCOperandInfo::OperandType
uint8_t OperandType
Information about the type of the operand.
Definition: MCInstrDesc.h:97

llvm::MCRegisterClass
MCRegisterClass - Base class of TargetRegisterClass.
Definition: MCRegisterInfo.h:35

llvm::MCRegisterInfo
MCRegisterInfo base class - We assume that the target defines a static array of MCRegisterDesc object...
Definition: MCRegisterInfo.h:149

llvm::MCRegister
Wrapper class representing physical registers. Should be passed by value.
Definition: MCRegister.h:33

llvm::MCSubtargetInfo
Generic base class for all target subtargets.
Definition: MCSubtargetInfo.h:76

llvm::Module
A Module instance is used to store all the information related to an LLVM module.
Definition: Module.h:65

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:51

llvm::Triple
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:44

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

uint16_t

uint32_t

uint64_t

uint8_t

unsigned

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::AMDGPU::DPP::ROW_NEWBCAST_LAST
@ ROW_NEWBCAST_LAST
Definition: SIDefines.h:974

llvm::AMDGPU::DPP::ROW_NEWBCAST_FIRST
@ ROW_NEWBCAST_FIRST
Definition: SIDefines.h:973

llvm::AMDGPU::DepCtr::decodeDepCtr
bool decodeDepCtr(unsigned Code, int &Id, StringRef &Name, unsigned &Val, bool &IsDefault, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1698

llvm::AMDGPU::DepCtr::encodeFieldVaVdst
unsigned encodeFieldVaVdst(unsigned Encoded, unsigned VaVdst)
Definition: AMDGPUBaseInfo.cpp:1730

llvm::AMDGPU::DepCtr::decodeFieldSaSdst
unsigned decodeFieldSaSdst(unsigned Encoded)
Definition: AMDGPUBaseInfo.cpp:1718

llvm::AMDGPU::DepCtr::encodeFieldVmVsrc
unsigned encodeFieldVmVsrc(unsigned Encoded, unsigned VmVsrc)
Definition: AMDGPUBaseInfo.cpp:1722

llvm::AMDGPU::DepCtr::encodeDepCtr
int encodeDepCtr(const StringRef Name, int64_t Val, unsigned &UsedOprMask, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1704

llvm::AMDGPU::DepCtr::encodeFieldSaSdst
unsigned encodeFieldSaSdst(unsigned Encoded, unsigned SaSdst)
Definition: AMDGPUBaseInfo.cpp:1738

llvm::AMDGPU::DepCtr::isSymbolicDepCtrEncoding
bool isSymbolicDepCtrEncoding(unsigned Code, bool &HasNonDefaultVal, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1692

llvm::AMDGPU::DepCtr::decodeFieldVaVdst
unsigned decodeFieldVaVdst(unsigned Encoded)
Definition: AMDGPUBaseInfo.cpp:1714

llvm::AMDGPU::DepCtr::getDefaultDepCtrEncoding
int getDefaultDepCtrEncoding(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1685

llvm::AMDGPU::DepCtr::decodeFieldVmVsrc
unsigned decodeFieldVmVsrc(unsigned Encoded)
Definition: AMDGPUBaseInfo.cpp:1710

llvm::AMDGPU::Exp::isSupportedTgtId
bool isSupportedTgtId(unsigned Id, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1804

llvm::AMDGPU::Exp::getTgtName
bool getTgtName(unsigned Id, StringRef &Name, int &Index)
Definition: AMDGPUBaseInfo.cpp:1770

llvm::AMDGPU::Exp::getTgtId
unsigned getTgtId(const StringRef Name)
Definition: AMDGPUBaseInfo.cpp:1781

llvm::AMDGPU::GenericVersion::GFX9_4
static constexpr unsigned GFX9_4
Definition: AMDGPUBaseInfo.h:49

llvm::AMDGPU::GenericVersion::GFX10_1
static constexpr unsigned GFX10_1
Definition: AMDGPUBaseInfo.h:50

llvm::AMDGPU::GenericVersion::GFX10_3
static constexpr unsigned GFX10_3
Definition: AMDGPUBaseInfo.h:51

llvm::AMDGPU::GenericVersion::GFX11
static constexpr unsigned GFX11
Definition: AMDGPUBaseInfo.h:52

llvm::AMDGPU::GenericVersion::GFX9
static constexpr unsigned GFX9
Definition: AMDGPUBaseInfo.h:48

llvm::AMDGPU::GenericVersion::GFX12
static constexpr unsigned GFX12
Definition: AMDGPUBaseInfo.h:53

llvm::AMDGPU::IsaInfo::getVGPREncodingGranule
unsigned getVGPREncodingGranule(const MCSubtargetInfo *STI, std::optional< bool > EnableWavefrontSize32)
Definition: AMDGPUBaseInfo.cpp:1157

llvm::AMDGPU::IsaInfo::getTotalNumVGPRs
unsigned getTotalNumVGPRs(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1169

llvm::AMDGPU::IsaInfo::getWavesPerEUForWorkGroup
unsigned getWavesPerEUForWorkGroup(const MCSubtargetInfo *STI, unsigned FlatWorkGroupSize)
Definition: AMDGPUBaseInfo.cpp:1011

llvm::AMDGPU::IsaInfo::getWavefrontSize
unsigned getWavefrontSize(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:937

llvm::AMDGPU::IsaInfo::getMaxWorkGroupsPerCU
unsigned getMaxWorkGroupsPerCU(const MCSubtargetInfo *STI, unsigned FlatWorkGroupSize)
Definition: AMDGPUBaseInfo.cpp:979

llvm::AMDGPU::IsaInfo::getMaxFlatWorkGroupSize
unsigned getMaxFlatWorkGroupSize(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1021

llvm::AMDGPU::IsaInfo::getMaxWavesPerEU
unsigned getMaxWavesPerEU(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1002

llvm::AMDGPU::IsaInfo::getWavesPerWorkGroup
unsigned getWavesPerWorkGroup(const MCSubtargetInfo *STI, unsigned FlatWorkGroupSize)
Definition: AMDGPUBaseInfo.cpp:1026

llvm::AMDGPU::IsaInfo::getNumExtraSGPRs
unsigned getNumExtraSGPRs(const MCSubtargetInfo *STI, bool VCCUsed, bool FlatScrUsed, bool XNACKUsed)
Definition: AMDGPUBaseInfo.cpp:1097

llvm::AMDGPU::IsaInfo::getSGPREncodingGranule
unsigned getSGPREncodingGranule(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1040

llvm::AMDGPU::IsaInfo::getLocalMemorySize
unsigned getLocalMemorySize(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:946

llvm::AMDGPU::IsaInfo::getAddressableLocalMemorySize
unsigned getAddressableLocalMemorySize(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:958

llvm::AMDGPU::IsaInfo::getMinNumVGPRs
unsigned getMinNumVGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU)
Definition: AMDGPUBaseInfo.cpp:1231

llvm::AMDGPU::IsaInfo::getEUsPerCU
unsigned getEUsPerCU(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:968

llvm::AMDGPU::IsaInfo::TRAP_NUM_SGPRS
@ TRAP_NUM_SGPRS
Definition: AMDGPUBaseInfo.h:130

llvm::AMDGPU::IsaInfo::FIXED_NUM_SGPRS_FOR_INIT_BUG
@ FIXED_NUM_SGPRS_FOR_INIT_BUG
Definition: AMDGPUBaseInfo.h:129

llvm::AMDGPU::IsaInfo::getAddressableNumSGPRs
unsigned getAddressableNumSGPRs(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1051

llvm::AMDGPU::IsaInfo::getAddressableNumVGPRs
unsigned getAddressableNumVGPRs(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1182

llvm::AMDGPU::IsaInfo::getMinNumSGPRs
unsigned getMinNumSGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU)
Definition: AMDGPUBaseInfo.cpp:1063

llvm::AMDGPU::IsaInfo::getMinFlatWorkGroupSize
unsigned getMinFlatWorkGroupSize(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1017

llvm::AMDGPU::IsaInfo::getMaxNumSGPRs
unsigned getMaxNumSGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU, bool Addressable)
Definition: AMDGPUBaseInfo.cpp:1080

llvm::AMDGPU::IsaInfo::getNumSGPRBlocks
unsigned getNumSGPRBlocks(const MCSubtargetInfo *STI, unsigned NumSGPRs)
Definition: AMDGPUBaseInfo.cpp:1133

llvm::AMDGPU::IsaInfo::getMinWavesPerEU
unsigned getMinWavesPerEU(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:998

llvm::AMDGPU::IsaInfo::getSGPRAllocGranule
unsigned getSGPRAllocGranule(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1031

llvm::AMDGPU::IsaInfo::getNumWavesPerEUWithNumVGPRs
unsigned getNumWavesPerEUWithNumVGPRs(const MCSubtargetInfo *STI, unsigned NumVGPRs)
Definition: AMDGPUBaseInfo.cpp:1188

llvm::AMDGPU::IsaInfo::TargetIDSetting
TargetIDSetting
Definition: AMDGPUBaseInfo.h:133

llvm::AMDGPU::IsaInfo::TargetIDSetting::On
@ On

llvm::AMDGPU::IsaInfo::TargetIDSetting::Unsupported
@ Unsupported

llvm::AMDGPU::IsaInfo::TargetIDSetting::Off
@ Off

llvm::AMDGPU::IsaInfo::TargetIDSetting::Any
@ Any

llvm::AMDGPU::IsaInfo::getMaxNumVGPRs
unsigned getMaxNumVGPRs(const MCSubtargetInfo *STI, unsigned WavesPerEU)
Definition: AMDGPUBaseInfo.cpp:1255

llvm::AMDGPU::IsaInfo::getEncodedNumVGPRBlocks
unsigned getEncodedNumVGPRBlocks(const MCSubtargetInfo *STI, unsigned NumVGPRs, std::optional< bool > EnableWavefrontSize32)
Definition: AMDGPUBaseInfo.cpp:1264

llvm::AMDGPU::IsaInfo::getOccupancyWithNumSGPRs
unsigned getOccupancyWithNumSGPRs(unsigned SGPRs, unsigned MaxWaves, AMDGPUSubtarget::Generation Gen)
Definition: AMDGPUBaseInfo.cpp:1204

llvm::AMDGPU::IsaInfo::getVGPRAllocGranule
unsigned getVGPRAllocGranule(const MCSubtargetInfo *STI, std::optional< bool > EnableWavefrontSize32)
Definition: AMDGPUBaseInfo.cpp:1139

llvm::AMDGPU::IsaInfo::getAddressableNumArchVGPRs
unsigned getAddressableNumArchVGPRs(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1180

llvm::AMDGPU::IsaInfo::getAllocatedNumVGPRBlocks
unsigned getAllocatedNumVGPRBlocks(const MCSubtargetInfo *STI, unsigned NumVGPRs, std::optional< bool > EnableWavefrontSize32)
Definition: AMDGPUBaseInfo.cpp:1271

llvm::AMDGPU::IsaInfo::getTotalNumSGPRs
unsigned getTotalNumSGPRs(const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1044

llvm::AMDGPU::MTBUFFormat::isValidUnifiedFormat
bool isValidUnifiedFormat(unsigned Id, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1905

llvm::AMDGPU::MTBUFFormat::getDefaultFormatEncoding
unsigned getDefaultFormatEncoding(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1930

llvm::AMDGPU::MTBUFFormat::getUnifiedFormatName
StringRef getUnifiedFormatName(unsigned Id, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1899

llvm::AMDGPU::MTBUFFormat::isValidNfmt
bool isValidNfmt(unsigned Id, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1871

llvm::AMDGPU::MTBUFFormat::isValidDfmtNfmt
bool isValidDfmtNfmt(unsigned Id, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1864

llvm::AMDGPU::MTBUFFormat::convertDfmtNfmt2Ufmt
int64_t convertDfmtNfmt2Ufmt(unsigned Dfmt, unsigned Nfmt, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1909

llvm::AMDGPU::MTBUFFormat::getDfmtName
StringRef getDfmtName(unsigned Id)
Definition: AMDGPUBaseInfo.cpp:1837

llvm::AMDGPU::MTBUFFormat::encodeDfmtNfmt
int64_t encodeDfmtNfmt(unsigned Dfmt, unsigned Nfmt)
Definition: AMDGPUBaseInfo.cpp:1875

llvm::AMDGPU::MTBUFFormat::getUnifiedFormat
int64_t getUnifiedFormat(const StringRef Name, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1884

llvm::AMDGPU::MTBUFFormat::isValidFormatEncoding
bool isValidFormatEncoding(unsigned Val, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1926

llvm::AMDGPU::MTBUFFormat::getNfmtName
StringRef getNfmtName(unsigned Id, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1859

llvm::AMDGPU::MTBUFFormat::getNfmt
int64_t getNfmt(const StringRef Name, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1850

llvm::AMDGPU::MTBUFFormat::getDfmt
int64_t getDfmt(const StringRef Name)
Definition: AMDGPUBaseInfo.cpp:1829

llvm::AMDGPU::MTBUFFormat::decodeDfmtNfmt
void decodeDfmtNfmt(unsigned Format, unsigned &Dfmt, unsigned &Nfmt)
Definition: AMDGPUBaseInfo.cpp:1879

llvm::AMDGPU::SendMsg::encodeMsg
uint64_t encodeMsg(uint64_t MsgId, uint64_t OpId, uint64_t StreamId)
Definition: AMDGPUBaseInfo.cpp:2014

llvm::AMDGPU::SendMsg::StreamId
StreamId
Definition: SIDefines.h:491

llvm::AMDGPU::SendMsg::msgSupportsStream
bool msgSupportsStream(int64_t MsgId, int64_t OpId, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1995

llvm::AMDGPU::SendMsg::decodeMsg
void decodeMsg(unsigned Val, uint16_t &MsgId, uint16_t &OpId, uint16_t &StreamId, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2002

llvm::AMDGPU::SendMsg::isValidMsgId
bool isValidMsgId(int64_t MsgId, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1948

llvm::AMDGPU::SendMsg::isValidMsgStream
bool isValidMsgStream(int64_t MsgId, int64_t OpId, int64_t StreamId, const MCSubtargetInfo &STI, bool Strict)
Definition: AMDGPUBaseInfo.cpp:1969

llvm::AMDGPU::SendMsg::msgRequiresOp
bool msgRequiresOp(int64_t MsgId, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:1989

llvm::AMDGPU::SendMsg::isValidMsgOp
bool isValidMsgOp(int64_t MsgId, int64_t OpId, const MCSubtargetInfo &STI, bool Strict)
Definition: AMDGPUBaseInfo.cpp:1952

llvm::AMDGPU::VOPD::VOPD_VGPR_BANK_MASKS
constexpr unsigned VOPD_VGPR_BANK_MASKS[]
Definition: AMDGPUBaseInfo.h:656

llvm::AMDGPU::VOPD::COMPONENTS_NUM
constexpr unsigned COMPONENTS_NUM
Definition: AMDGPUBaseInfo.h:660

llvm::AMDGPU::VOPD::ComponentIndex
ComponentIndex
Definition: AMDGPUBaseInfo.h:658

llvm::AMDGPU::VOPD::X
@ X
Definition: AMDGPUBaseInfo.h:658

llvm::AMDGPU::VOPD::Y
@ Y
Definition: AMDGPUBaseInfo.h:658

llvm::AMDGPU::VOPD::ComponentKind
ComponentKind
Definition: AMDGPUBaseInfo.h:708

llvm::AMDGPU::VOPD::COMPONENT_X
@ COMPONENT_X
Definition: AMDGPUBaseInfo.h:710

llvm::AMDGPU::VOPD::SINGLE
@ SINGLE
Definition: AMDGPUBaseInfo.h:709

llvm::AMDGPU::VOPD::MAX
@ MAX
Definition: AMDGPUBaseInfo.h:712

llvm::AMDGPU::VOPD::COMPONENT_Y
@ COMPONENT_Y
Definition: AMDGPUBaseInfo.h:711

llvm::AMDGPU::VOPD::COMPONENTS
constexpr unsigned COMPONENTS[]
Definition: AMDGPUBaseInfo.h:659

llvm::AMDGPU::VOPD::Component
Component
Definition: AMDGPUBaseInfo.h:643

llvm::AMDGPU::VOPD::MAX_SRC_NUM
@ MAX_SRC_NUM
Definition: AMDGPUBaseInfo.h:650

llvm::AMDGPU::VOPD::MAX_OPR_NUM
@ MAX_OPR_NUM
Definition: AMDGPUBaseInfo.h:651

llvm::AMDGPU::VOPD::DST
@ DST
Definition: AMDGPUBaseInfo.h:644

llvm::AMDGPU::VOPD::SRC2
@ SRC2
Definition: AMDGPUBaseInfo.h:647

llvm::AMDGPU::VOPD::DST_NUM
@ DST_NUM
Definition: AMDGPUBaseInfo.h:649

llvm::AMDGPU::VOPD::SRC1
@ SRC1
Definition: AMDGPUBaseInfo.h:646

llvm::AMDGPU::VOPD::SRC0
@ SRC0
Definition: AMDGPUBaseInfo.h:645

llvm::AMDGPU::isGCN3Encoding
bool isGCN3Encoding(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2226

llvm::AMDGPU::isInlinableLiteralBF16
bool isInlinableLiteralBF16(int16_t Literal, bool HasInv2Pi)
Definition: AMDGPUBaseInfo.cpp:2642

llvm::AMDGPU::isGFX10_BEncoding
bool isGFX10_BEncoding(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2234

llvm::AMDGPU::getMIMGG16MappingInfo
LLVM_READONLY const MIMGG16MappingInfo * getMIMGG16MappingInfo(unsigned G)

llvm::AMDGPU::isGFX10_GFX11
bool isGFX10_GFX11(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2190

llvm::AMDGPU::isInlinableLiteralV216
bool isInlinableLiteralV216(uint32_t Literal, uint8_t OpType)
Definition: AMDGPUBaseInfo.cpp:2774

llvm::AMDGPU::getMIMGInfo
LLVM_READONLY const MIMGInfo * getMIMGInfo(unsigned Opc)

llvm::AMDGPU::getRegOperandSize
unsigned getRegOperandSize(const MCRegisterInfo *MRI, const MCInstrDesc &Desc, unsigned OpNo)
Get size of register operand.
Definition: AMDGPUBaseInfo.cpp:2592

llvm::AMDGPU::decodeWaitcnt
void decodeWaitcnt(const IsaVersion &Version, unsigned Waitcnt, unsigned &Vmcnt, unsigned &Expcnt, unsigned &Lgkmcnt)
Decodes Vmcnt, Expcnt and Lgkmcnt from given Waitcnt for given isa Version, and writes decoded values...
Definition: AMDGPUBaseInfo.cpp:1472

llvm::AMDGPU::isInlinableLiteralFP16
bool isInlinableLiteralFP16(int16_t Literal, bool HasInv2Pi)
Definition: AMDGPUBaseInfo.cpp:2663

llvm::AMDGPU::isSGPR
bool isSGPR(MCRegister Reg, const MCRegisterInfo *TRI)
Is Reg a scalar register?
Definition: AMDGPUBaseInfo.cpp:2281

llvm::AMDGPU::convertSMRDOffsetUnits
uint64_t convertSMRDOffsetUnits(const MCSubtargetInfo &ST, uint64_t ByteOffset)
Convert ByteOffset to dwords if the subtarget uses dword SMRD immediate offsets.
Definition: AMDGPUBaseInfo.cpp:2898

llvm::AMDGPU::getMCReg
MCRegister getMCReg(MCRegister Reg, const MCSubtargetInfo &STI)
If Reg is a pseudo reg, return the correct hardware register given STI otherwise return Reg.
Definition: AMDGPUBaseInfo.cpp:2349

llvm::AMDGPU::getMIMGOffsetMappingInfo
LLVM_READONLY const MIMGOffsetMappingInfo * getMIMGOffsetMappingInfo(unsigned Offset)

llvm::AMDGPU::isVOPCAsmOnly
bool isVOPCAsmOnly(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:526

llvm::AMDGPU::getMIMGOpcode
int getMIMGOpcode(unsigned BaseOpcode, unsigned MIMGEncoding, unsigned VDataDwords, unsigned VAddrDwords)
Definition: AMDGPUBaseInfo.cpp:273

llvm::AMDGPU::getMTBUFHasSrsrc
bool getMTBUFHasSrsrc(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:452

llvm::AMDGPU::getSMRDEncodedLiteralOffset32
std::optional< int64_t > getSMRDEncodedLiteralOffset32(const MCSubtargetInfo &ST, int64_t ByteOffset)
Definition: AMDGPUBaseInfo.cpp:2936

llvm::AMDGPU::isLegalDPALU_DPPControl
LLVM_READNONE bool isLegalDPALU_DPPControl(unsigned DC)
Definition: AMDGPUBaseInfo.h:1549

llvm::AMDGPU::isGFX10Before1030
bool isGFX10Before1030(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2222

llvm::AMDGPU::isSISrcInlinableOperand
bool isSISrcInlinableOperand(const MCInstrDesc &Desc, unsigned OpNo)
Does this operand support only inlinable literals?
Definition: AMDGPUBaseInfo.cpp:2436

llvm::AMDGPU::mapWMMA2AddrTo3AddrOpcode
unsigned mapWMMA2AddrTo3AddrOpcode(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:671

llvm::AMDGPU::shouldEmitConstantsToTextSection
bool shouldEmitConstantsToTextSection(const Triple &TT)
Definition: AMDGPUBaseInfo.cpp:1327

llvm::AMDGPU::isInlinableLiteralV2I16
bool isInlinableLiteralV2I16(uint32_t Literal)
Definition: AMDGPUBaseInfo.cpp:2794

llvm::AMDGPU::isDPMACCInstruction
bool isDPMACCInstruction(unsigned Opc)

llvm::AMDGPU::getMTBUFElements
int getMTBUFElements(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:442

llvm::AMDGPU::isHi16Reg
bool isHi16Reg(MCRegister Reg, const MCRegisterInfo &MRI)
Definition: AMDGPUBaseInfo.cpp:2288

llvm::AMDGPU::getTotalNumVGPRs
int32_t getTotalNumVGPRs(bool has90AInsts, int32_t ArgNumAGPR, int32_t ArgNumVGPR)
Definition: AMDGPUBaseInfo.cpp:2274

llvm::AMDGPU::isGFX10
bool isGFX10(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2186

llvm::AMDGPU::getNamedOperandIdx
LLVM_READONLY int16_t getNamedOperandIdx(uint16_t Opcode, uint16_t NamedIdx)

llvm::AMDGPU::isInlinableLiteralV2BF16
bool isInlinableLiteralV2BF16(uint32_t Literal)
Definition: AMDGPUBaseInfo.cpp:2799

llvm::AMDGPU::getMaxNumUserSGPRs
unsigned getMaxNumUserSGPRs(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2146

llvm::AMDGPU::getFPDstSelType
FPType getFPDstSelType(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:659

llvm::AMDGPU::getNumFlatOffsetBits
unsigned getNumFlatOffsetBits(const MCSubtargetInfo &ST)
For pre-GFX12 FLAT instructions the offset must be positive; MSB is ignored and forced to zero.
Definition: AMDGPUBaseInfo.cpp:2946

llvm::AMDGPU::AMDHSA_COV4
@ AMDHSA_COV4
Definition: AMDGPUBaseInfo.h:56

llvm::AMDGPU::AMDHSA_COV5
@ AMDHSA_COV5
Definition: AMDGPUBaseInfo.h:56

llvm::AMDGPU::AMDHSA_COV6
@ AMDHSA_COV6
Definition: AMDGPUBaseInfo.h:56

llvm::AMDGPU::hasA16
bool hasA16(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2118

llvm::AMDGPU::isLegalSMRDEncodedSignedOffset
bool isLegalSMRDEncodedSignedOffset(const MCSubtargetInfo &ST, int64_t EncodedOffset, bool IsBuffer)
Definition: AMDGPUBaseInfo.cpp:2883

llvm::AMDGPU::isGFX12Plus
bool isGFX12Plus(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2210

llvm::AMDGPU::getNSAMaxSize
unsigned getNSAMaxSize(const MCSubtargetInfo &STI, bool HasSampler)
Definition: AMDGPUBaseInfo.cpp:2135

llvm::AMDGPU::getCanBeVOPD
CanBeVOPD getCanBeVOPD(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:570

llvm::AMDGPU::getIntegerAttribute
int getIntegerAttribute(const Function &F, StringRef Name, int Default)

llvm::AMDGPU::hasPackedD16
bool hasPackedD16(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2126

llvm::AMDGPU::getStorecntBitMask
unsigned getStorecntBitMask(const IsaVersion &Version)
Definition: AMDGPUBaseInfo.cpp:1438

llvm::AMDGPU::getLdsDwGranularity
unsigned getLdsDwGranularity(const MCSubtargetInfo &ST)
Definition: AMDGPUBaseInfo.cpp:3024

llvm::AMDGPU::isGFX940
bool isGFX940(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2250

llvm::AMDGPU::isEntryFunctionCC
bool isEntryFunctionCC(CallingConv::ID CC)
Definition: AMDGPUBaseInfo.cpp:2066

llvm::AMDGPU::isKernel
LLVM_READNONE bool isKernel(CallingConv::ID CC)
Definition: AMDGPUBaseInfo.h:1301

llvm::AMDGPU::isInlinableLiteralV2F16
bool isInlinableLiteralV2F16(uint32_t Literal)
Definition: AMDGPUBaseInfo.cpp:2804

llvm::AMDGPU::isHsaAbi
bool isHsaAbi(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:168

llvm::AMDGPU::isGFX11
bool isGFX11(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2198

llvm::AMDGPU::getSMEMIsBuffer
bool getSMEMIsBuffer(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:502

llvm::AMDGPU::isGFX10_3_GFX11
bool isGFX10_3_GFX11(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2242

llvm::AMDGPU::isInvalidSingleUseProducerInst
LLVM_READONLY bool isInvalidSingleUseProducerInst(unsigned Opc)

llvm::AMDGPU::None
@ None
Definition: AMDGPURegBankLegalizeRules.h:103

llvm::AMDGPU::mfmaScaleF8F6F4FormatToNumRegs
uint8_t mfmaScaleF8F6F4FormatToNumRegs(unsigned EncodingVal)
Definition: AMDGPUBaseInfo.cpp:538

llvm::AMDGPU::isInvalidSingleUseConsumerInst
LLVM_READONLY bool isInvalidSingleUseConsumerInst(unsigned Opc)

llvm::AMDGPU::isGroupSegment
bool isGroupSegment(const GlobalValue *GV)
Definition: AMDGPUBaseInfo.cpp:1313

llvm::AMDGPU::getMIMGMIPMappingInfo
LLVM_READONLY const MIMGMIPMappingInfo * getMIMGMIPMappingInfo(unsigned MIP)

llvm::AMDGPU::getMTBUFHasSoffset
bool getMTBUFHasSoffset(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:457

llvm::AMDGPU::hasXNACK
bool hasXNACK(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2106

llvm::AMDGPU::isValid32BitLiteral
bool isValid32BitLiteral(uint64_t Val, bool IsFP64)
Definition: AMDGPUBaseInfo.cpp:2808

llvm::AMDGPU::getVOPDOpcode
unsigned getVOPDOpcode(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:577

llvm::AMDGPU::isDPALU_DPP
bool isDPALU_DPP(const MCInstrDesc &OpDesc)
Definition: AMDGPUBaseInfo.cpp:3020

llvm::AMDGPU::encodeWaitcnt
unsigned encodeWaitcnt(const IsaVersion &Version, unsigned Vmcnt, unsigned Expcnt, unsigned Lgkmcnt)
Encodes Vmcnt, Expcnt and Lgkmcnt into Waitcnt for given isa Version.
Definition: AMDGPUBaseInfo.cpp:1508

llvm::AMDGPU::isVOPC64DPP
bool isVOPC64DPP(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:522

llvm::AMDGPU::getMUBUFOpcode
int getMUBUFOpcode(unsigned BaseOpc, unsigned Elements)
Definition: AMDGPUBaseInfo.cpp:467

llvm::AMDGPU::isCompute
bool isCompute(CallingConv::ID cc)
Definition: AMDGPUBaseInfo.cpp:2062

llvm::AMDGPU::getMAIIsGFX940XDL
bool getMAIIsGFX940XDL(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:533

llvm::AMDGPU::isSI
bool isSI(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2148

llvm::AMDGPU::getDefaultAMDHSACodeObjectVersion
unsigned getDefaultAMDHSACodeObjectVersion()
Definition: AMDGPUBaseInfo.cpp:181

llvm::AMDGPU::isReadOnlySegment
bool isReadOnlySegment(const GlobalValue *GV)
Definition: AMDGPUBaseInfo.cpp:1321

llvm::AMDGPU::isArgPassedInSGPR
bool isArgPassedInSGPR(const Argument *A)
Definition: AMDGPUBaseInfo.cpp:2815

llvm::AMDGPU::isIntrinsicAlwaysUniform
bool isIntrinsicAlwaysUniform(unsigned IntrID)
Definition: AMDGPUBaseInfo.cpp:2981

llvm::AMDGPU::getMUBUFBaseOpcode
int getMUBUFBaseOpcode(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:462

llvm::AMDGPU::getAMDHSACodeObjectVersion
unsigned getAMDHSACodeObjectVersion(const Module &M)
Definition: AMDGPUBaseInfo.cpp:172

llvm::AMDGPU::decodeLgkmcnt
unsigned decodeLgkmcnt(const IsaVersion &Version, unsigned Waitcnt)
Definition: AMDGPUBaseInfo.cpp:1467

llvm::AMDGPU::getWaitcntBitMask
unsigned getWaitcntBitMask(const IsaVersion &Version)
Definition: AMDGPUBaseInfo.cpp:1442

llvm::AMDGPU::getVOP3IsSingle
bool getVOP3IsSingle(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:517

llvm::AMDGPU::isGFX9
bool isGFX9(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2160

llvm::AMDGPU::getVOP1IsSingle
bool getVOP1IsSingle(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:507

llvm::AMDGPU::getVOPDEncodingFamily
unsigned getVOPDEncodingFamily(const MCSubtargetInfo &ST)
Definition: AMDGPUBaseInfo.cpp:562

llvm::AMDGPU::isGFX10_AEncoding
bool isGFX10_AEncoding(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2230

llvm::AMDGPU::isKImmOperand
bool isKImmOperand(const MCInstrDesc &Desc, unsigned OpNo)
Is this a KImm operand?
Definition: AMDGPUBaseInfo.cpp:2403

llvm::AMDGPU::getHasColorExport
bool getHasColorExport(const Function &F)
Definition: AMDGPUBaseInfo.cpp:2030

llvm::AMDGPU::getMTBUFBaseOpcode
int getMTBUFBaseOpcode(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:432

llvm::AMDGPU::isChainCC
bool isChainCC(CallingConv::ID CC)
Definition: AMDGPUBaseInfo.cpp:2092

llvm::AMDGPU::isGFX90A
bool isGFX90A(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2246

llvm::AMDGPU::getSamplecntBitMask
unsigned getSamplecntBitMask(const IsaVersion &Version)
Definition: AMDGPUBaseInfo.cpp:1414

llvm::AMDGPU::getDefaultQueueImplicitArgPosition
unsigned getDefaultQueueImplicitArgPosition(unsigned CodeObjectVersion)
Definition: AMDGPUBaseInfo.cpp:240

llvm::AMDGPU::hasSRAMECC
bool hasSRAMECC(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2110

llvm::AMDGPU::getHasDepthExport
bool getHasDepthExport(const Function &F)
Definition: AMDGPUBaseInfo.cpp:2037

llvm::AMDGPU::isGFX8_GFX9_GFX10
bool isGFX8_GFX9_GFX10(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2172

llvm::AMDGPU::getMUBUFHasVAddr
bool getMUBUFHasVAddr(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:477

llvm::AMDGPU::getVOPDFull
int getVOPDFull(unsigned OpX, unsigned OpY, unsigned EncodingFamily)
Definition: AMDGPUBaseInfo.cpp:688

llvm::AMDGPU::isTrue16Inst
bool isTrue16Inst(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:654

llvm::AMDGPU::hasAny64BitVGPROperands
bool hasAny64BitVGPROperands(const MCInstrDesc &OpDesc)
Definition: AMDGPUBaseInfo.cpp:3005

llvm::AMDGPU::getVOPDComponents
std::pair< unsigned, unsigned > getVOPDComponents(unsigned VOPDOpcode)
Definition: AMDGPUBaseInfo.cpp:694

llvm::AMDGPU::getMIMGDimInfoByEncoding
LLVM_READONLY const MIMGDimInfo * getMIMGDimInfoByEncoding(uint8_t DimEnc)

llvm::AMDGPU::isInlinableLiteral32
bool isInlinableLiteral32(int32_t Literal, bool HasInv2Pi)
Definition: AMDGPUBaseInfo.cpp:2616

llvm::AMDGPU::isGFX12
bool isGFX12(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2206

llvm::AMDGPU::getInitialPSInputAddr
unsigned getInitialPSInputAddr(const Function &F)
Definition: AMDGPUBaseInfo.cpp:2026

llvm::AMDGPU::encodeExpcnt
unsigned encodeExpcnt(const IsaVersion &Version, unsigned Waitcnt, unsigned Expcnt)
Definition: AMDGPUBaseInfo.cpp:1496

llvm::AMDGPU::isSISrcOperand
bool isSISrcOperand(const MCInstrDesc &Desc, unsigned OpNo)
Is this an AMDGPU specific source operand? These include registers, inline constants,...
Definition: AMDGPUBaseInfo.cpp:2396

llvm::AMDGPU::isLegalSMRDImmOffset
bool isLegalSMRDImmOffset(const MCSubtargetInfo &ST, int64_t ByteOffset)

llvm::AMDGPU::getKmcntBitMask
unsigned getKmcntBitMask(const IsaVersion &Version)
Definition: AMDGPUBaseInfo.cpp:1434

llvm::AMDGPU::getVmcntBitMask
unsigned getVmcntBitMask(const IsaVersion &Version)
Definition: AMDGPUBaseInfo.cpp:1404

llvm::AMDGPU::FPType
FPType
Definition: AMDGPUBaseInfo.h:58

llvm::AMDGPU::FPType::FP4
@ FP4

llvm::AMDGPU::FPType::FP8
@ FP8

llvm::AMDGPU::isNotGFX10Plus
bool isNotGFX10Plus(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2218

llvm::AMDGPU::hasMAIInsts
bool hasMAIInsts(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2258

llvm::AMDGPU::isIntrinsicSourceOfDivergence
bool isIntrinsicSourceOfDivergence(unsigned IntrID)
Definition: AMDGPUBaseInfo.cpp:2977

llvm::AMDGPU::isKernelCC
bool isKernelCC(const Function *Func)
Definition: AMDGPUBaseInfo.cpp:2102

llvm::AMDGPU::isGenericAtomic
bool isGenericAtomic(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:634

llvm::AMDGPU::decodeStorecntDscnt
Waitcnt decodeStorecntDscnt(const IsaVersion &Version, unsigned StorecntDscnt)
Definition: AMDGPUBaseInfo.cpp:1545

llvm::AMDGPU::isGFX8Plus
bool isGFX8Plus(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2176

llvm::AMDGPU::hasNamedOperand
LLVM_READONLY bool hasNamedOperand(uint64_t Opcode, uint64_t NamedIdx)
Definition: AMDGPUBaseInfo.h:400

llvm::AMDGPU::isInlinableIntLiteral
LLVM_READNONE bool isInlinableIntLiteral(int64_t Literal)
Is this literal inlinable, and not one of the values intended for floating point values.
Definition: AMDGPUBaseInfo.h:1458

llvm::AMDGPU::getLgkmcntBitMask
unsigned getLgkmcntBitMask(const IsaVersion &Version)
Definition: AMDGPUBaseInfo.cpp:1426

llvm::AMDGPU::getMUBUFTfe
bool getMUBUFTfe(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:497

llvm::AMDGPU::getMIMGBiasMappingInfo
LLVM_READONLY const MIMGBiasMappingInfo * getMIMGBiasMappingInfo(unsigned Bias)

llvm::AMDGPU::getBvhcntBitMask
unsigned getBvhcntBitMask(const IsaVersion &Version)
Definition: AMDGPUBaseInfo.cpp:1418

llvm::AMDGPU::hasSMRDSignedImmOffset
bool hasSMRDSignedImmOffset(const MCSubtargetInfo &ST)
Definition: AMDGPUBaseInfo.cpp:163

llvm::AMDGPU::getMIMGDimInfoByAsmSuffix
LLVM_READONLY const MIMGDimInfo * getMIMGDimInfoByAsmSuffix(StringRef AsmSuffix)

llvm::AMDGPU::hasMIMG_R128
bool hasMIMG_R128(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2114

llvm::AMDGPU::hasGFX10_3Insts
bool hasGFX10_3Insts(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2238

llvm::AMDGPU::hasG16
bool hasG16(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2122

llvm::AMDGPU::getAddrSizeMIMGOp
unsigned getAddrSizeMIMGOp(const MIMGBaseOpcodeInfo *BaseOpcode, const MIMGDimInfo *Dim, bool IsA16, bool IsG16Supported)
Definition: AMDGPUBaseInfo.cpp:293

llvm::AMDGPU::getMTBUFOpcode
int getMTBUFOpcode(unsigned BaseOpc, unsigned Elements)
Definition: AMDGPUBaseInfo.cpp:437

llvm::AMDGPU::getExpcntBitMask
unsigned getExpcntBitMask(const IsaVersion &Version)
Definition: AMDGPUBaseInfo.cpp:1422

llvm::AMDGPU::hasArchitectedFlatScratch
bool hasArchitectedFlatScratch(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2254

llvm::AMDGPU::getMUBUFHasSoffset
bool getMUBUFHasSoffset(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:487

llvm::AMDGPU::isNotGFX11Plus
bool isNotGFX11Plus(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2214

llvm::AMDGPU::isGFX11Plus
bool isGFX11Plus(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2202

llvm::AMDGPU::getInlineEncodingV2F16
std::optional< unsigned > getInlineEncodingV2F16(uint32_t Literal)
Definition: AMDGPUBaseInfo.cpp:2769

llvm::AMDGPU::isInlineValue
bool isInlineValue(unsigned Reg)
Definition: AMDGPUBaseInfo.cpp:2367

llvm::AMDGPU::isSISrcFPOperand
bool isSISrcFPOperand(const MCInstrDesc &Desc, unsigned OpNo)
Is this a floating-point operand?
Definition: AMDGPUBaseInfo.cpp:2410

llvm::AMDGPU::isShader
bool isShader(CallingConv::ID cc)
Definition: AMDGPUBaseInfo.cpp:2041

llvm::AMDGPU::getHostcallImplicitArgPosition
unsigned getHostcallImplicitArgPosition(unsigned CodeObjectVersion)
Definition: AMDGPUBaseInfo.cpp:229

llvm::AMDGPU::isGFX10Plus
bool isGFX10Plus(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2194

llvm::AMDGPU::getSMRDEncodedOffset
std::optional< int64_t > getSMRDEncodedOffset(const MCSubtargetInfo &ST, int64_t ByteOffset, bool IsBuffer, bool HasSOffset)
Definition: AMDGPUBaseInfo.cpp:2907

llvm::AMDGPU::isGlobalSegment
bool isGlobalSegment(const GlobalValue *GV)
Definition: AMDGPUBaseInfo.cpp:1317

llvm::AMDGPU::OPERAND_KIMM32
@ OPERAND_KIMM32
Operand with 32-bit immediate that uses the constant bus.
Definition: SIDefines.h:234

llvm::AMDGPU::OPERAND_REG_IMM_INT64
@ OPERAND_REG_IMM_INT64
Definition: SIDefines.h:201

llvm::AMDGPU::OPERAND_REG_IMM_V2FP16
@ OPERAND_REG_IMM_V2FP16
Definition: SIDefines.h:211

llvm::AMDGPU::OPERAND_REG_INLINE_C_V2INT32
@ OPERAND_REG_INLINE_C_V2INT32
Definition: SIDefines.h:227

llvm::AMDGPU::OPERAND_REG_INLINE_C_FP64
@ OPERAND_REG_INLINE_C_FP64
Definition: SIDefines.h:223

llvm::AMDGPU::OPERAND_REG_INLINE_C_BF16
@ OPERAND_REG_INLINE_C_BF16
Definition: SIDefines.h:220

llvm::AMDGPU::OPERAND_REG_INLINE_C_V2BF16
@ OPERAND_REG_INLINE_C_V2BF16
Definition: SIDefines.h:225

llvm::AMDGPU::OPERAND_REG_IMM_V2INT16
@ OPERAND_REG_IMM_V2INT16
Definition: SIDefines.h:212

llvm::AMDGPU::OPERAND_REG_IMM_BF16
@ OPERAND_REG_IMM_BF16
Definition: SIDefines.h:205

llvm::AMDGPU::OPERAND_REG_INLINE_AC_V2FP16
@ OPERAND_REG_INLINE_AC_V2FP16
Definition: SIDefines.h:246

llvm::AMDGPU::OPERAND_REG_IMM_INT32
@ OPERAND_REG_IMM_INT32
Operands with register or 32-bit immediate.
Definition: SIDefines.h:200

llvm::AMDGPU::OPERAND_REG_IMM_V2BF16
@ OPERAND_REG_IMM_V2BF16
Definition: SIDefines.h:210

llvm::AMDGPU::OPERAND_REG_IMM_BF16_DEFERRED
@ OPERAND_REG_IMM_BF16_DEFERRED
Definition: SIDefines.h:207

llvm::AMDGPU::OPERAND_REG_IMM_FP16
@ OPERAND_REG_IMM_FP16
Definition: SIDefines.h:206

llvm::AMDGPU::OPERAND_REG_INLINE_C_INT64
@ OPERAND_REG_INLINE_C_INT64
Definition: SIDefines.h:219

llvm::AMDGPU::OPERAND_KIMM16
@ OPERAND_KIMM16
Definition: SIDefines.h:235

llvm::AMDGPU::OPERAND_REG_INLINE_AC_BF16
@ OPERAND_REG_INLINE_AC_BF16
Definition: SIDefines.h:240

llvm::AMDGPU::OPERAND_REG_INLINE_C_INT16
@ OPERAND_REG_INLINE_C_INT16
Operands with register or inline constant.
Definition: SIDefines.h:217

llvm::AMDGPU::OPERAND_REG_INLINE_AC_INT16
@ OPERAND_REG_INLINE_AC_INT16
Operands with an AccVGPR register or inline constant.
Definition: SIDefines.h:238

llvm::AMDGPU::OPERAND_REG_IMM_FP64
@ OPERAND_REG_IMM_FP64
Definition: SIDefines.h:204

llvm::AMDGPU::OPERAND_REG_INLINE_C_V2FP16
@ OPERAND_REG_INLINE_C_V2FP16
Definition: SIDefines.h:226

llvm::AMDGPU::OPERAND_REG_INLINE_AC_V2INT16
@ OPERAND_REG_INLINE_AC_V2INT16
Definition: SIDefines.h:244

llvm::AMDGPU::OPERAND_REG_INLINE_AC_FP16
@ OPERAND_REG_INLINE_AC_FP16
Definition: SIDefines.h:241

llvm::AMDGPU::OPERAND_REG_INLINE_AC_INT32
@ OPERAND_REG_INLINE_AC_INT32
Definition: SIDefines.h:239

llvm::AMDGPU::OPERAND_REG_INLINE_AC_FP32
@ OPERAND_REG_INLINE_AC_FP32
Definition: SIDefines.h:242

llvm::AMDGPU::OPERAND_REG_INLINE_AC_V2BF16
@ OPERAND_REG_INLINE_AC_V2BF16
Definition: SIDefines.h:245

llvm::AMDGPU::OPERAND_REG_IMM_V2INT32
@ OPERAND_REG_IMM_V2INT32
Definition: SIDefines.h:213

llvm::AMDGPU::OPERAND_REG_IMM_FP32
@ OPERAND_REG_IMM_FP32
Definition: SIDefines.h:203

llvm::AMDGPU::OPERAND_REG_INLINE_C_FP32
@ OPERAND_REG_INLINE_C_FP32
Definition: SIDefines.h:222

llvm::AMDGPU::OPERAND_REG_INLINE_C_INT32
@ OPERAND_REG_INLINE_C_INT32
Definition: SIDefines.h:218

llvm::AMDGPU::OPERAND_REG_INLINE_C_V2INT16
@ OPERAND_REG_INLINE_C_V2INT16
Definition: SIDefines.h:224

llvm::AMDGPU::OPERAND_REG_IMM_V2FP32
@ OPERAND_REG_IMM_V2FP32
Definition: SIDefines.h:214

llvm::AMDGPU::OPERAND_REG_INLINE_AC_FP64
@ OPERAND_REG_INLINE_AC_FP64
Definition: SIDefines.h:243

llvm::AMDGPU::OPERAND_REG_INLINE_C_FP16
@ OPERAND_REG_INLINE_C_FP16
Definition: SIDefines.h:221

llvm::AMDGPU::OPERAND_REG_IMM_INT16
@ OPERAND_REG_IMM_INT16
Definition: SIDefines.h:202

llvm::AMDGPU::OPERAND_REG_INLINE_C_V2FP32
@ OPERAND_REG_INLINE_C_V2FP32
Definition: SIDefines.h:228

llvm::AMDGPU::OPERAND_INLINE_SPLIT_BARRIER_INT32
@ OPERAND_INLINE_SPLIT_BARRIER_INT32
Definition: SIDefines.h:231

llvm::AMDGPU::OPERAND_REG_IMM_FP32_DEFERRED
@ OPERAND_REG_IMM_FP32_DEFERRED
Definition: SIDefines.h:209

llvm::AMDGPU::OPERAND_REG_IMM_FP16_DEFERRED
@ OPERAND_REG_IMM_FP16_DEFERRED
Definition: SIDefines.h:208

llvm::AMDGPU::initDefaultAMDKernelCodeT
void initDefaultAMDKernelCodeT(AMDGPUMCKernelCodeT &KernelCode, const MCSubtargetInfo *STI)
Definition: AMDGPUBaseInfo.cpp:1279

llvm::AMDGPU::isNotGFX9Plus
bool isNotGFX9Plus(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2184

llvm::AMDGPU::getMIMGLZMappingInfo
LLVM_READONLY const MIMGLZMappingInfo * getMIMGLZMappingInfo(unsigned L)

llvm::AMDGPU::hasGDS
bool hasGDS(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2131

llvm::AMDGPU::isLegalSMRDEncodedUnsignedOffset
bool isLegalSMRDEncodedUnsignedOffset(const MCSubtargetInfo &ST, int64_t EncodedOffset)
Definition: AMDGPUBaseInfo.cpp:2874

llvm::AMDGPU::isGFX9Plus
bool isGFX9Plus(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2180

llvm::AMDGPU::hasDPPSrc1SGPR
bool hasDPPSrc1SGPR(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2266

llvm::AMDGPU::isVOPD
bool isVOPD(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:582

llvm::AMDGPU::getVOPDInstInfo
VOPD::InstInfo getVOPDInstInfo(const MCInstrDesc &OpX, const MCInstrDesc &OpY)
Definition: AMDGPUBaseInfo.cpp:790

llvm::AMDGPU::encodeVmcnt
unsigned encodeVmcnt(const IsaVersion &Version, unsigned Waitcnt, unsigned Vmcnt)
Definition: AMDGPUBaseInfo.cpp:1487

llvm::AMDGPU::decodeExpcnt
unsigned decodeExpcnt(const IsaVersion &Version, unsigned Waitcnt)
Definition: AMDGPUBaseInfo.cpp:1462

llvm::AMDGPU::isCvt_F32_Fp8_Bf8_e64
bool isCvt_F32_Fp8_Bf8_e64(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:621

llvm::AMDGPU::decodeLoadcntDscnt
Waitcnt decodeLoadcntDscnt(const IsaVersion &Version, unsigned LoadcntDscnt)
Definition: AMDGPUBaseInfo.cpp:1535

llvm::AMDGPU::getInlineEncodingV2I16
std::optional< unsigned > getInlineEncodingV2I16(uint32_t Literal)
Definition: AMDGPUBaseInfo.cpp:2735

llvm::AMDGPU::getRegBitWidth
unsigned getRegBitWidth(const TargetRegisterClass &RC)
Get the size in bits of a register from the register class RC.
Definition: SIRegisterInfo.cpp:3201

llvm::AMDGPU::encodeStorecntDscnt
static unsigned encodeStorecntDscnt(const IsaVersion &Version, unsigned Storecnt, unsigned Dscnt)
Definition: AMDGPUBaseInfo.cpp:1585

llvm::AMDGPU::getMCOpcode
int getMCOpcode(uint16_t Opcode, unsigned Gen)
Definition: AMDGPUBaseInfo.cpp:684

llvm::AMDGPU::getMIMGBaseOpcode
const MIMGBaseOpcodeInfo * getMIMGBaseOpcode(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:280

llvm::AMDGPU::isVI
bool isVI(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2156

llvm::AMDGPU::getMIMGDimInfo
LLVM_READONLY const MIMGDimInfo * getMIMGDimInfo(unsigned DimEnum)

llvm::AMDGPU::getMUBUFIsBufferInv
bool getMUBUFIsBufferInv(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:492

llvm::AMDGPU::mc2PseudoReg
MCRegister mc2PseudoReg(MCRegister Reg)
Convert hardware register Reg to a pseudo register.
Definition: AMDGPUBaseInfo.cpp:2365

llvm::AMDGPU::getInlineEncodingV2BF16
std::optional< unsigned > getInlineEncodingV2BF16(uint32_t Literal)
Definition: AMDGPUBaseInfo.cpp:2741

llvm::AMDGPU::hasKernargPreload
unsigned hasKernargPreload(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2270

llvm::AMDGPU::isMAC
bool isMAC(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:586

llvm::AMDGPU::getOperandSize
LLVM_READNONE unsigned getOperandSize(const MCOperandInfo &OpInfo)
Definition: AMDGPUBaseInfo.h:1398

llvm::AMDGPU::isCI
bool isCI(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2152

llvm::AMDGPU::encodeLgkmcnt
unsigned encodeLgkmcnt(const IsaVersion &Version, unsigned Waitcnt, unsigned Lgkmcnt)
Definition: AMDGPUBaseInfo.cpp:1502

llvm::AMDGPU::getVOP2IsSingle
bool getVOP2IsSingle(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:512

llvm::AMDGPU::getMAIIsDGEMM
bool getMAIIsDGEMM(unsigned Opc)
Returns true if MAI operation is a double precision GEMM.
Definition: AMDGPUBaseInfo.cpp:528

llvm::AMDGPU::getMIMGBaseOpcodeInfo
LLVM_READONLY const MIMGBaseOpcodeInfo * getMIMGBaseOpcodeInfo(unsigned BaseOpcode)

llvm::AMDGPU::getCompletionActionImplicitArgPosition
unsigned getCompletionActionImplicitArgPosition(unsigned CodeObjectVersion)
Definition: AMDGPUBaseInfo.cpp:251

llvm::AMDGPU::getIntegerVecAttribute
SmallVector< unsigned > getIntegerVecAttribute(const Function &F, StringRef Name, unsigned Size, unsigned DefaultVal)
Definition: AMDGPUBaseInfo.cpp:1367

llvm::AMDGPU::getMaskedMIMGOp
int getMaskedMIMGOp(unsigned Opc, unsigned NewChannels)
Definition: AMDGPUBaseInfo.cpp:285

llvm::AMDGPU::isModuleEntryFunctionCC
bool isModuleEntryFunctionCC(CallingConv::ID CC)
Definition: AMDGPUBaseInfo.cpp:2083

llvm::AMDGPU::isNotGFX12Plus
bool isNotGFX12Plus(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2212

llvm::AMDGPU::getMTBUFHasVAddr
bool getMTBUFHasVAddr(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:447

llvm::AMDGPU::decodeVmcnt
unsigned decodeVmcnt(const IsaVersion &Version, unsigned Waitcnt)
Definition: AMDGPUBaseInfo.cpp:1454

llvm::AMDGPU::getELFABIVersion
uint8_t getELFABIVersion(const Triple &T, unsigned CodeObjectVersion)
Definition: AMDGPUBaseInfo.cpp:198

llvm::AMDGPU::getIntegerPairAttribute
std::pair< unsigned, unsigned > getIntegerPairAttribute(const Function &F, StringRef Name, std::pair< unsigned, unsigned > Default, bool OnlyFirstRequired)
Definition: AMDGPUBaseInfo.cpp:1332

llvm::AMDGPU::getLoadcntBitMask
unsigned getLoadcntBitMask(const IsaVersion &Version)
Definition: AMDGPUBaseInfo.cpp:1410

llvm::AMDGPU::isInlinableLiteralI16
bool isInlinableLiteralI16(int32_t Literal, bool HasInv2Pi)
Definition: AMDGPUBaseInfo.cpp:2659

llvm::AMDGPU::hasVOPD
bool hasVOPD(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2262

llvm::AMDGPU::isInlinableLiteral64
bool isInlinableLiteral64(int64_t Literal, bool HasInv2Pi)
Is this literal inlinable.
Definition: AMDGPUBaseInfo.cpp:2599

llvm::AMDGPU::getMFMA_F8F6F4_WithFormatArgs
const MFMA_F8F6F4_Info * getMFMA_F8F6F4_WithFormatArgs(unsigned CBSZ, unsigned BLGP, unsigned F8F8Opcode)
Definition: AMDGPUBaseInfo.cpp:554

llvm::AMDGPU::getMultigridSyncArgImplicitArgPosition
unsigned getMultigridSyncArgImplicitArgPosition(unsigned CodeObjectVersion)
Definition: AMDGPUBaseInfo.cpp:215

llvm::AMDGPU::isGFX9_GFX10_GFX11
bool isGFX9_GFX10_GFX11(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2168

llvm::AMDGPU::isGFX9_GFX10
bool isGFX9_GFX10(const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2164

llvm::AMDGPU::getMUBUFElements
int getMUBUFElements(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:472

llvm::AMDGPU::encodeLoadcntDscnt
static unsigned encodeLoadcntDscnt(const IsaVersion &Version, unsigned Loadcnt, unsigned Dscnt)
Definition: AMDGPUBaseInfo.cpp:1573

llvm::AMDGPU::getGcnBufferFormatInfo
const GcnBufferFormatInfo * getGcnBufferFormatInfo(uint8_t BitsPerComp, uint8_t NumComponents, uint8_t NumFormat, const MCSubtargetInfo &STI)
Definition: AMDGPUBaseInfo.cpp:2985

llvm::AMDGPU::isGraphics
bool isGraphics(CallingConv::ID cc)
Definition: AMDGPUBaseInfo.cpp:2058

llvm::AMDGPU::mapWMMA3AddrTo2AddrOpcode
unsigned mapWMMA3AddrTo2AddrOpcode(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:676

llvm::AMDGPU::isPermlane16
bool isPermlane16(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:610

llvm::AMDGPU::getSOPPWithRelaxation
LLVM_READONLY int getSOPPWithRelaxation(uint16_t Opcode)

llvm::AMDGPU::getMUBUFHasSrsrc
bool getMUBUFHasSrsrc(unsigned Opc)
Definition: AMDGPUBaseInfo.cpp:482

llvm::AMDGPU::getDscntBitMask
unsigned getDscntBitMask(const IsaVersion &Version)
Definition: AMDGPUBaseInfo.cpp:1430

llvm::CallingConv::AMDGPU_KERNEL
@ AMDGPU_KERNEL
Used for AMDGPU code object kernels.
Definition: CallingConv.h:200

llvm::CallingConv::SPIR_KERNEL
@ SPIR_KERNEL
Used for SPIR kernel functions.
Definition: CallingConv.h:144

llvm::CallingConv::ID
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
Definition: CallingConv.h:24

llvm::codeview::PublicSymFlags::Function
@ Function

llvm::logicalview::LVAttributeKind::Argument
@ Argument

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::Offset
@ Offset
Definition: DWP.cpp:480

llvm::IRMemLocation::Other
@ Other
Any other memory.

llvm::ReplacementType::Format
@ Format

llvm::ReplacementType::Literal
@ Literal

llvm::operator<<
raw_ostream & operator<<(raw_ostream &OS, const APFixedPoint &FX)
Definition: APFixedPoint.h:303

llvm::InstructionUniformity::Default
@ Default
The result values are uniform if and only if all operands are uniform.

llvm::Version
@ Version
Definition: PGOCtxProfWriter.h:22

llvm::maxUIntN
uint64_t maxUIntN(uint64_t N)
Gets the maximum value for an N-bit unsigned integer.
Definition: MathExtras.h:220

amd_kernel_code_t
AMD Kernel Code Object (amd_kernel_code_t).
Definition: AMDKernelCodeT.h:526

llvm::AMDGPU::AMDGPUMCKernelCodeT
Definition: AMDKernelCodeTUtils.h:33

llvm::AMDGPU::CanBeVOPD
Definition: AMDGPUBaseInfo.h:588

llvm::AMDGPU::CanBeVOPD::X
bool X
Definition: AMDGPUBaseInfo.h:589

llvm::AMDGPU::CanBeVOPD::Y
bool Y
Definition: AMDGPUBaseInfo.h:590

llvm::AMDGPU::CvtScaleF32_F32F16ToF8F4_Info
Definition: AMDGPUBaseInfo.h:108

llvm::AMDGPU::CvtScaleF32_F32F16ToF8F4_Info::Opcode
unsigned Opcode
Definition: AMDGPUBaseInfo.h:109

llvm::AMDGPU::EncodingField
Definition: AMDGPUBaseInfo.h:365

llvm::AMDGPU::EncodingField::Width
static constexpr unsigned Width
Definition: AMDGPUBaseInfo.h:368

llvm::AMDGPU::EncodingField::EncodingField
constexpr EncodingField(ValueType Value)
Definition: AMDGPUBaseInfo.h:374

llvm::AMDGPU::EncodingField::Offset
static constexpr unsigned Offset
Definition: AMDGPUBaseInfo.h:367

llvm::AMDGPU::EncodingField::Value
ValueType Value
Definition: AMDGPUBaseInfo.h:373

llvm::AMDGPU::EncodingField::Default
static constexpr ValueType Default
Definition: AMDGPUBaseInfo.h:371

llvm::AMDGPU::EncodingField::decode
static ValueType decode(uint64_t Encoded)
Definition: AMDGPUBaseInfo.h:377

llvm::AMDGPU::EncodingField::encode
constexpr uint64_t encode() const
Definition: AMDGPUBaseInfo.h:376

llvm::AMDGPU::EncodingFields
Definition: AMDGPUBaseInfo.h:385

llvm::AMDGPU::EncodingFields::encode
static constexpr uint64_t encode(Fields... Values)
Definition: AMDGPUBaseInfo.h:386

llvm::AMDGPU::EncodingFields::decode
static std::tuple< typename Fields::ValueType... > decode(uint64_t Encoded)
Definition: AMDGPUBaseInfo.h:390

llvm::AMDGPU::GcnBufferFormatInfo
Definition: AMDGPUBaseInfo.h:87

llvm::AMDGPU::GcnBufferFormatInfo::BitsPerComp
unsigned BitsPerComp
Definition: AMDGPUBaseInfo.h:89

llvm::AMDGPU::GcnBufferFormatInfo::Format
unsigned Format
Definition: AMDGPUBaseInfo.h:88

llvm::AMDGPU::GcnBufferFormatInfo::DataFormat
unsigned DataFormat
Definition: AMDGPUBaseInfo.h:92

llvm::AMDGPU::GcnBufferFormatInfo::NumFormat
unsigned NumFormat
Definition: AMDGPUBaseInfo.h:91

llvm::AMDGPU::GcnBufferFormatInfo::NumComponents
unsigned NumComponents
Definition: AMDGPUBaseInfo.h:90

llvm::AMDGPU::Hwreg::HwregSize
Definition: AMDGPUBaseInfo.h:1142

llvm::AMDGPU::Hwreg::HwregSize::encode
constexpr uint64_t encode() const
Definition: AMDGPUBaseInfo.h:1144

llvm::AMDGPU::Hwreg::HwregSize::decode
static ValueType decode(uint64_t Encoded)
Definition: AMDGPUBaseInfo.h:1145

llvm::AMDGPU::MAIInstInfo
Definition: AMDGPUBaseInfo.h:95

llvm::AMDGPU::MAIInstInfo::is_gfx940_xdl
bool is_gfx940_xdl
Definition: AMDGPUBaseInfo.h:98

llvm::AMDGPU::MAIInstInfo::Opcode
uint16_t Opcode
Definition: AMDGPUBaseInfo.h:96

llvm::AMDGPU::MAIInstInfo::is_dgemm
bool is_dgemm
Definition: AMDGPUBaseInfo.h:97

llvm::AMDGPU::MFMA_F8F6F4_Info
Definition: AMDGPUBaseInfo.h:101

llvm::AMDGPU::MFMA_F8F6F4_Info::F8F8Opcode
unsigned F8F8Opcode
Definition: AMDGPUBaseInfo.h:103

llvm::AMDGPU::MFMA_F8F6F4_Info::NumRegsSrcB
uint8_t NumRegsSrcB
Definition: AMDGPUBaseInfo.h:105

llvm::AMDGPU::MFMA_F8F6F4_Info::Opcode
unsigned Opcode
Definition: AMDGPUBaseInfo.h:102

llvm::AMDGPU::MFMA_F8F6F4_Info::NumRegsSrcA
uint8_t NumRegsSrcA
Definition: AMDGPUBaseInfo.h:104

llvm::AMDGPU::MIMGBaseOpcodeInfo
Definition: AMDGPUBaseInfo.h:407

llvm::AMDGPU::MIMGBaseOpcodeInfo::Gather4
bool Gather4
Definition: AMDGPUBaseInfo.h:413

llvm::AMDGPU::MIMGBaseOpcodeInfo::Gradients
bool Gradients
Definition: AMDGPUBaseInfo.h:416

llvm::AMDGPU::MIMGBaseOpcodeInfo::G16
bool G16
Definition: AMDGPUBaseInfo.h:417

llvm::AMDGPU::MIMGBaseOpcodeInfo::AtomicX2
bool AtomicX2
Definition: AMDGPUBaseInfo.h:411

llvm::AMDGPU::MIMGBaseOpcodeInfo::Sampler
bool Sampler
Definition: AMDGPUBaseInfo.h:412

llvm::AMDGPU::MIMGBaseOpcodeInfo::BaseOpcode
MIMGBaseOpcode BaseOpcode
Definition: AMDGPUBaseInfo.h:408

llvm::AMDGPU::MIMGBaseOpcodeInfo::NoReturn
bool NoReturn
Definition: AMDGPUBaseInfo.h:424

llvm::AMDGPU::MIMGBaseOpcodeInfo::HasD16
bool HasD16
Definition: AMDGPUBaseInfo.h:420

llvm::AMDGPU::MIMGBaseOpcodeInfo::LodOrClampOrMip
bool LodOrClampOrMip
Definition: AMDGPUBaseInfo.h:419

llvm::AMDGPU::MIMGBaseOpcodeInfo::Coordinates
bool Coordinates
Definition: AMDGPUBaseInfo.h:418

llvm::AMDGPU::MIMGBaseOpcodeInfo::MSAA
bool MSAA
Definition: AMDGPUBaseInfo.h:421

llvm::AMDGPU::MIMGBaseOpcodeInfo::Store
bool Store
Definition: AMDGPUBaseInfo.h:409

llvm::AMDGPU::MIMGBaseOpcodeInfo::Atomic
bool Atomic
Definition: AMDGPUBaseInfo.h:410

llvm::AMDGPU::MIMGBaseOpcodeInfo::A16
bool A16
Definition: AMDGPUBaseInfo.h:423

llvm::AMDGPU::MIMGBaseOpcodeInfo::BVH
bool BVH
Definition: AMDGPUBaseInfo.h:422

llvm::AMDGPU::MIMGBaseOpcodeInfo::NumExtraArgs
uint8_t NumExtraArgs
Definition: AMDGPUBaseInfo.h:415

llvm::AMDGPU::MIMGBiasMappingInfo
Definition: AMDGPUBaseInfo.h:462

llvm::AMDGPU::MIMGBiasMappingInfo::NoBias
MIMGBaseOpcode NoBias
Definition: AMDGPUBaseInfo.h:464

llvm::AMDGPU::MIMGBiasMappingInfo::Bias
MIMGBaseOpcode Bias
Definition: AMDGPUBaseInfo.h:463

llvm::AMDGPU::MIMGDimInfo
Definition: AMDGPUBaseInfo.h:433

llvm::AMDGPU::MIMGDimInfo::NumCoords
uint8_t NumCoords
Definition: AMDGPUBaseInfo.h:435

llvm::AMDGPU::MIMGDimInfo::MSAA
bool MSAA
Definition: AMDGPUBaseInfo.h:437

llvm::AMDGPU::MIMGDimInfo::AsmSuffix
const char * AsmSuffix
Definition: AMDGPUBaseInfo.h:440

llvm::AMDGPU::MIMGDimInfo::Dim
MIMGDim Dim
Definition: AMDGPUBaseInfo.h:434

llvm::AMDGPU::MIMGDimInfo::NumGradients
uint8_t NumGradients
Definition: AMDGPUBaseInfo.h:436

llvm::AMDGPU::MIMGDimInfo::Encoding
uint8_t Encoding
Definition: AMDGPUBaseInfo.h:439

llvm::AMDGPU::MIMGDimInfo::DA
bool DA
Definition: AMDGPUBaseInfo.h:438

llvm::AMDGPU::MIMGG16MappingInfo
Definition: AMDGPUBaseInfo.h:472

llvm::AMDGPU::MIMGG16MappingInfo::G
MIMGBaseOpcode G
Definition: AMDGPUBaseInfo.h:473

llvm::AMDGPU::MIMGG16MappingInfo::G16
MIMGBaseOpcode G16
Definition: AMDGPUBaseInfo.h:474

llvm::AMDGPU::MIMGInfo
Definition: AMDGPUBaseInfo.h:509

llvm::AMDGPU::MIMGInfo::VDataDwords
uint8_t VDataDwords
Definition: AMDGPUBaseInfo.h:513

llvm::AMDGPU::MIMGInfo::BaseOpcode
uint16_t BaseOpcode
Definition: AMDGPUBaseInfo.h:511

llvm::AMDGPU::MIMGInfo::Opcode
uint16_t Opcode
Definition: AMDGPUBaseInfo.h:510

llvm::AMDGPU::MIMGInfo::VAddrDwords
uint8_t VAddrDwords
Definition: AMDGPUBaseInfo.h:514

llvm::AMDGPU::MIMGInfo::VAddrOperands
uint8_t VAddrOperands
Definition: AMDGPUBaseInfo.h:515

llvm::AMDGPU::MIMGInfo::MIMGEncoding
uint8_t MIMGEncoding
Definition: AMDGPUBaseInfo.h:512

llvm::AMDGPU::MIMGLZMappingInfo
Definition: AMDGPUBaseInfo.h:452

llvm::AMDGPU::MIMGLZMappingInfo::LZ
MIMGBaseOpcode LZ
Definition: AMDGPUBaseInfo.h:454

llvm::AMDGPU::MIMGLZMappingInfo::L
MIMGBaseOpcode L
Definition: AMDGPUBaseInfo.h:453

llvm::AMDGPU::MIMGMIPMappingInfo
Definition: AMDGPUBaseInfo.h:457

llvm::AMDGPU::MIMGMIPMappingInfo::NONMIP
MIMGBaseOpcode NONMIP
Definition: AMDGPUBaseInfo.h:459

llvm::AMDGPU::MIMGMIPMappingInfo::MIP
MIMGBaseOpcode MIP
Definition: AMDGPUBaseInfo.h:458

llvm::AMDGPU::MIMGOffsetMappingInfo
Definition: AMDGPUBaseInfo.h:467

llvm::AMDGPU::MIMGOffsetMappingInfo::Offset
MIMGBaseOpcode Offset
Definition: AMDGPUBaseInfo.h:468

llvm::AMDGPU::MIMGOffsetMappingInfo::NoOffset
MIMGBaseOpcode NoOffset
Definition: AMDGPUBaseInfo.h:469

llvm::AMDGPU::WMMAOpcodeMappingInfo
Definition: AMDGPUBaseInfo.h:480

llvm::AMDGPU::WMMAOpcodeMappingInfo::Opcode3Addr
unsigned Opcode3Addr
Definition: AMDGPUBaseInfo.h:482

llvm::AMDGPU::WMMAOpcodeMappingInfo::Opcode2Addr
unsigned Opcode2Addr
Definition: AMDGPUBaseInfo.h:481

llvm::AMDGPU::Waitcnt
Represents the counter values to wait for in an s_waitcnt instruction.
Definition: AMDGPUBaseInfo.h:967

llvm::AMDGPU::Waitcnt::Waitcnt
Waitcnt()=default

llvm::AMDGPU::Waitcnt::ExpCnt
unsigned ExpCnt
Definition: AMDGPUBaseInfo.h:969

llvm::AMDGPU::Waitcnt::LoadCnt
unsigned LoadCnt
Definition: AMDGPUBaseInfo.h:968

llvm::AMDGPU::Waitcnt::Waitcnt
Waitcnt(unsigned LoadCnt, unsigned ExpCnt, unsigned DsCnt, unsigned StoreCnt, unsigned SampleCnt, unsigned BvhCnt, unsigned KmCnt)
Definition: AMDGPUBaseInfo.h:983

llvm::AMDGPU::Waitcnt::hasWait
bool hasWait() const
Definition: AMDGPUBaseInfo.h:988

llvm::AMDGPU::Waitcnt::BvhCnt
unsigned BvhCnt
Definition: AMDGPUBaseInfo.h:973

llvm::AMDGPU::Waitcnt::StoreCnt
unsigned StoreCnt
Definition: AMDGPUBaseInfo.h:971

llvm::AMDGPU::Waitcnt::SampleCnt
unsigned SampleCnt
Definition: AMDGPUBaseInfo.h:972

llvm::AMDGPU::Waitcnt::KmCnt
unsigned KmCnt
Definition: AMDGPUBaseInfo.h:974

llvm::AMDGPU::Waitcnt::hasWaitExceptStoreCnt
bool hasWaitExceptStoreCnt() const
Definition: AMDGPUBaseInfo.h:990

llvm::AMDGPU::Waitcnt::hasWaitStoreCnt
bool hasWaitStoreCnt() const
Definition: AMDGPUBaseInfo.h:995

llvm::AMDGPU::Waitcnt::Waitcnt
Waitcnt(unsigned VmCnt, unsigned ExpCnt, unsigned LgkmCnt, unsigned VsCnt)
Definition: AMDGPUBaseInfo.h:978

llvm::AMDGPU::Waitcnt::combined
Waitcnt combined(const Waitcnt &Other) const
Definition: AMDGPUBaseInfo.h:997

llvm::AMDGPU::Waitcnt::DsCnt
unsigned DsCnt
Definition: AMDGPUBaseInfo.h:970

llvm::DWARFExpression::Operation::Description
Description of the encoding of one expression Op.
Definition: DWARFExpression.h:66