LLVM 20.0.0git
Macros | Functions | Variables
AMDGPULegalizerInfo.cpp File Reference

This file implements the targeting of the Machinelegalizer class for AMDGPU. More...

#include "AMDGPULegalizerInfo.h"
#include "AMDGPU.h"
#include "AMDGPUGlobalISelUtils.h"
#include "AMDGPUInstrInfo.h"
#include "AMDGPUMemoryUtils.h"
#include "AMDGPUTargetMachine.h"
#include "MCTargetDesc/AMDGPUMCTargetDesc.h"
#include "SIInstrInfo.h"
#include "SIMachineFunctionInfo.h"
#include "SIRegisterInfo.h"
#include "Utils/AMDGPUBaseInfo.h"
#include "llvm/ADT/ScopeExit.h"
#include "llvm/CodeGen/GlobalISel/GenericMachineInstrs.h"
#include "llvm/CodeGen/GlobalISel/LegalizerHelper.h"
#include "llvm/CodeGen/GlobalISel/MIPatternMatch.h"
#include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"
#include "llvm/CodeGen/GlobalISel/Utils.h"
#include "llvm/CodeGen/TargetOpcodes.h"
#include "llvm/IR/DiagnosticInfo.h"
#include "llvm/IR/IntrinsicsAMDGPU.h"
#include "llvm/IR/IntrinsicsR600.h"

Go to the source code of this file.

Macros

#define DEBUG_TYPE   "amdgpu-legalinfo"
 

Functions

static LLT getPow2VectorType (LLT Ty)
 
static LLT getPow2ScalarType (LLT Ty)
 
static LegalityPredicate isSmallOddVector (unsigned TypeIdx)
 
static LegalityPredicate sizeIsMultipleOf32 (unsigned TypeIdx)
 
static LegalityPredicate isWideVec16 (unsigned TypeIdx)
 
static LegalizeMutation oneMoreElement (unsigned TypeIdx)
 
static LegalizeMutation fewerEltsToSize64Vector (unsigned TypeIdx)
 
static LegalizeMutation moreEltsToNext32Bit (unsigned TypeIdx)
 
static LegalizeMutation moreElementsToNextExistingRegClass (unsigned TypeIdx)
 
static LLT getBufferRsrcScalarType (const LLT Ty)
 
static LLT getBufferRsrcRegisterType (const LLT Ty)
 
static LLT getBitcastRegisterType (const LLT Ty)
 
static LegalizeMutation bitcastToRegisterType (unsigned TypeIdx)
 
static LegalizeMutation bitcastToVectorElement32 (unsigned TypeIdx)
 
static LegalityPredicate vectorSmallerThan (unsigned TypeIdx, unsigned Size)
 
static LegalityPredicate vectorWiderThan (unsigned TypeIdx, unsigned Size)
 
static LegalityPredicate numElementsNotEven (unsigned TypeIdx)
 
static bool isRegisterSize (unsigned Size)
 
static bool isRegisterVectorElementType (LLT EltTy)
 
static bool isRegisterVectorType (LLT Ty)
 
static bool isRegisterType (LLT Ty)
 
static LegalityPredicate isRegisterType (unsigned TypeIdx)
 
static LegalityPredicate isIllegalRegisterType (unsigned TypeIdx)
 
static LegalityPredicate elementTypeIsLegal (unsigned TypeIdx)
 
static bool isRegisterClassType (LLT Ty)
 
static LegalityPredicate isRegisterClassType (unsigned TypeIdx)
 
static LegalityPredicate isWideScalarExtLoadTruncStore (unsigned TypeIdx)
 
static unsigned maxSizeForAddrSpace (const GCNSubtarget &ST, unsigned AS, bool IsLoad, bool IsAtomic)
 
static bool isLoadStoreSizeLegal (const GCNSubtarget &ST, const LegalityQuery &Query)
 
static bool hasBufferRsrcWorkaround (const LLT Ty)
 
static bool loadStoreBitcastWorkaround (const LLT Ty)
 
static bool isLoadStoreLegal (const GCNSubtarget &ST, const LegalityQuery &Query)
 
static bool shouldBitcastLoadStoreType (const GCNSubtarget &ST, const LLT Ty, const LLT MemTy)
 Return true if a load or store of the type should be lowered with a bitcast to a different type.
 
static bool shouldWidenLoad (const GCNSubtarget &ST, LLT MemoryTy, uint64_t AlignInBits, unsigned AddrSpace, unsigned Opcode)
 Return true if we should legalize a load by widening an odd sized memory access up to the alignment.
 
static bool shouldWidenLoad (const GCNSubtarget &ST, const LegalityQuery &Query, unsigned Opcode)
 
static LLT castBufferRsrcFromV4I32 (MachineInstr &MI, MachineIRBuilder &B, MachineRegisterInfo &MRI, unsigned Idx)
 Mutates IR (typicaly a load instruction) to use a <4 x s32> as the initial type of the operand idx and then to transform it to a p8 via bitcasts and inttoptr.
 
static Register castBufferRsrcToV4I32 (Register Pointer, MachineIRBuilder &B)
 Cast a buffer resource (an address space 8 pointer) into a 4xi32, which is the form in which the value must be in order to be passed to the low-level representations used for MUBUF/MTBUF intrinsics.
 
static void castBufferRsrcArgToV4I32 (MachineInstr &MI, MachineIRBuilder &B, unsigned Idx)
 
static bool isKnownNonNull (Register Val, MachineRegisterInfo &MRI, const AMDGPUTargetMachine &TM, unsigned AddrSpace)
 Return true if the value is a known valid address, such that a null check is not necessary.
 
static MachineInstrBuilder extractF64Exponent (Register Hi, MachineIRBuilder &B)
 
static LLT widenToNextPowerOf2 (LLT Ty)
 
static bool valueIsKnownNeverF32Denorm (const MachineRegisterInfo &MRI, Register Src)
 Return true if it's known that Src can never be an f32 denormal value.
 
static bool allowApproxFunc (const MachineFunction &MF, unsigned Flags)
 
static bool needsDenormHandlingF32 (const MachineFunction &MF, Register Src, unsigned Flags)
 
static Register getMad (MachineIRBuilder &B, LLT Ty, Register X, Register Y, Register Z, unsigned Flags)
 
static Register stripAnySourceMods (Register OrigSrc, MachineRegisterInfo &MRI)
 
static bool isNot (const MachineRegisterInfo &MRI, const MachineInstr &MI)
 
static MachineInstrverifyCFIntrinsic (MachineInstr &MI, MachineRegisterInfo &MRI, MachineInstr *&Br, MachineBasicBlock *&UncondBrTarget, bool &Negated)
 
static bool replaceWithConstant (MachineIRBuilder &B, MachineInstr &MI, int64_t C)
 
static std::pair< Register, RegisteremitReciprocalU64 (MachineIRBuilder &B, Register Val)
 
static void toggleSPDenormMode (bool Enable, MachineIRBuilder &B, const GCNSubtarget &ST, SIModeRegisterDefaults Mode)
 
static void buildBufferLoad (unsigned Opc, Register LoadDstReg, Register RSrc, Register VIndex, Register VOffset, Register SOffset, unsigned ImmOffset, unsigned Format, unsigned AuxiliaryData, MachineMemOperand *MMO, bool IsTyped, bool HasVIndex, MachineIRBuilder &B)
 
static unsigned getBufferAtomicPseudo (Intrinsic::ID IntrID)
 
static void packImage16bitOpsToDwords (MachineIRBuilder &B, MachineInstr &MI, SmallVectorImpl< Register > &PackedAddrs, unsigned ArgOffset, const AMDGPU::ImageDimIntrinsicInfo *Intr, bool IsA16, bool IsG16)
 Turn a set of s16 typed registers in AddrRegs into a dword sized vector with s16 typed elements.
 
static void convertImageAddrToPacked (MachineIRBuilder &B, MachineInstr &MI, int DimIdx, int NumVAddrs)
 Convert from separate vaddr components to a single vector address register, and replace the remaining operands with $noreg.
 

Variables

static cl::opt< boolEnableNewLegality ("amdgpu-global-isel-new-legality", cl::desc("Use GlobalISel desired legality, rather than try to use" "rules compatible with selection patterns"), cl::init(false), cl::ReallyHidden)
 
static constexpr unsigned MaxRegisterSize = 1024
 
static const LLT S1 = LLT::scalar(1)
 
static const LLT S8 = LLT::scalar(8)
 
static const LLT S16 = LLT::scalar(16)
 
static const LLT S32 = LLT::scalar(32)
 
static const LLT F32 = LLT::float32()
 
static const LLT S64 = LLT::scalar(64)
 
static const LLT F64 = LLT::float64()
 
static const LLT S96 = LLT::scalar(96)
 
static const LLT S128 = LLT::scalar(128)
 
static const LLT S160 = LLT::scalar(160)
 
static const LLT S192 = LLT::scalar(192)
 
static const LLT S224 = LLT::scalar(224)
 
static const LLT S256 = LLT::scalar(256)
 
static const LLT S512 = LLT::scalar(512)
 
static const LLT S1024 = LLT::scalar(1024)
 
static const LLT MaxScalar = LLT::scalar(MaxRegisterSize)
 
static const LLT V2S8 = LLT::fixed_vector(2, 8)
 
static const LLT V2S16 = LLT::fixed_vector(2, 16)
 
static const LLT V4S16 = LLT::fixed_vector(4, 16)
 
static const LLT V6S16 = LLT::fixed_vector(6, 16)
 
static const LLT V8S16 = LLT::fixed_vector(8, 16)
 
static const LLT V10S16 = LLT::fixed_vector(10, 16)
 
static const LLT V12S16 = LLT::fixed_vector(12, 16)
 
static const LLT V16S16 = LLT::fixed_vector(16, 16)
 
static const LLT V2F16 = LLT::fixed_vector(2, LLT::float16())
 
static const LLT V2BF16 = V2F16
 
static const LLT V2S32 = LLT::fixed_vector(2, 32)
 
static const LLT V3S32 = LLT::fixed_vector(3, 32)
 
static const LLT V4S32 = LLT::fixed_vector(4, 32)
 
static const LLT V5S32 = LLT::fixed_vector(5, 32)
 
static const LLT V6S32 = LLT::fixed_vector(6, 32)
 
static const LLT V7S32 = LLT::fixed_vector(7, 32)
 
static const LLT V8S32 = LLT::fixed_vector(8, 32)
 
static const LLT V9S32 = LLT::fixed_vector(9, 32)
 
static const LLT V10S32 = LLT::fixed_vector(10, 32)
 
static const LLT V11S32 = LLT::fixed_vector(11, 32)
 
static const LLT V12S32 = LLT::fixed_vector(12, 32)
 
static const LLT V16S32 = LLT::fixed_vector(16, 32)
 
static const LLT V32S32 = LLT::fixed_vector(32, 32)
 
static const LLT V2S64 = LLT::fixed_vector(2, 64)
 
static const LLT V3S64 = LLT::fixed_vector(3, 64)
 
static const LLT V4S64 = LLT::fixed_vector(4, 64)
 
static const LLT V5S64 = LLT::fixed_vector(5, 64)
 
static const LLT V6S64 = LLT::fixed_vector(6, 64)
 
static const LLT V7S64 = LLT::fixed_vector(7, 64)
 
static const LLT V8S64 = LLT::fixed_vector(8, 64)
 
static const LLT V16S64 = LLT::fixed_vector(16, 64)
 
static const LLT V2S128 = LLT::fixed_vector(2, 128)
 
static const LLT V4S128 = LLT::fixed_vector(4, 128)
 
static std::initializer_list< LLTAllScalarTypes
 
static std::initializer_list< LLTAllS16Vectors
 
static std::initializer_list< LLTAllS32Vectors
 
static std::initializer_list< LLTAllS64Vectors
 
static constexpr unsigned SPDenormModeBitField
 
static constexpr unsigned FPEnvModeBitField
 
static constexpr unsigned FPEnvTrapBitField
 

Detailed Description

This file implements the targeting of the Machinelegalizer class for AMDGPU.

Todo:
This should be generated by TableGen.

Definition in file AMDGPULegalizerInfo.cpp.

Macro Definition Documentation

◆ DEBUG_TYPE

#define DEBUG_TYPE   "amdgpu-legalinfo"

Definition at line 37 of file AMDGPULegalizerInfo.cpp.

Function Documentation

◆ allowApproxFunc()

static bool allowApproxFunc ( const MachineFunction MF,
unsigned  Flags 
)
static

◆ bitcastToRegisterType()

static LegalizeMutation bitcastToRegisterType ( unsigned  TypeIdx)
static

Definition at line 188 of file AMDGPULegalizerInfo.cpp.

References getBitcastRegisterType().

◆ bitcastToVectorElement32()

static LegalizeMutation bitcastToVectorElement32 ( unsigned  TypeIdx)
static

◆ buildBufferLoad()

static void buildBufferLoad ( unsigned  Opc,
Register  LoadDstReg,
Register  RSrc,
Register  VIndex,
Register  VOffset,
Register  SOffset,
unsigned  ImmOffset,
unsigned  Format,
unsigned  AuxiliaryData,
MachineMemOperand MMO,
bool  IsTyped,
bool  HasVIndex,
MachineIRBuilder B 
)
static

Definition at line 5959 of file AMDGPULegalizerInfo.cpp.

References B, and llvm::Format.

Referenced by llvm::AMDGPULegalizerInfo::legalizeBufferLoad().

◆ castBufferRsrcArgToV4I32()

static void castBufferRsrcArgToV4I32 ( MachineInstr MI,
MachineIRBuilder B,
unsigned  Idx 
)
static

◆ castBufferRsrcFromV4I32()

static LLT castBufferRsrcFromV4I32 ( MachineInstr MI,
MachineIRBuilder B,
MachineRegisterInfo MRI,
unsigned  Idx 
)
static

Mutates IR (typicaly a load instruction) to use a <4 x s32> as the initial type of the operand idx and then to transform it to a p8 via bitcasts and inttoptr.

In addition, handle vectors of p8. Returns the new type.

Definition at line 585 of file AMDGPULegalizerInfo.cpp.

References B, getBufferRsrcRegisterType(), getBufferRsrcScalarType(), llvm::MachineOperand::getReg(), hasBufferRsrcWorkaround(), I, Idx, MI, MRI, S32, llvm::LLT::scalar(), and llvm::MachineOperand::setReg().

Referenced by llvm::AMDGPULegalizerInfo::legalizeBufferLoad(), llvm::AMDGPULegalizerInfo::legalizeLoad(), and llvm::AMDGPULegalizerInfo::legalizeSBufferLoad().

◆ castBufferRsrcToV4I32()

static Register castBufferRsrcToV4I32 ( Register  Pointer,
MachineIRBuilder B 
)
static

Cast a buffer resource (an address space 8 pointer) into a 4xi32, which is the form in which the value must be in order to be passed to the low-level representations used for MUBUF/MTBUF intrinsics.

This is a hack, which is needed in order to account for the fact that we can't define a register class for s128 without breaking SelectionDAG.

Definition at line 626 of file AMDGPULegalizerInfo.cpp.

References B, getBufferRsrcRegisterType(), getBufferRsrcScalarType(), I, MRI, llvm::SmallVectorTemplateBase< T, bool >::push_back(), and llvm::LLT::scalar().

Referenced by castBufferRsrcArgToV4I32(), and llvm::AMDGPULegalizerInfo::fixStoreSourceType().

◆ convertImageAddrToPacked()

static void convertImageAddrToPacked ( MachineIRBuilder B,
MachineInstr MI,
int  DimIdx,
int  NumVAddrs 
)
static

Convert from separate vaddr components to a single vector address register, and replace the remaining operands with $noreg.

Definition at line 6359 of file AMDGPULegalizerInfo.cpp.

References assert(), B, llvm::LLT::fixed_vector(), llvm::SrcOp::getReg(), I, MI, llvm::SmallVectorTemplateBase< T, bool >::push_back(), S32, llvm::LLT::scalar(), and llvm::SmallVectorBase< Size_T >::size().

Referenced by llvm::AMDGPULegalizerInfo::legalizeImageIntrinsic().

◆ elementTypeIsLegal()

static LegalityPredicate elementTypeIsLegal ( unsigned  TypeIdx)
static

◆ emitReciprocalU64()

static std::pair< Register, Register > emitReciprocalU64 ( MachineIRBuilder B,
Register  Val 
)
static

◆ extractF64Exponent()

static MachineInstrBuilder extractF64Exponent ( Register  Hi,
MachineIRBuilder B 
)
static

Definition at line 2511 of file AMDGPULegalizerInfo.cpp.

References B, llvm::Hi, S32, and llvm::LLT::scalar().

◆ fewerEltsToSize64Vector()

static LegalizeMutation fewerEltsToSize64Vector ( unsigned  TypeIdx)
static

◆ getBitcastRegisterType()

static LLT getBitcastRegisterType ( const LLT  Ty)
static

◆ getBufferAtomicPseudo()

static unsigned getBufferAtomicPseudo ( Intrinsic::ID  IntrID)
static

◆ getBufferRsrcRegisterType()

static LLT getBufferRsrcRegisterType ( const LLT  Ty)
static

◆ getBufferRsrcScalarType()

static LLT getBufferRsrcScalarType ( const LLT  Ty)
static

◆ getMad()

static Register getMad ( MachineIRBuilder B,
LLT  Ty,
Register  X,
Register  Y,
Register  Z,
unsigned  Flags 
)
static

Definition at line 3354 of file AMDGPULegalizerInfo.cpp.

References B, llvm::FMul, X, and Y.

◆ getPow2ScalarType()

static LLT getPow2ScalarType ( LLT  Ty)
static

◆ getPow2VectorType()

static LLT getPow2VectorType ( LLT  Ty)
static

◆ hasBufferRsrcWorkaround()

static bool hasBufferRsrcWorkaround ( const LLT  Ty)
static

◆ isIllegalRegisterType()

static LegalityPredicate isIllegalRegisterType ( unsigned  TypeIdx)
static

◆ isKnownNonNull()

static bool isKnownNonNull ( Register  Val,
MachineRegisterInfo MRI,
const AMDGPUTargetMachine TM,
unsigned  AddrSpace 
)
static

Return true if the value is a known valid address, such that a null check is not necessary.

Definition at line 2292 of file AMDGPULegalizerInfo.cpp.

References llvm::ConstantInt::getSExtValue(), and MRI.

Referenced by llvm::AMDGPULegalizerInfo::legalizeAddrSpaceCast().

◆ isLoadStoreLegal()

static bool isLoadStoreLegal ( const GCNSubtarget ST,
const LegalityQuery Query 
)
static

◆ isLoadStoreSizeLegal()

static bool isLoadStoreSizeLegal ( const GCNSubtarget ST,
const LegalityQuery Query 
)
static

◆ isNot()

static bool isNot ( const MachineRegisterInfo MRI,
const MachineInstr MI 
)
static

◆ isRegisterClassType() [1/2]

static bool isRegisterClassType ( LLT  Ty)
static

◆ isRegisterClassType() [2/2]

static LegalityPredicate isRegisterClassType ( unsigned  TypeIdx)
static

Definition at line 359 of file AMDGPULegalizerInfo.cpp.

References isRegisterClassType().

◆ isRegisterSize()

static bool isRegisterSize ( unsigned  Size)
static

Definition at line 226 of file AMDGPULegalizerInfo.cpp.

References MaxRegisterSize, and Size.

Referenced by isRegisterType(), and shouldBitcastLoadStoreType().

◆ isRegisterType() [1/2]

static bool isRegisterType ( LLT  Ty)
static

◆ isRegisterType() [2/2]

static LegalityPredicate isRegisterType ( unsigned  TypeIdx)
static

Definition at line 255 of file AMDGPULegalizerInfo.cpp.

References isRegisterType().

◆ isRegisterVectorElementType()

static bool isRegisterVectorElementType ( LLT  EltTy)
static

Definition at line 230 of file AMDGPULegalizerInfo.cpp.

References llvm::LLT::getSizeInBits().

Referenced by shouldBitcastLoadStoreType().

◆ isRegisterVectorType()

static bool isRegisterVectorType ( LLT  Ty)
static

◆ isSmallOddVector()

static LegalityPredicate isSmallOddVector ( unsigned  TypeIdx)
static
Returns
true if this is an odd sized vector which should widen by adding an additional element. This is mostly to handle <3 x s16> -> <4 x s16>. This excludes s1 vectors, which should always be scalarized.

Definition at line 72 of file AMDGPULegalizerInfo.cpp.

References llvm::LLT::getElementType(), llvm::LLT::getNumElements(), llvm::LLT::getSizeInBits(), and llvm::LLT::isVector().

Referenced by llvm::AMDGPULegalizerInfo::AMDGPULegalizerInfo().

◆ isWideScalarExtLoadTruncStore()

static LegalityPredicate isWideScalarExtLoadTruncStore ( unsigned  TypeIdx)
static

Definition at line 367 of file AMDGPULegalizerInfo.cpp.

References llvm::LLT::getSizeInBits(), and llvm::LLT::isVector().

◆ isWideVec16()

static LegalityPredicate isWideVec16 ( unsigned  TypeIdx)
static

◆ loadStoreBitcastWorkaround()

static bool loadStoreBitcastWorkaround ( const LLT  Ty)
static

◆ maxSizeForAddrSpace()

static unsigned maxSizeForAddrSpace ( const GCNSubtarget ST,
unsigned  AS,
bool  IsLoad,
bool  IsAtomic 
)
static

◆ moreElementsToNextExistingRegClass()

static LegalizeMutation moreElementsToNextExistingRegClass ( unsigned  TypeIdx)
static

◆ moreEltsToNext32Bit()

static LegalizeMutation moreEltsToNext32Bit ( unsigned  TypeIdx)
static

◆ needsDenormHandlingF32()

static bool needsDenormHandlingF32 ( const MachineFunction MF,
Register  Src,
unsigned  Flags 
)
static

◆ numElementsNotEven()

static LegalityPredicate numElementsNotEven ( unsigned  TypeIdx)
static

Definition at line 219 of file AMDGPULegalizerInfo.cpp.

References llvm::LLT::getNumElements(), and llvm::LLT::isVector().

◆ oneMoreElement()

static LegalizeMutation oneMoreElement ( unsigned  TypeIdx)
static

◆ packImage16bitOpsToDwords()

static void packImage16bitOpsToDwords ( MachineIRBuilder B,
MachineInstr MI,
SmallVectorImpl< Register > &  PackedAddrs,
unsigned  ArgOffset,
const AMDGPU::ImageDimIntrinsicInfo Intr,
bool  IsA16,
bool  IsG16 
)
static

Turn a set of s16 typed registers in AddrRegs into a dword sized vector with s16 typed elements.

Definition at line 6298 of file AMDGPULegalizerInfo.cpp.

References assert(), B, llvm::LLT::fixed_vector(), llvm::SrcOp::getReg(), I, Intr, MI, llvm::SmallVectorTemplateBase< T, bool >::push_back(), S16, llvm::LLT::scalar(), and V2S16.

Referenced by llvm::AMDGPULegalizerInfo::legalizeImageIntrinsic().

◆ replaceWithConstant()

static bool replaceWithConstant ( MachineIRBuilder B,
MachineInstr MI,
int64_t  C 
)
static

◆ shouldBitcastLoadStoreType()

static bool shouldBitcastLoadStoreType ( const GCNSubtarget ST,
const LLT  Ty,
const LLT  MemTy 
)
static

◆ shouldWidenLoad() [1/2]

static bool shouldWidenLoad ( const GCNSubtarget ST,
const LegalityQuery Query,
unsigned  Opcode 
)
static

◆ shouldWidenLoad() [2/2]

static bool shouldWidenLoad ( const GCNSubtarget ST,
LLT  MemoryTy,
uint64_t  AlignInBits,
unsigned  AddrSpace,
unsigned  Opcode 
)
static

Return true if we should legalize a load by widening an odd sized memory access up to the alignment.

Note this case when the memory access itself changes, not the size of the result register.

Definition at line 538 of file AMDGPULegalizerInfo.cpp.

References llvm::SITargetLowering::allowsMisalignedMemoryAccessesImpl(), llvm::CallingConv::Fast, llvm::LLT::getSizeInBits(), llvm::isPowerOf2_32(), maxSizeForAddrSpace(), llvm::MachineMemOperand::MOLoad, and llvm::NextPowerOf2().

Referenced by llvm::AMDGPULegalizerInfo::legalizeLoad(), and shouldWidenLoad().

◆ sizeIsMultipleOf32()

static LegalityPredicate sizeIsMultipleOf32 ( unsigned  TypeIdx)
static

Definition at line 86 of file AMDGPULegalizerInfo.cpp.

References llvm::LLT::getSizeInBits().

◆ stripAnySourceMods()

static Register stripAnySourceMods ( Register  OrigSrc,
MachineRegisterInfo MRI 
)
static

Definition at line 3784 of file AMDGPULegalizerInfo.cpp.

References llvm::getOpcodeDef(), and MRI.

Referenced by llvm::AMDGPULegalizerInfo::legalizeFFloor().

◆ toggleSPDenormMode()

static void toggleSPDenormMode ( bool  Enable,
MachineIRBuilder B,
const GCNSubtarget ST,
SIModeRegisterDefaults  Mode 
)
static

◆ valueIsKnownNeverF32Denorm()

static bool valueIsKnownNeverF32Denorm ( const MachineRegisterInfo MRI,
Register  Src 
)
static

Return true if it's known that Src can never be an f32 denormal value.

Definition at line 3240 of file AMDGPULegalizerInfo.cpp.

References DefMI, getIntrinsicID(), llvm::MachineInstr::getOpcode(), llvm::MachineInstr::getOperand(), llvm::MachineOperand::getReg(), MRI, and llvm::LLT::scalar().

◆ vectorSmallerThan()

static LegalityPredicate vectorSmallerThan ( unsigned  TypeIdx,
unsigned  Size 
)
static

Definition at line 205 of file AMDGPULegalizerInfo.cpp.

References llvm::LLT::getSizeInBits(), llvm::LLT::isVector(), and Size.

◆ vectorWiderThan()

static LegalityPredicate vectorWiderThan ( unsigned  TypeIdx,
unsigned  Size 
)
static

◆ verifyCFIntrinsic()

static MachineInstr * verifyCFIntrinsic ( MachineInstr MI,
MachineRegisterInfo MRI,
MachineInstr *&  Br,
MachineBasicBlock *&  UncondBrTarget,
bool Negated 
)
static

◆ widenToNextPowerOf2()

static LLT widenToNextPowerOf2 ( LLT  Ty)
static

Variable Documentation

◆ AllS16Vectors

std::initializer_list<LLT> AllS16Vectors
static
Initial value:
{
static const LLT V16S16
static const LLT V2S16
static const LLT V4S16
static const LLT V12S16
static const LLT V4S128
static const LLT V10S16
static const LLT V2S128
static const LLT V6S16
static const LLT V8S16

Definition at line 340 of file AMDGPULegalizerInfo.cpp.

Referenced by isRegisterClassType().

◆ AllS32Vectors

std::initializer_list<LLT> AllS32Vectors
static
Initial value:
= {
static const LLT V4S32
static const LLT V2S32
static const LLT V12S32
static const LLT V8S32
static const LLT V3S32
static const LLT V6S32
static const LLT V7S32
static const LLT V5S32
static const LLT V11S32
static const LLT V32S32
static const LLT V9S32
static const LLT V10S32
static const LLT V16S32

Definition at line 343 of file AMDGPULegalizerInfo.cpp.

Referenced by llvm::AMDGPULegalizerInfo::AMDGPULegalizerInfo(), and isRegisterClassType().

◆ AllS64Vectors

std::initializer_list<LLT> AllS64Vectors
static
Initial value:
static const LLT V3S64
static const LLT V8S64
static const LLT V4S64
static const LLT V16S64
static const LLT V7S64
static const LLT V5S64
static const LLT V6S64
static const LLT V2S64

Definition at line 347 of file AMDGPULegalizerInfo.cpp.

Referenced by llvm::AMDGPULegalizerInfo::AMDGPULegalizerInfo(), and isRegisterClassType().

◆ AllScalarTypes

std::initializer_list<LLT> AllScalarTypes
static
Initial value:
= {
static const LLT S128
static const LLT S64
static const LLT S32
static const LLT S1024
static const LLT S192
static const LLT S512
static const LLT S160
static const LLT S96
static const LLT S256
static const LLT S224

Definition at line 337 of file AMDGPULegalizerInfo.cpp.

Referenced by isRegisterClassType().

◆ EnableNewLegality

cl::opt< bool > EnableNewLegality("amdgpu-global-isel-new-legality", cl::desc("Use GlobalISel desired legality, rather than try to use" "rules compatible with selection patterns"), cl::init(false), cl::ReallyHidden) ( "amdgpu-global-isel-new-legality"  ,
cl::desc("Use GlobalISel desired legality, rather than try to use" "rules compatible with selection patterns")  ,
cl::init(false)  ,
cl::ReallyHidden   
)
static

◆ F32

const LLT F32 = LLT::float32()
static

◆ F64

const LLT F64 = LLT::float64()
static

◆ FPEnvModeBitField

constexpr unsigned FPEnvModeBitField
staticconstexpr

◆ FPEnvTrapBitField

constexpr unsigned FPEnvTrapBitField
staticconstexpr

◆ MaxRegisterSize

constexpr unsigned MaxRegisterSize = 1024
staticconstexpr

Definition at line 53 of file AMDGPULegalizerInfo.cpp.

Referenced by isRegisterSize(), and moreElementsToNextExistingRegClass().

◆ MaxScalar

const LLT MaxScalar = LLT::scalar(MaxRegisterSize)
static

◆ S1

const LLT S1 = LLT::scalar(1)
static

Definition at line 282 of file AMDGPULegalizerInfo.cpp.

Referenced by llvm::AMDGPULegalizerInfo::AMDGPULegalizerInfo(), llvm::HexagonSubtarget::BankConflictMutation::apply(), llvm::AMDGPURegisterBankInfo::applyMappingMAD_64_32(), llvm::BinaryOperator::BinaryOperator(), llvm::AMDGPULegalizerInfo::buildMultiply(), llvm::StringSwitch< T, R >::Cases(), llvm::StringSwitch< T, R >::CasesLower(), llvm::BinaryOperator::Create(), llvm::CmpInst::Create(), llvm::sandboxir::CmpInst::create(), llvm::SelectInst::Create(), CreateAdd(), CreateMul(), CreateNeg(), llvm::CmpInst::CreateWithCopiedFlags(), llvm::sandboxir::CmpInst::createWithCopiedFlags(), llvm::PMDataManager::dumpPassInfo(), llvm::AMDGPURegisterBankInfo::executeInWaterfallLoop(), foldShuffleOfUnaryOps(), llvm::get_stable_name(), llvm::DILocation::getMergedLocation(), gsiRecordCmp(), INITIALIZE_PASS(), llvm::isEqual(), llvm::MipsCCState::isF128SoftLibCall(), llvm::MipsMCExpr::isGpOff(), isMemOPCandidate(), llvm::AMDGPULegalizerInfo::legalizeFceil(), llvm::AMDGPULegalizerInfo::legalizeFDIV32(), llvm::AMDGPULegalizerInfo::legalizeFDIV64(), llvm::AMDGPULegalizerInfo::legalizeFDIVFastIntrin(), llvm::AMDGPULegalizerInfo::legalizeFFloor(), llvm::AMDGPULegalizerInfo::legalizeFSQRTF32(), llvm::AMDGPULegalizerInfo::legalizeFSQRTF64(), llvm::AMDGPULegalizerInfo::legalizeIntrinsicTrunc(), llvm::AMDGPULegalizerInfo::legalizeUnsignedDIV_REM32Impl(), llvm::AMDGPULegalizerInfo::legalizeUnsignedDIV_REM64Impl(), llvm::LegalizerHelper::lowerFPTOSI(), llvm::LegalizerHelper::lowerFPTOUI(), llvm::LegalizerHelper::lowerFPTRUNC_F64_TO_F16(), llvm::LegalizerHelper::lowerSITOFP(), llvm::LegalizerHelper::lowerU64ToF32BitOps(), llvm::LegalizerHelper::lowerU64ToF32WithSITOFP(), matchBinaryPermuteShuffle(), llvm::CombinerHelper::matchCommuteShift(), llvm::ARMTargetLowering::PerformMVETruncCombine(), performVectorExtCombine(), llvm::PPCLegalizerInfo::PPCLegalizerInfo(), runImpl(), llvm::set_difference(), llvm::set_intersect(), llvm::set_intersection(), llvm::set_intersection_impl(), llvm::set_is_subset(), llvm::set_subtract(), llvm::set_union(), simplifyLoopInst(), and llvm::GISelCSEInfo::verify().

◆ S1024

const LLT S1024 = LLT::scalar(1024)
static

Definition at line 296 of file AMDGPULegalizerInfo.cpp.

◆ S128

const LLT S128 = LLT::scalar(128)
static

◆ S16

const LLT S16 = LLT::scalar(16)
static

◆ S160

const LLT S160 = LLT::scalar(160)
static

Definition at line 291 of file AMDGPULegalizerInfo.cpp.

◆ S192

const LLT S192 = LLT::scalar(192)
static

Definition at line 292 of file AMDGPULegalizerInfo.cpp.

◆ S224

const LLT S224 = LLT::scalar(224)
static

Definition at line 293 of file AMDGPULegalizerInfo.cpp.

◆ S256

const LLT S256 = LLT::scalar(256)
static

◆ S32

const LLT S32 = LLT::scalar(32)
static

Definition at line 285 of file AMDGPULegalizerInfo.cpp.

Referenced by llvm::SITargetLowering::allocateSpecialEntryInputVGPRs(), llvm::AMDGPULegalizerInfo::AMDGPULegalizerInfo(), llvm::AMDGPURegisterBankInfo::applyMappingBFE(), llvm::AMDGPURegisterBankInfo::applyMappingImpl(), llvm::AMDGPURegisterBankInfo::applyMappingLoad(), llvm::AMDGPURegisterBankInfo::applyMappingMAD_64_32(), llvm::AMDGPURegisterBankInfo::applyMappingSBufferLoad(), llvm::AMDGPULegalizerInfo::buildAbsGlobalAddress(), llvm::AMDGPULegalizerInfo::buildMultiply(), llvm::AMDGPURegisterBankInfo::buildReadFirstLane(), castBufferRsrcFromV4I32(), convertImageAddrToPacked(), emitReciprocalU64(), extractF64Exponent(), llvm::AMDGPULegalizerInfo::getSegmentAperture(), llvm::AMDGPURegisterBankInfo::handleD16VData(), llvm::AMDGPULegalizerInfo::handleD16VData(), llvm::AMDGPULegalizerInfo::legalizeAddrSpaceCast(), llvm::AMDGPULegalizerInfo::legalizeBufferLoad(), llvm::AMDGPULegalizerInfo::legalizeBufferStore(), llvm::AMDGPULegalizerInfo::legalizeBuildVector(), llvm::AMDGPULegalizerInfo::legalizeBVHIntrinsic(), llvm::AMDGPULegalizerInfo::legalizeCTLZ_ZERO_UNDEF(), llvm::AMDGPULegalizerInfo::legalizeFDIV(), llvm::AMDGPULegalizerInfo::legalizeFDIV16(), llvm::AMDGPULegalizerInfo::legalizeFDIV32(), llvm::AMDGPULegalizerInfo::legalizeFDIV64(), llvm::AMDGPULegalizerInfo::legalizeFDIVFastIntrin(), llvm::AMDGPULegalizerInfo::legalizeFPTOI(), llvm::AMDGPULegalizerInfo::legalizeFSQRTF64(), llvm::AMDGPULegalizerInfo::legalizeGetFPEnv(), llvm::AMDGPULegalizerInfo::legalizeGlobalValue(), llvm::AMDGPULegalizerInfo::legalizeImageIntrinsic(), llvm::AMDGPULegalizerInfo::legalizeIntrinsic(), llvm::AMDGPULegalizerInfo::legalizeIntrinsicTrunc(), llvm::AMDGPULegalizerInfo::legalizeITOFP(), llvm::AMDGPULegalizerInfo::legalizeLaneOp(), llvm::AMDGPULegalizerInfo::legalizeMul(), llvm::AMDGPULegalizerInfo::legalizePointerAsRsrcIntrin(), llvm::AMDGPULegalizerInfo::legalizeSetFPEnv(), llvm::AMDGPULegalizerInfo::legalizeSignedDIV_REM(), llvm::AMDGPULegalizerInfo::legalizeUnsignedDIV_REM(), llvm::AMDGPULegalizerInfo::legalizeUnsignedDIV_REM32Impl(), llvm::AMDGPULegalizerInfo::legalizeUnsignedDIV_REM64Impl(), llvm::AMDGPULegalizerInfo::legalizeWaveID(), llvm::AMDGPULegalizerInfo::loadInputValue(), llvm::LegalizerHelper::lowerFPTOSI(), llvm::LegalizerHelper::lowerFPTOUI(), llvm::LegalizerHelper::lowerFPTRUNC_F64_TO_F16(), llvm::LegalizerHelper::lowerSITOFP(), llvm::LegalizerHelper::lowerU64ToF32BitOps(), llvm::LegalizerHelper::lowerU64ToF32WithSITOFP(), llvm::LegalizerHelper::lowerU64ToF64BitFloatOps(), llvm::AMDGPUCallLowering::passSpecialInputs(), llvm::PPCLegalizerInfo::PPCLegalizerInfo(), reinsertVectorIndexAdd(), llvm::AMDGPURegisterBankInfo::setBufferOffsets(), llvm::AMDGPURegisterBankInfo::splitBufferOffsets(), llvm::AMDGPULegalizerInfo::splitBufferOffsets(), and unpackV2S16ToS32().

◆ S512

const LLT S512 = LLT::scalar(512)
static

Definition at line 295 of file AMDGPULegalizerInfo.cpp.

◆ S64

const LLT S64 = LLT::scalar(64)
static

◆ S8

const LLT S8 = LLT::scalar(8)
static

◆ S96

const LLT S96 = LLT::scalar(96)
static

Definition at line 289 of file AMDGPULegalizerInfo.cpp.

◆ SPDenormModeBitField

constexpr unsigned SPDenormModeBitField
staticconstexpr

◆ V10S16

const LLT V10S16 = LLT::fixed_vector(10, 16)
static

Definition at line 304 of file AMDGPULegalizerInfo.cpp.

◆ V10S32

const LLT V10S32 = LLT::fixed_vector(10, 32)
static

Definition at line 319 of file AMDGPULegalizerInfo.cpp.

◆ V11S32

const LLT V11S32 = LLT::fixed_vector(11, 32)
static

Definition at line 320 of file AMDGPULegalizerInfo.cpp.

◆ V12S16

const LLT V12S16 = LLT::fixed_vector(12, 16)
static

Definition at line 305 of file AMDGPULegalizerInfo.cpp.

◆ V12S32

const LLT V12S32 = LLT::fixed_vector(12, 32)
static

Definition at line 321 of file AMDGPULegalizerInfo.cpp.

◆ V16S16

const LLT V16S16 = LLT::fixed_vector(16, 16)
static

Definition at line 306 of file AMDGPULegalizerInfo.cpp.

◆ V16S32

const LLT V16S32 = LLT::fixed_vector(16, 32)
static

◆ V16S64

const LLT V16S64 = LLT::fixed_vector(16, 64)
static

Definition at line 332 of file AMDGPULegalizerInfo.cpp.

◆ V2BF16

const LLT V2BF16 = V2F16
static

Definition at line 309 of file AMDGPULegalizerInfo.cpp.

◆ V2F16

const LLT V2F16 = LLT::fixed_vector(2, LLT::float16())
static

Definition at line 308 of file AMDGPULegalizerInfo.cpp.

◆ V2S128

const LLT V2S128 = LLT::fixed_vector(2, 128)
static

Definition at line 334 of file AMDGPULegalizerInfo.cpp.

◆ V2S16

const LLT V2S16 = LLT::fixed_vector(2, 16)
static

◆ V2S32

const LLT V2S32 = LLT::fixed_vector(2, 32)
static

◆ V2S64

const LLT V2S64 = LLT::fixed_vector(2, 64)
static

◆ V2S8

const LLT V2S8 = LLT::fixed_vector(2, 8)
static

◆ V32S32

const LLT V32S32 = LLT::fixed_vector(32, 32)
static

◆ V3S32

const LLT V3S32 = LLT::fixed_vector(3, 32)
static

◆ V3S64

const LLT V3S64 = LLT::fixed_vector(3, 64)
static

Definition at line 326 of file AMDGPULegalizerInfo.cpp.

◆ V4S128

const LLT V4S128 = LLT::fixed_vector(4, 128)
static

Definition at line 335 of file AMDGPULegalizerInfo.cpp.

◆ V4S16

const LLT V4S16 = LLT::fixed_vector(4, 16)
static

◆ V4S32

const LLT V4S32 = LLT::fixed_vector(4, 32)
static

Definition at line 313 of file AMDGPULegalizerInfo.cpp.

Referenced by llvm::PPCLegalizerInfo::PPCLegalizerInfo().

◆ V4S64

const LLT V4S64 = LLT::fixed_vector(4, 64)
static

Definition at line 327 of file AMDGPULegalizerInfo.cpp.

◆ V5S32

const LLT V5S32 = LLT::fixed_vector(5, 32)
static

Definition at line 314 of file AMDGPULegalizerInfo.cpp.

◆ V5S64

const LLT V5S64 = LLT::fixed_vector(5, 64)
static

Definition at line 328 of file AMDGPULegalizerInfo.cpp.

◆ V6S16

const LLT V6S16 = LLT::fixed_vector(6, 16)
static

Definition at line 302 of file AMDGPULegalizerInfo.cpp.

◆ V6S32

const LLT V6S32 = LLT::fixed_vector(6, 32)
static

Definition at line 315 of file AMDGPULegalizerInfo.cpp.

◆ V6S64

const LLT V6S64 = LLT::fixed_vector(6, 64)
static

Definition at line 329 of file AMDGPULegalizerInfo.cpp.

◆ V7S32

const LLT V7S32 = LLT::fixed_vector(7, 32)
static

Definition at line 316 of file AMDGPULegalizerInfo.cpp.

◆ V7S64

const LLT V7S64 = LLT::fixed_vector(7, 64)
static

Definition at line 330 of file AMDGPULegalizerInfo.cpp.

◆ V8S16

const LLT V8S16 = LLT::fixed_vector(8, 16)
static

Definition at line 303 of file AMDGPULegalizerInfo.cpp.

Referenced by llvm::PPCLegalizerInfo::PPCLegalizerInfo().

◆ V8S32

const LLT V8S32 = LLT::fixed_vector(8, 32)
static

Definition at line 317 of file AMDGPULegalizerInfo.cpp.

◆ V8S64

const LLT V8S64 = LLT::fixed_vector(8, 64)
static

Definition at line 331 of file AMDGPULegalizerInfo.cpp.

◆ V9S32

const LLT V9S32 = LLT::fixed_vector(9, 32)
static

Definition at line 318 of file AMDGPULegalizerInfo.cpp.