13#ifndef LLVM_LIB_TARGET_AMDGPU_SIMACHINEFUNCTIONINFO_H
14#define LLVM_LIB_TARGET_AMDGPU_SIMACHINEFUNCTIONINFO_H
32class MachineFrameInfo;
34class SIMachineFunctionInfo;
36class TargetRegisterClass;
97 std::optional<unsigned>
Mask;
113 if (
Other.IsRegister)
145 if (
YamlIO.outputting()) {
147 YamlIO.mapRequired(
"reg",
A.RegisterName);
149 YamlIO.mapRequired(
"offset",
A.StackOffset);
151 auto Keys =
YamlIO.keys();
154 YamlIO.mapRequired(
"reg",
A.RegisterName);
156 YamlIO.mapRequired(
"offset",
A.StackOffset);
158 YamlIO.setError(
"missing required key 'reg' or 'offset'");
160 YamlIO.mapOptional(
"mask",
A.Mask);
162 static const bool flow =
true;
204 YamlIO.mapOptional(
"privateSegmentWaveByteOffset",
252 YamlIO.mapOptional(
"dx10-clamp",
Mode.DX10Clamp,
true);
253 YamlIO.mapOptional(
"fp32-input-denormals",
Mode.FP32InputDenormals,
true);
254 YamlIO.mapOptional(
"fp32-output-denormals",
Mode.FP32OutputDenormals,
true);
255 YamlIO.mapOptional(
"fp64-fp16-input-denormals",
Mode.FP64FP16InputDenormals,
true);
256 YamlIO.mapOptional(
"fp64-fp16-output-denormals",
Mode.FP64FP16OutputDenormals,
true);
340 YamlIO.mapOptional(
"highBitsOf32BitAddress",
398 Register ScratchRSrcReg = AMDGPU::PRIVATE_RSRC_REG;
402 Register FrameOffsetReg = AMDGPU::FP_REG;
407 Register StackPtrOffsetReg = AMDGPU::SP_REG;
417 unsigned PSInputAddr = 0;
418 unsigned PSInputEnable = 0;
429 unsigned BytesInStackArgArea = 0;
431 bool ReturnsVoid =
true;
435 std::pair<unsigned, unsigned> FlatWorkGroupSizes = {0, 0};
439 std::pair<unsigned, unsigned> WavesPerEU = {0, 0};
441 const AMDGPUGWSResourcePseudoSourceValue GWSResourcePSV;
444 SmallVector<unsigned> MaxNumWorkGroups = {0, 0, 0};
447 unsigned NumUserSGPRs = 0;
448 unsigned NumSystemSGPRs = 0;
450 bool HasSpilledSGPRs =
false;
451 bool HasSpilledVGPRs =
false;
452 bool HasNonSpillStackObjects =
false;
453 bool IsStackRealigned =
false;
455 unsigned NumSpilledSGPRs = 0;
456 unsigned NumSpilledVGPRs = 0;
460 GCNUserSGPRUsageInfo UserSGPRInfo;
463 bool WorkGroupIDX : 1;
464 bool WorkGroupIDY : 1;
465 bool WorkGroupIDZ : 1;
466 bool WorkGroupInfo : 1;
467 bool LDSKernelId : 1;
468 bool PrivateSegmentWaveByteOffset : 1;
470 bool WorkItemIDX : 1;
471 bool WorkItemIDY : 1;
472 bool WorkItemIDZ : 1;
476 bool ImplicitArgPtr : 1;
478 bool MayNeedAGPRs : 1;
485 unsigned HighBitsOf32BitAddress;
488 IndexedMap<uint8_t, VirtReg2IndexFunctor> VRegFlags;
497 mutable std::optional<bool> UsesAGPRs;
504 void MRI_NoteNewVirtualRegister(
Register Reg)
override;
505 void MRI_NoteCloneVirtualRegister(
Register NewReg,
Register SrcReg)
override;
518 SGPRSpillsToVirtualVGPRLanes;
522 SGPRSpillsToPhysicalVGPRLanes;
523 unsigned NumVirtualVGPRSpillLanes = 0;
524 unsigned NumPhysicalVGPRSpillLanes = 0;
548 using PrologEpilogSGPRSpill =
549 std::pair<Register, PrologEpilogSGPRSaveRestoreInfo>;
569 std::optional<int> ScavengeFI;
578 bool IsPrologEpilog);
582 return VGPRForAGPRCopy;
586 VGPRForAGPRCopy = NewVGPRForAGPRCopy;
619 auto I = SGPRSpillsToVirtualVGPRLanes.
find(FrameIndex);
620 return (
I == SGPRSpillsToVirtualVGPRLanes.
end())
633 return PrologEpilogSGPRSpills;
646 PrologEpilogSGPRSpills.
insert(
648 PrologEpilogSGPRSpills,
Reg,
649 [](
const auto &
LHS,
const auto &
RHS) {
return LHS <
RHS.first; }),
650 std::make_pair(
Reg, SI));
656 const auto *
I =
find_if(PrologEpilogSGPRSpills, [&
Reg](
const auto &Spill) {
657 return Spill.first ==
Reg;
659 return I != PrologEpilogSGPRSpills.
end();
664 const auto *
I =
find_if(PrologEpilogSGPRSpills, [&
Reg](
const auto &Spill) {
665 return Spill.first ==
Reg;
667 if (
I != PrologEpilogSGPRSpills.
end() &&
669 return I->second.getReg();
671 return AMDGPU::NoRegister;
676 for (
const auto &SI : PrologEpilogSGPRSpills) {
684 return find_if(PrologEpilogSGPRSpills,
687 return SI.second.getKind() ==
689 SI.second.getIndex() == FI;
690 }) != PrologEpilogSGPRSpills.
end();
695 const auto *
I =
find_if(PrologEpilogSGPRSpills, [&
Reg](
const auto &Spill) {
696 return Spill.first ==
Reg;
705 auto I = SGPRSpillsToPhysicalVGPRLanes.
find(FrameIndex);
706 return (
I == SGPRSpillsToPhysicalVGPRLanes.
end())
713 if (VRegFlags.inBounds(
Reg))
714 VRegFlags[
Reg] |= Flag;
718 if (
Reg.isPhysical())
721 return VRegFlags.inBounds(
Reg) && VRegFlags[
Reg] & Flag;
747 auto I = VGPRToAGPRSpills.
find(FrameIndex);
748 return (
I == VGPRToAGPRSpills.
end()) ? (
MCPhysReg)AMDGPU::NoRegister
749 :
I->second.Lanes[Lane];
753 auto I = VGPRToAGPRSpills.
find(FrameIndex);
754 if (
I != VGPRToAGPRSpills.
end())
755 I->second.IsDead =
true;
765 bool SpillToPhysVGPRLane =
false,
766 bool IsPrologEpilog =
false);
772 bool ResetSGPRSpillStackIDs);
778 return BytesInStackArgArea;
782 BytesInStackArgArea = Bytes;
797 unsigned AllocSizeDWord,
int KernArgIdx,
811 return ArgInfo.WorkGroupIDX.getRegister();
817 return ArgInfo.WorkGroupIDY.getRegister();
823 return ArgInfo.WorkGroupIDZ.getRegister();
829 return ArgInfo.WorkGroupInfo.getRegister();
848 ArgInfo.PrivateSegmentWaveByteOffset
851 return ArgInfo.PrivateSegmentWaveByteOffset.getRegister();
871 return WorkGroupInfo;
875 return PrivateSegmentWaveByteOffset;
891 return ImplicitArgPtr;
902 std::tuple<const ArgDescriptor *, const TargetRegisterClass *, LLT>
908 const auto *Arg = std::get<0>(
ArgInfo.getPreloadedValue(
Value));
909 return Arg ? Arg->getRegister() :
MCRegister();
919 return HighBitsOf32BitAddress;
927 return NumUserSGPRs + NumSystemSGPRs;
931 return UserSGPRInfo.getNumKernargPreloadSGPRs();
935 return ArgInfo.PrivateSegmentWaveByteOffset.getRegister();
941 return ScratchRSrcReg;
945 assert(
Reg != 0 &&
"Should never be unset");
946 ScratchRSrcReg =
Reg;
950 return FrameOffsetReg;
954 assert(
Reg != 0 &&
"Should never be unset");
955 FrameOffsetReg =
Reg;
959 assert(
Reg != 0 &&
"Should never be unset");
960 StackPtrOffsetReg =
Reg;
970 return StackPtrOffsetReg;
976 return ArgInfo.QueuePtr.getRegister();
980 return ArgInfo.ImplicitBufferPtr.getRegister();
984 return HasSpilledSGPRs;
988 HasSpilledSGPRs = Spill;
992 return HasSpilledVGPRs;
996 HasSpilledVGPRs = Spill;
1000 return HasNonSpillStackObjects;
1004 HasNonSpillStackObjects = StackObject;
1008 return IsStackRealigned;
1012 IsStackRealigned = Realigned;
1016 return NumSpilledSGPRs;
1020 return NumSpilledVGPRs;
1024 NumSpilledSGPRs += num;
1028 NumSpilledVGPRs += num;
1036 return PSInputEnable;
1040 return PSInputAddr & (1 <<
Index);
1044 PSInputAddr |= 1 <<
Index;
1048 PSInputEnable |= 1 <<
Index;
1056 ReturnsVoid =
Value;
1062 return FlatWorkGroupSizes;
1067 return FlatWorkGroupSizes.first;
1072 return FlatWorkGroupSizes.second;
1083 return WavesPerEU.first;
1088 return WavesPerEU.second;
1093 return &GWSResourcePSV;
1103 return (Occupancy < 4) ? Occupancy : 4;
1109 if (Occupancy > Limit)
1114 if (Occupancy < Limit)
1122 return MayNeedAGPRs;
Provides AMDGPU specific target descriptions.
The AMDGPU TargetMachine interface definition for hw codegen targets.
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
AMD GCN specific subclass of TargetSubtarget.
unsigned const TargetRegisterInfo * TRI
Promote Memory to Register
static cl::opt< RegAllocEvictionAdvisorAnalysis::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysis::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysis::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysis::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysis::AdvisorMode::Development, "development", "for training")))
Interface definition for SIInstrInfo.
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file implements a set that has insertion order iteration characteristics.
This file defines the SmallVector class.
void printCustom(raw_ostream &OS) const override
Implement printing for PseudoSourceValue.
static bool classof(const PseudoSourceValue *V)
AMDGPUGWSResourcePseudoSourceValue(const AMDGPUTargetMachine &TM)
bool mayAlias(const MachineFrameInfo *) const override
Return true if the memory pointed to by this PseudoSourceValue can ever alias an LLVM IR Value.
bool isAliased(const MachineFrameInfo *) const override
Test whether the memory pointed to by this PseudoSourceValue may also be pointed to by an LLVM IR Val...
bool isMemoryBound() const
bool needsWaveLimiter() const
bool isConstant(const MachineFrameInfo *) const override
Test whether the memory pointed to by this PseudoSourceValue has a constant value.
AMDGPUPseudoSourceValue(unsigned Kind, const AMDGPUTargetMachine &TM)
bool mayAlias(const MachineFrameInfo *) const override
Return true if the memory pointed to by this PseudoSourceValue can ever alias an LLVM IR Value.
bool isAliased(const MachineFrameInfo *) const override
Test whether the memory pointed to by this PseudoSourceValue may also be pointed to by an LLVM IR Val...
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
void clear()
clear - Removes all bits from the bitvector.
Allocate memory in an ever growing pool, as if by bump-pointer.
iterator find(const_arg_type_t< KeyT > Val)
Lightweight error class with error context and mandatory checking.
Wrapper class representing physical registers. Should be passed by value.
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
PrologEpilogSGPRSaveRestoreInfo(SGPRSaveKind K, Register R)
PrologEpilogSGPRSaveRestoreInfo(SGPRSaveKind K, int I)
SGPRSaveKind getKind() const
Special value supplied for machine level alias analysis.
Wrapper class representing virtual and physical registers.
This class keeps track of the SPI_SP_INPUT_ADDR config register, which tells the hardware which inter...
bool hasNonSpillStackObjects() const
ArrayRef< PrologEpilogSGPRSpill > getPrologEpilogSGPRSpills() const
const WWMSpillsMap & getWWMSpills() const
bool usesAGPRs(const MachineFunction &MF) const
bool isPSInputAllocated(unsigned Index) const
void getAllScratchSGPRCopyDstRegs(SmallVectorImpl< Register > &Regs) const
ArrayRef< MCPhysReg > getAGPRSpillVGPRs() const
void setSGPRForEXECCopy(Register Reg)
bool initializeBaseYamlFields(const yaml::SIMachineFunctionInfo &YamlMFI, const MachineFunction &MF, PerFunctionMIParsingState &PFS, SMDiagnostic &Error, SMRange &SourceRange)
unsigned getOccupancy() const
unsigned getNumPreloadedSGPRs() const
void shiftWwmVGPRsToLowestRange(MachineFunction &MF, SmallVectorImpl< Register > &WWMVGPRs, BitVector &SavedVGPRs)
void setWorkItemIDY(ArgDescriptor Arg)
unsigned getNumSpilledVGPRs() const
bool hasLDSKernelId() const
void increaseOccupancy(const MachineFunction &MF, unsigned Limit)
Register addPrivateSegmentSize(const SIRegisterInfo &TRI)
void setWorkItemIDZ(ArgDescriptor Arg)
std::pair< unsigned, unsigned > getWavesPerEU() const
unsigned getMaxNumWorkGroupsZ() const
MCPhysReg getVGPRToAGPRSpill(int FrameIndex, unsigned Lane) const
unsigned getNumSpilledSGPRs() const
GCNUserSGPRUsageInfo & getUserSGPRInfo()
void allocateWWMSpill(MachineFunction &MF, Register VGPR, uint64_t Size=4, Align Alignment=Align(4))
Register addDispatchPtr(const SIRegisterInfo &TRI)
Register getLongBranchReservedReg() const
bool hasSpilledVGPRs() const
void setFlag(Register Reg, uint8_t Flag)
void setVGPRToAGPRSpillDead(int FrameIndex)
unsigned getMaxFlatWorkGroupSize() const
std::pair< unsigned, unsigned > getFlatWorkGroupSizes() const
Register getStackPtrOffsetReg() const
bool isStackRealigned() const
Register addFlatScratchInit(const SIRegisterInfo &TRI)
Register getScratchRSrcReg() const
Returns the physical register reserved for use as the resource descriptor for scratch accesses.
unsigned getMaxWavesPerEU() const
void setStackPtrOffsetReg(Register Reg)
Register addReservedUserSGPR()
Increment user SGPRs used for padding the argument list only.
ArrayRef< MCPhysReg > getVGPRSpillAGPRs() const
ArrayRef< Register > getSGPRSpillPhysVGPRs() const
int getScavengeFI(MachineFrameInfo &MFI, const SIRegisterInfo &TRI)
Register addQueuePtr(const SIRegisterInfo &TRI)
bool hasWorkGroupIDZ() const
Register getQueuePtrUserSGPR() const
ArrayRef< SIRegisterInfo::SpilledReg > getSGPRSpillToVirtualVGPRLanes(int FrameIndex) const
unsigned getMaxMemoryClusterDWords() const
SIMachineFunctionInfo(const SIMachineFunctionInfo &MFI)=default
SmallVector< unsigned > getMaxNumWorkGroups() const
void clearNonWWMRegAllocMask()
bool hasPrologEpilogSGPRSpillEntry(Register Reg) const
Register getGITPtrLoReg(const MachineFunction &MF) const
bool hasWorkGroupIDY() const
void setVGPRForAGPRCopy(Register NewVGPRForAGPRCopy)
bool allocateVGPRSpillToAGPR(MachineFunction &MF, int FI, bool isAGPRtoVGPR)
Reserve AGPRs or VGPRs to support spilling for FrameIndex FI.
Register addWorkGroupIDY()
void splitWWMSpillRegisters(MachineFunction &MF, SmallVectorImpl< std::pair< Register, int > > &CalleeSavedRegs, SmallVectorImpl< std::pair< Register, int > > &ScratchRegs) const
void setBytesInStackArgArea(unsigned Bytes)
SIModeRegisterDefaults getMode() const
Register getSGPRForEXECCopy() const
void setFrameOffsetReg(Register Reg)
ArrayRef< SIRegisterInfo::SpilledReg > getSGPRSpillToPhysicalVGPRLanes(int FrameIndex) const
Register addPrivateSegmentWaveByteOffset()
std::tuple< const ArgDescriptor *, const TargetRegisterClass *, LLT > getPreloadedValue(AMDGPUFunctionArgInfo::PreloadedValue Value) const
bool hasWorkGroupInfo() const
bool mayUseAGPRs(const Function &F) const
bool isCalleeSavedReg(const MCPhysReg *CSRegs, MCPhysReg Reg) const
bool hasWorkItemIDY() const
unsigned getMinFlatWorkGroupSize() const
Register addLDSKernelId()
Register getVGPRForAGPRCopy() const
const GCNUserSGPRUsageInfo & getUserSGPRInfo() const
bool allocateSGPRSpillToVGPRLane(MachineFunction &MF, int FI, bool SpillToPhysVGPRLane=false, bool IsPrologEpilog=false)
void setPrivateSegmentWaveByteOffset(Register Reg)
unsigned getMinWavesPerEU() const
Register getFrameOffsetReg() const
void setLongBranchReservedReg(Register Reg)
bool hasWorkGroupIDX() const
const AMDGPUFunctionArgInfo & getArgInfo() const
unsigned getMaxNumWorkGroupsX() const
unsigned getBytesInStackArgArea() const
Register addKernargSegmentPtr(const SIRegisterInfo &TRI)
Register addDispatchID(const SIRegisterInfo &TRI)
void setHasSpilledVGPRs(bool Spill=true)
void setIfReturnsVoid(bool Value)
void limitOccupancy(unsigned Limit)
bool removeDeadFrameIndices(MachineFrameInfo &MFI, bool ResetSGPRSpillStackIDs)
If ResetSGPRSpillStackIDs is true, reset the stack ID from sgpr-spill to the default stack.
BitVector getNonWWMRegMask() const
void markPSInputAllocated(unsigned Index)
void setWorkItemIDX(ArgDescriptor Arg)
bool isWWMReg(Register Reg) const
MachineFunctionInfo * clone(BumpPtrAllocator &Allocator, MachineFunction &DestMF, const DenseMap< MachineBasicBlock *, MachineBasicBlock * > &Src2DstMBB) const override
Make a functionally equivalent copy of this MachineFunctionInfo in MF.
bool checkFlag(Register Reg, uint8_t Flag) const
void markPSInputEnabled(unsigned Index)
void addToSpilledVGPRs(unsigned num)
MCRegister getPreloadedReg(AMDGPUFunctionArgInfo::PreloadedValue Value) const
uint32_t get32BitAddressHighBits() const
unsigned getMinAllowedOccupancy() const
void setHasSpilledSGPRs(bool Spill=true)
bool checkIndexInPrologEpilogSGPRSpills(int FI) const
void updateNonWWMRegMask(BitVector &RegMask)
unsigned getNumKernargPreloadedSGPRs() const
Register addPrivateSegmentBuffer(const SIRegisterInfo &TRI)
bool hasWorkItemIDX() const
unsigned getNumUserSGPRs() const
const ReservedRegSet & getWWMReservedRegs() const
Register getImplicitBufferPtrUserSGPR() const
std::optional< int > getOptionalScavengeFI() const
Register addImplicitBufferPtr(const SIRegisterInfo &TRI)
AMDGPUFunctionArgInfo & getArgInfo()
const PrologEpilogSGPRSaveRestoreInfo & getPrologEpilogSGPRSaveRestoreInfo(Register Reg) const
void setHasNonSpillStackObjects(bool StackObject=true)
void setIsStackRealigned(bool Realigned=true)
unsigned getGITPtrHigh() const
void limitOccupancy(const MachineFunction &MF)
bool hasSpilledSGPRs() const
ArrayRef< Register > getSGPRSpillVGPRs() const
unsigned getPSInputAddr() const
SmallVectorImpl< MCRegister > * addPreloadedKernArg(const SIRegisterInfo &TRI, const TargetRegisterClass *RC, unsigned AllocSizeDWord, int KernArgIdx, int PaddingSGPRs)
void addToPrologEpilogSGPRSpills(Register Reg, PrologEpilogSGPRSaveRestoreInfo SI)
Register getScratchSGPRCopyDstReg(Register Reg) const
Register getPrivateSegmentWaveByteOffsetSystemSGPR() const
bool hasImplicitArgPtr() const
Register addWorkGroupIDZ()
bool mayNeedAGPRs() const
Register addWorkGroupInfo()
bool hasWorkItemIDZ() const
unsigned getMaxNumWorkGroupsY() const
unsigned getPSInputEnable() const
void setScratchRSrcReg(Register Reg)
void addToSpilledSGPRs(unsigned num)
const AMDGPUGWSResourcePseudoSourceValue * getGWSPSV(const AMDGPUTargetMachine &TM)
void reserveWWMRegister(Register Reg)
bool hasPrivateSegmentWaveByteOffset() const
Register addWorkGroupIDX()
Instances of this class encapsulate one diagnostic report, allowing printing to a raw_ostream as a ca...
Represents a range in source code.
bool insert(const value_type &X)
Insert a new element into the SetVector.
bool contains(const key_type &key) const
Check if the SetVector contains the given key.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
iterator insert(iterator I, T &&Elt)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StackOffset holds a fixed and a scalable offset in bytes.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
LLVM Value Representation.
This class implements an extremely fast bulk output stream that can only output to a stream.
This is an optimization pass for GlobalISel generic memory operations.
uint16_t MCPhysReg
An unsigned integer type large enough to represent all physical registers, but not necessarily virtua...
auto upper_bound(R &&Range, T &&Value)
Provide wrappers to std::upper_bound which take ranges instead of having to pass begin/end explicitly...
bool is_sorted(R &&Range, Compare C)
Wrapper function around std::is_sorted to check if elements in a range R are sorted with respect to a...
constexpr unsigned DefaultMemoryClusterDWordsLimit
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
This struct is a compact representation of a valid (non-zero power of two) alignment.
static ArgDescriptor createRegister(Register Reg, unsigned Mask=~0u)
Helper struct shared between Function Specialization and SCCP Solver.
@ PreserveSign
The sign of a flushed-to-zero number is preserved in the sign of 0.
MachineFunctionInfo - This class can be derived from and used by targets to hold private target-speci...
SmallVector< MCPhysReg, 32 > Lanes
Function object to check whether the first component of a container supported by std::get (like std::...
Targets should override this in a way that mirrors the implementation of llvm::MachineFunctionInfo.
static void mapping(IO &YamlIO, SIArgumentInfo &AI)
static void mapping(IO &YamlIO, SIArgument &A)
static void mapping(IO &YamlIO, SIMachineFunctionInfo &MFI)
static void mapping(IO &YamlIO, SIMode &Mode)
std::optional< SIArgument > PrivateSegmentWaveByteOffset
std::optional< SIArgument > WorkGroupIDY
std::optional< SIArgument > FlatScratchInit
std::optional< SIArgument > DispatchPtr
std::optional< SIArgument > DispatchID
std::optional< SIArgument > WorkItemIDY
std::optional< SIArgument > WorkGroupIDX
std::optional< SIArgument > ImplicitArgPtr
std::optional< SIArgument > QueuePtr
std::optional< SIArgument > WorkGroupInfo
std::optional< SIArgument > LDSKernelId
std::optional< SIArgument > ImplicitBufferPtr
std::optional< SIArgument > WorkItemIDX
std::optional< SIArgument > KernargSegmentPtr
std::optional< SIArgument > WorkItemIDZ
std::optional< SIArgument > PrivateSegmentSize
std::optional< SIArgument > PrivateSegmentBuffer
std::optional< SIArgument > WorkGroupIDZ
std::optional< unsigned > Mask
SIArgument(const SIArgument &Other)
SIArgument & operator=(const SIArgument &Other)
static SIArgument createArgument(bool IsReg)
unsigned MaxMemoryClusterDWords
StringValue SGPRForEXECCopy
SmallVector< StringValue > WWMReservedRegs
uint32_t HighBitsOf32BitAddress
SIMachineFunctionInfo()=default
StringValue FrameOffsetReg
StringValue LongBranchReservedReg
uint64_t ExplicitKernArgSize
void mappingImpl(yaml::IO &YamlIO) override
~SIMachineFunctionInfo()=default
StringValue VGPRForAGPRCopy
std::optional< SIArgumentInfo > ArgInfo
SmallVector< StringValue, 2 > SpillPhysVGPRS
std::optional< FrameIndex > ScavengeFI
unsigned BytesInStackArgArea
StringValue ScratchRSrcReg
StringValue StackPtrOffsetReg
SIMode(const SIModeRegisterDefaults &Mode)
bool FP64FP16OutputDenormals
bool FP64FP16InputDenormals
A wrapper around std::string which contains a source range that's being set during parsing.