LLVM 20.0.0git
|
#include "Target/AMDGPU/AMDGPUISelLowering.h"
Public Types | |
enum | ImplicitParameter { FIRST_IMPLICIT , PRIVATE_BASE , SHARED_BASE , QUEUE_PTR } |
Public Types inherited from llvm::TargetLowering | |
enum | ConstraintType { C_Register , C_RegisterClass , C_Memory , C_Address , C_Immediate , C_Other , C_Unknown } |
enum | ConstraintWeight { CW_Invalid = -1 , CW_Okay = 0 , CW_Good = 1 , CW_Better = 2 , CW_Best = 3 , CW_SpecificReg = CW_Okay , CW_Register = CW_Good , CW_Memory = CW_Better , CW_Constant = CW_Best , CW_Default = CW_Okay } |
using | AsmOperandInfoVector = std::vector< AsmOperandInfo > |
using | ConstraintPair = std::pair< StringRef, TargetLowering::ConstraintType > |
using | ConstraintGroup = SmallVector< ConstraintPair > |
Public Types inherited from llvm::TargetLoweringBase | |
enum | LegalizeAction : uint8_t { Legal , Promote , Expand , LibCall , Custom } |
This enum indicates whether operations are valid for a target, and if not, what action should be used to make them valid. More... | |
enum | LegalizeTypeAction : uint8_t { TypeLegal , TypePromoteInteger , TypeExpandInteger , TypeSoftenFloat , TypeExpandFloat , TypeScalarizeVector , TypeSplitVector , TypeWidenVector , TypePromoteFloat , TypeSoftPromoteHalf , TypeScalarizeScalableVector } |
This enum indicates whether types are legal for a target, and if not, what action should be used to make them valid. More... | |
enum | BooleanContent { UndefinedBooleanContent , ZeroOrOneBooleanContent , ZeroOrNegativeOneBooleanContent } |
Enum that describes how the target represents true/false values. More... | |
enum | SelectSupportKind { ScalarValSelect , ScalarCondVectorVal , VectorMaskSelect } |
Enum that describes what type of support for selects the target has. More... | |
enum class | AtomicExpansionKind { None , CastToInteger , LLSC , LLOnly , CmpXChg , MaskedIntrinsic , BitTestIntrinsic , CmpArithIntrinsic , Expand , NotAtomic } |
Enum that specifies what an atomic load/AtomicRMWInst is expanded to, if at all. More... | |
enum class | MulExpansionKind { Always , OnlyLegalOrCustom } |
Enum that specifies when a multiplication should be expanded. More... | |
enum class | NegatibleCost { Cheaper = 0 , Neutral = 1 , Expensive = 2 } |
Enum that specifies when a float negation is beneficial. More... | |
enum | AndOrSETCCFoldKind : uint8_t { None = 0 , AddAnd = 1 , NotAnd = 2 , ABS = 4 } |
Enum of different potentially desirable ways to fold (and/or (setcc ...), (setcc ...)). More... | |
enum | ReciprocalEstimate : int { Unspecified = -1 , Disabled = 0 , Enabled = 1 } |
Reciprocal estimate status values used by the functions below. More... | |
enum class | ShiftLegalizationStrategy { ExpandToParts , ExpandThroughStack , LowerToLibcall } |
Return the preferred strategy to legalize this SHIFT instruction, with ExpansionFactor being the recursion depth - how many expansions are needed. More... | |
using | LegalizeKind = std::pair< LegalizeTypeAction, EVT > |
LegalizeKind holds the legalization kind that needs to happen to EVT in order to type-legalize it. | |
using | ArgListTy = std::vector< ArgListEntry > |
Public Member Functions | |
AMDGPUTargetLowering (const TargetMachine &TM, const AMDGPUSubtarget &STI) | |
bool | mayIgnoreSignedZero (SDValue Op) const |
bool | isFAbsFree (EVT VT) const override |
Return true if an fabs operation is free to the point where it is never worthwhile to replace it with a bitwise operation. | |
bool | isFNegFree (EVT VT) const override |
Return true if an fneg operation is free to the point where it is never worthwhile to replace it with a bitwise operation. | |
bool | isTruncateFree (EVT Src, EVT Dest) const override |
bool | isTruncateFree (Type *Src, Type *Dest) const override |
Return true if it's free to truncate a value of type FromTy to type ToTy. | |
bool | isZExtFree (Type *Src, Type *Dest) const override |
Return true if any actual instruction that defines a value of type FromTy implicitly zero-extends the value to ToTy in the result register. | |
bool | isZExtFree (EVT Src, EVT Dest) const override |
SDValue | getNegatedExpression (SDValue Op, SelectionDAG &DAG, bool LegalOperations, bool ForCodeSize, NegatibleCost &Cost, unsigned Depth) const override |
Return the newly negated expression if the cost is not expensive, and set Cost to indicate whether the negation is cheaper or neutral. | |
bool | isNarrowingProfitable (EVT SrcVT, EVT DestVT) const override |
Return true if it's profitable to narrow operations of type SrcVT to DestVT. | |
bool | isDesirableToCommuteWithShift (const SDNode *N, CombineLevel Level) const override |
Return true if it is profitable to move this shift by a constant amount through its operand, adjusting any immediate operands as necessary to preserve semantics. | |
EVT | getTypeForExtReturn (LLVMContext &Context, EVT VT, ISD::NodeType ExtendKind) const override |
Return the type that should be used to zero or sign extend a zeroext/signext integer return value. | |
MVT | getVectorIdxTy (const DataLayout &) const override |
Returns the type to be used for the index operand of: ISD::INSERT_VECTOR_ELT, ISD::EXTRACT_VECTOR_ELT, ISD::INSERT_SUBVECTOR, and ISD::EXTRACT_SUBVECTOR. | |
bool | isSelectSupported (SelectSupportKind) const override |
bool | isFPImmLegal (const APFloat &Imm, EVT VT, bool ForCodeSize) const override |
Returns true if the target can instruction select the specified FP immediate natively. | |
bool | ShouldShrinkFPConstant (EVT VT) const override |
If true, then instruction selection should seek to shrink the FP constant of the specified type to a smaller type in order to save space and / or reduce runtime. | |
bool | shouldReduceLoadWidth (SDNode *Load, ISD::LoadExtType ExtType, EVT ExtVT) const override |
Return true if it is profitable to reduce a load to a smaller type. | |
bool | isLoadBitCastBeneficial (EVT, EVT, const SelectionDAG &DAG, const MachineMemOperand &MMO) const final |
Return true if the following transform is beneficial: fold (conv (load x)) -> (load (conv*)x) On architectures that don't natively support some vector loads efficiently, casting the load to a smaller vector of larger types and loading is more efficient, however, this can be undone by optimizations in dag combiner. | |
bool | storeOfVectorConstantIsCheap (bool IsZero, EVT MemVT, unsigned NumElem, unsigned AS) const override |
Return true if it is expected to be cheaper to do a store of vector constant with the given size and type for the address space than to store the individual scalar element constants. | |
bool | aggressivelyPreferBuildVectorSources (EVT VecVT) const override |
bool | isCheapToSpeculateCttz (Type *Ty) const override |
Return true if it is cheap to speculate a call to intrinsic cttz. | |
bool | isCheapToSpeculateCtlz (Type *Ty) const override |
Return true if it is cheap to speculate a call to intrinsic ctlz. | |
bool | isSDNodeAlwaysUniform (const SDNode *N) const override |
AtomicExpansionKind | shouldCastAtomicLoadInIR (LoadInst *LI) const override |
Returns how the given (atomic) load should be cast by the IR-level AtomicExpand pass. | |
AtomicExpansionKind | shouldCastAtomicStoreInIR (StoreInst *SI) const override |
Returns how the given (atomic) store should be cast by the IR-level AtomicExpand pass. | |
AtomicExpansionKind | shouldCastAtomicRMWIInIR (AtomicRMWInst *) const override |
Returns how the given atomic atomicrmw should be cast by the IR-level AtomicExpand pass. | |
SDValue | LowerReturn (SDValue Chain, CallingConv::ID CallConv, bool isVarArg, const SmallVectorImpl< ISD::OutputArg > &Outs, const SmallVectorImpl< SDValue > &OutVals, const SDLoc &DL, SelectionDAG &DAG) const override |
This hook must be implemented to lower outgoing return values, described by the Outs array, into the specified DAG. | |
SDValue | addTokenForArgument (SDValue Chain, SelectionDAG &DAG, MachineFrameInfo &MFI, int ClobberedFI) const |
SDValue | lowerUnhandledCall (CallLoweringInfo &CLI, SmallVectorImpl< SDValue > &InVals, StringRef Reason) const |
SDValue | LowerCall (CallLoweringInfo &CLI, SmallVectorImpl< SDValue > &InVals) const override |
This hook must be implemented to lower calls into the specified DAG. | |
SDValue | LowerDYNAMIC_STACKALLOC (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerOperation (SDValue Op, SelectionDAG &DAG) const override |
This callback is invoked for operations that are unsupported by the target, which are registered to use 'custom' lowering, and whose defined values are all legal. | |
SDValue | PerformDAGCombine (SDNode *N, DAGCombinerInfo &DCI) const override |
This method will be invoked for all target nodes and for any target-independent nodes that the target has registered to invoke it for. | |
void | ReplaceNodeResults (SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG) const override |
This callback is invoked when a node result type is illegal for the target, and the operation was registered to use 'custom' lowering for that result type. | |
SDValue | combineFMinMaxLegacyImpl (const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, SDValue True, SDValue False, SDValue CC, DAGCombinerInfo &DCI) const |
SDValue | combineFMinMaxLegacy (const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, SDValue True, SDValue False, SDValue CC, DAGCombinerInfo &DCI) const |
Generate Min/Max node. | |
const char * | getTargetNodeName (unsigned Opcode) const override |
This method returns the name of a target specific DAG node. | |
bool | mergeStoresAfterLegalization (EVT) const override |
Allow store merging for the specified type after legalization in addition to before legalization. | |
bool | isFsqrtCheap (SDValue Operand, SelectionDAG &DAG) const override |
Return true if SQRT(X) shouldn't be replaced with X*RSQRT(X). | |
SDValue | getSqrtEstimate (SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps, bool &UseOneConstNR, bool Reciprocal) const override |
Hooks for building estimates in place of slower divisions and square roots. | |
SDValue | getRecipEstimate (SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps) const override |
Return a reciprocal estimate value for the input operand. | |
virtual SDNode * | PostISelFolding (MachineSDNode *N, SelectionDAG &DAG) const =0 |
void | computeKnownBitsForTargetNode (const SDValue Op, KnownBits &Known, const APInt &DemandedElts, const SelectionDAG &DAG, unsigned Depth=0) const override |
Determine which of the bits specified in Mask are known to be either zero or one and return them in the KnownZero and KnownOne bitsets. | |
unsigned | ComputeNumSignBitsForTargetNode (SDValue Op, const APInt &DemandedElts, const SelectionDAG &DAG, unsigned Depth=0) const override |
This method can be implemented by targets that want to expose additional information about sign bits to the DAG Combiner. | |
unsigned | computeNumSignBitsForTargetInstr (GISelKnownBits &Analysis, Register R, const APInt &DemandedElts, const MachineRegisterInfo &MRI, unsigned Depth=0) const override |
This method can be implemented by targets that want to expose additional information about sign bits to GlobalISel combiners. | |
bool | isKnownNeverNaNForTargetNode (SDValue Op, const SelectionDAG &DAG, bool SNaN=false, unsigned Depth=0) const override |
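If SNaN is false, returns true if Op is known to never be any NaN; if SNaN is true, returns true if Op is known to never be a signaling NaN. | |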
bool | isReassocProfitable (MachineRegisterInfo &MRI, Register N0, Register N1) const override |
SDValue | CreateLiveInRegister (SelectionDAG &DAG, const TargetRegisterClass *RC, Register Reg, EVT VT, const SDLoc &SL, bool RawReg=false) const |
Helper function that adds Reg to the LiveIn list of the DAG's MachineFunction. | |
SDValue | CreateLiveInRegister (SelectionDAG &DAG, const TargetRegisterClass *RC, Register Reg, EVT VT) const |
SDValue | CreateLiveInRegisterRaw (SelectionDAG &DAG, const TargetRegisterClass *RC, Register Reg, EVT VT) const |
SDValue | loadStackInputValue (SelectionDAG &DAG, EVT VT, const SDLoc &SL, int64_t Offset) const |
Similar to CreateLiveInRegister, except the value may be loaded from a stack slot rather than passed in a register. | |
SDValue | storeStackInputValue (SelectionDAG &DAG, const SDLoc &SL, SDValue Chain, SDValue ArgVal, int64_t Offset) const |
SDValue | loadInputValue (SelectionDAG &DAG, const TargetRegisterClass *RC, EVT VT, const SDLoc &SL, const ArgDescriptor &Arg) const |
uint32_t | getImplicitParameterOffset (const MachineFunction &MF, const ImplicitParameter Param) const |
Helper function that returns the byte offset of the given type of implicit parameter. | |
uint32_t | getImplicitParameterOffset (const uint64_t ExplicitKernArgSize, const ImplicitParameter Param) const |
MVT | getFenceOperandTy (const DataLayout &DL) const override |
Return the type for operands of fence. | |
bool | shouldSinkOperands (Instruction *I, SmallVectorImpl< Use * > &Ops) const override |
Whether it is profitable to sink the operands of an Instruction I to the basic block of I. | |
Public Member Functions inherited from llvm::TargetLowering | |
TargetLowering (const TargetLowering &)=delete | |
TargetLowering & | operator= (const TargetLowering &)=delete |
TargetLowering (const TargetMachine &TM) | |
NOTE: The TargetMachine owns TLOF. | |
bool | isPositionIndependent () const |
virtual bool | isSDNodeSourceOfDivergence (const SDNode *N, FunctionLoweringInfo *FLI, UniformityInfo *UA) const |
virtual bool | isReassocProfitable (SelectionDAG &DAG, SDValue N0, SDValue N1) const |
virtual bool | isReassocProfitable (MachineRegisterInfo &MRI, Register N0, Register N1) const |
virtual bool | isSDNodeAlwaysUniform (const SDNode *N) const |
virtual bool | getPreIndexedAddressParts (SDNode *, SDValue &, SDValue &, ISD::MemIndexedMode &, SelectionDAG &) const |
Returns true by value, base pointer and offset pointer and addressing mode by reference if the node's address can be legally represented as pre-indexed load / store address. | |
virtual bool | getPostIndexedAddressParts (SDNode *, SDNode *, SDValue &, SDValue &, ISD::MemIndexedMode &, SelectionDAG &) const |
Returns true by value, base pointer and offset pointer and addressing mode by reference if this node can be combined with a load / store to form a post-indexed load / store. | |
virtual bool | isIndexingLegal (MachineInstr &MI, Register Base, Register Offset, bool IsPre, MachineRegisterInfo &MRI) const |
Returns true if the specified base+offset is a legal indexed addressing mode for this target. | |
virtual unsigned | getJumpTableEncoding () const |
Return the entry encoding for a jump table in the current function. | |
virtual MVT | getJumpTableRegTy (const DataLayout &DL) const |
virtual const MCExpr * | LowerCustomJumpTableEntry (const MachineJumpTableInfo *, const MachineBasicBlock *, unsigned, MCContext &) const |
virtual SDValue | getPICJumpTableRelocBase (SDValue Table, SelectionDAG &DAG) const |
Returns relocation base for the given PIC jumptable. | |
virtual const MCExpr * | getPICJumpTableRelocBaseExpr (const MachineFunction *MF, unsigned JTI, MCContext &Ctx) const |
This returns the relocation base for the given PIC jumptable, the same as getPICJumpTableRelocBase, but as an MCExpr. | |
virtual bool | isOffsetFoldingLegal (const GlobalAddressSDNode *GA) const |
Return true if folding a constant offset with the given GlobalAddress is legal. | |
virtual bool | isInlineAsmTargetBranch (const SmallVectorImpl< StringRef > &AsmStrs, unsigned OpNo) const |
On x86, return true if the operand with index OpNo is a CALL or JUMP instruction, which can use either a memory constraint or an address constraint. | |
bool | isInTailCallPosition (SelectionDAG &DAG, SDNode *Node, SDValue &Chain) const |
Check whether a given call node is in tail position within its function. | |
void | softenSetCCOperands (SelectionDAG &DAG, EVT VT, SDValue &NewLHS, SDValue &NewRHS, ISD::CondCode &CCCode, const SDLoc &DL, const SDValue OldLHS, const SDValue OldRHS) const |
Soften the operands of a comparison. | |
void | softenSetCCOperands (SelectionDAG &DAG, EVT VT, SDValue &NewLHS, SDValue &NewRHS, ISD::CondCode &CCCode, const SDLoc &DL, const SDValue OldLHS, const SDValue OldRHS, SDValue &Chain, bool IsSignaling=false) const |
virtual SDValue | visitMaskedLoad (SelectionDAG &DAG, const SDLoc &DL, SDValue Chain, MachineMemOperand *MMO, SDValue &NewLoad, SDValue Ptr, SDValue PassThru, SDValue Mask) const |
virtual SDValue | visitMaskedStore (SelectionDAG &DAG, const SDLoc &DL, SDValue Chain, MachineMemOperand *MMO, SDValue Ptr, SDValue Val, SDValue Mask) const |
std::pair< SDValue, SDValue > | makeLibCall (SelectionDAG &DAG, RTLIB::Libcall LC, EVT RetVT, ArrayRef< SDValue > Ops, MakeLibCallOptions CallOptions, const SDLoc &dl, SDValue Chain=SDValue()) const |
Returns a pair of (return value, chain). | |
bool | parametersInCSRMatch (const MachineRegisterInfo &MRI, const uint32_t *CallerPreservedMask, const SmallVectorImpl< CCValAssign > &ArgLocs, const SmallVectorImpl< SDValue > &OutVals) const |
Check whether parameters to a call that are passed in callee saved registers are the same as from the calling function. | |
virtual bool | findOptimalMemOpLowering (std::vector< EVT > &MemOps, unsigned Limit, const MemOp &Op, unsigned DstAS, unsigned SrcAS, const AttributeList &FuncAttributes) const |
Determines the optimal series of memory ops to replace the memset / memcpy. | |
bool | ShrinkDemandedConstant (SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, TargetLoweringOpt &TLO) const |
Check to see if the specified operand of the specified instruction is a constant integer. | |
bool | ShrinkDemandedConstant (SDValue Op, const APInt &DemandedBits, TargetLoweringOpt &TLO) const |
Helper wrapper around ShrinkDemandedConstant, demanding all elements. | |
virtual bool | targetShrinkDemandedConstant (SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, TargetLoweringOpt &TLO) const |
bool | ShrinkDemandedOp (SDValue Op, unsigned BitWidth, const APInt &DemandedBits, TargetLoweringOpt &TLO) const |
Convert x+y to (VT)((SmallVT)x+(SmallVT)y) if the casts are free. | |
bool | SimplifyDemandedBits (SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, KnownBits &Known, TargetLoweringOpt &TLO, unsigned Depth=0, bool AssumeSingleUse=false) const |
Look at Op. | |
bool | SimplifyDemandedBits (SDValue Op, const APInt &DemandedBits, KnownBits &Known, TargetLoweringOpt &TLO, unsigned Depth=0, bool AssumeSingleUse=false) const |
Helper wrapper around SimplifyDemandedBits, demanding all elements. | |
bool | SimplifyDemandedBits (SDValue Op, const APInt &DemandedBits, DAGCombinerInfo &DCI) const |
Helper wrapper around SimplifyDemandedBits. | |
bool | SimplifyDemandedBits (SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, DAGCombinerInfo &DCI) const |
Helper wrapper around SimplifyDemandedBits. | |
SDValue | SimplifyMultipleUseDemandedBits (SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, SelectionDAG &DAG, unsigned Depth=0) const |
More limited version of SimplifyDemandedBits that can be used to "look through" ops that don't contribute to the DemandedBits/DemandedElts - bitwise ops etc. | |
SDValue | SimplifyMultipleUseDemandedBits (SDValue Op, const APInt &DemandedBits, SelectionDAG &DAG, unsigned Depth=0) const |
Helper wrapper around SimplifyMultipleUseDemandedBits, demanding all elements. | |
SDValue | SimplifyMultipleUseDemandedVectorElts (SDValue Op, const APInt &DemandedElts, SelectionDAG &DAG, unsigned Depth=0) const |
Helper wrapper around SimplifyMultipleUseDemandedBits, demanding all bits from only some vector elements. | |
bool | SimplifyDemandedVectorElts (SDValue Op, const APInt &DemandedEltMask, APInt &KnownUndef, APInt &KnownZero, TargetLoweringOpt &TLO, unsigned Depth=0, bool AssumeSingleUse=false) const |
Look at Vector Op. | |
bool | SimplifyDemandedVectorElts (SDValue Op, const APInt &DemandedElts, DAGCombinerInfo &DCI) const |
Helper wrapper around SimplifyDemandedVectorElts. | |
virtual bool | shouldSimplifyDemandedVectorElts (SDValue Op, const TargetLoweringOpt &TLO) const |
Return true if the target supports simplifying demanded vector elements by converting them to undefs. | |
virtual void | computeKnownBitsForTargetNode (const SDValue Op, KnownBits &Known, const APInt &DemandedElts, const SelectionDAG &DAG, unsigned Depth=0) const |
Determine which of the bits specified in Mask are known to be either zero or one and return them in the KnownZero/KnownOne bitsets. | |
virtual void | computeKnownBitsForTargetInstr (GISelKnownBits &Analysis, Register R, KnownBits &Known, const APInt &DemandedElts, const MachineRegisterInfo &MRI, unsigned Depth=0) const |
Determine which of the bits specified in Mask are known to be either zero or one and return them in the KnownZero/KnownOne bitsets. | |
virtual Align | computeKnownAlignForTargetInstr (GISelKnownBits &Analysis, Register R, const MachineRegisterInfo &MRI, unsigned Depth=0) const |
Determine the known alignment for the pointer value R . | |
virtual void | computeKnownBitsForFrameIndex (int FIOp, KnownBits &Known, const MachineFunction &MF) const |
Determine which of the bits of FrameIndex FIOp are known to be 0. | |
virtual unsigned | ComputeNumSignBitsForTargetNode (SDValue Op, const APInt &DemandedElts, const SelectionDAG &DAG, unsigned Depth=0) const |
This method can be implemented by targets that want to expose additional information about sign bits to the DAG Combiner. | |
virtual unsigned | computeNumSignBitsForTargetInstr (GISelKnownBits &Analysis, Register R, const APInt &DemandedElts, const MachineRegisterInfo &MRI, unsigned Depth=0) const |
This method can be implemented by targets that want to expose additional information about sign bits to GlobalISel combiners. | |
virtual bool | SimplifyDemandedVectorEltsForTargetNode (SDValue Op, const APInt &DemandedElts, APInt &KnownUndef, APInt &KnownZero, TargetLoweringOpt &TLO, unsigned Depth=0) const |
Attempt to simplify any target nodes based on the demanded vector elements, returning true on success. | |
virtual bool | SimplifyDemandedBitsForTargetNode (SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, KnownBits &Known, TargetLoweringOpt &TLO, unsigned Depth=0) const |
Attempt to simplify any target nodes based on the demanded bits/elts, returning true on success. | |
virtual SDValue | SimplifyMultipleUseDemandedBitsForTargetNode (SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, SelectionDAG &DAG, unsigned Depth) const |
More limited version of SimplifyDemandedBits that can be used to "look through" ops that don't contribute to the DemandedBits/DemandedElts - bitwise ops etc. | |
virtual bool | isGuaranteedNotToBeUndefOrPoisonForTargetNode (SDValue Op, const APInt &DemandedElts, const SelectionDAG &DAG, bool PoisonOnly, unsigned Depth) const |
Return true if this function can prove that Op is never poison and, if PoisonOnly is false, does not have undef bits. | |
virtual bool | canCreateUndefOrPoisonForTargetNode (SDValue Op, const APInt &DemandedElts, const SelectionDAG &DAG, bool PoisonOnly, bool ConsiderFlags, unsigned Depth) const |
Return true if Op can create undef or poison from non-undef & non-poison operands. | |
SDValue | buildLegalVectorShuffle (EVT VT, const SDLoc &DL, SDValue N0, SDValue N1, MutableArrayRef< int > Mask, SelectionDAG &DAG) const |
Tries to build a legal vector shuffle using the provided parameters or equivalent variations. | |
virtual const Constant * | getTargetConstantFromLoad (LoadSDNode *LD) const |
This method returns the constant pool value that will be loaded by LD. | |
virtual bool | isKnownNeverNaNForTargetNode (SDValue Op, const SelectionDAG &DAG, bool SNaN=false, unsigned Depth=0) const |
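If SNaN is false, returns true if Op is known to never be any NaN; if SNaN is true, returns true if Op is known to never be a signaling NaN. | |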
virtual bool | isSplatValueForTargetNode (SDValue Op, const APInt &DemandedElts, APInt &UndefElts, const SelectionDAG &DAG, unsigned Depth=0) const |
Return true if vector Op has the same value across all DemandedElts , indicating any elements which may be undef in the output UndefElts . | |
virtual bool | isTargetCanonicalConstantNode (SDValue Op) const |
Returns true if the given Opc is considered a canonical constant for the target, which should not be transformed back into a BUILD_VECTOR. | |
bool | isConstTrueVal (SDValue N) const |
Return if the N is a constant or constant vector equal to the true value from getBooleanContents(). | |
bool | isConstFalseVal (SDValue N) const |
Return if the N is a constant or constant vector equal to the false value from getBooleanContents(). | |
bool | isExtendedTrueVal (const ConstantSDNode *N, EVT VT, bool SExt) const |
Return if N is a True value when extended to VT . | |
SDValue | SimplifySetCC (EVT VT, SDValue N0, SDValue N1, ISD::CondCode Cond, bool foldBooleans, DAGCombinerInfo &DCI, const SDLoc &dl) const |
Try to simplify a setcc built with the specified operands and cc. | |
virtual SDValue | unwrapAddress (SDValue N) const |
virtual bool | isGAPlusOffset (SDNode *N, const GlobalValue *&GA, int64_t &Offset) const |
Returns true (and the GlobalValue and the offset) if the node is a GlobalAddress + offset. | |
virtual SDValue | PerformDAGCombine (SDNode *N, DAGCombinerInfo &DCI) const |
This method will be invoked for all target nodes and for any target-independent nodes that the target has registered to invoke it for. | |
virtual bool | isDesirableToCommuteWithShift (const SDNode *N, CombineLevel Level) const |
Return true if it is profitable to move this shift by a constant amount through its operand, adjusting any immediate operands as necessary to preserve semantics. | |
virtual bool | isDesirableToCommuteWithShift (const MachineInstr &MI, bool IsAfterLegal) const |
GlobalISel - return true if it is profitable to move this shift by a constant amount through its operand, adjusting any immediate operands as necessary to preserve semantics. | |
virtual bool | isDesirableToPullExtFromShl (const MachineInstr &MI) const |
GlobalISel - return true if it's profitable to perform the combine: shl ([sza]ext x), y => zext (shl x, y) | |
virtual AndOrSETCCFoldKind | isDesirableToCombineLogicOpOfSETCC (const SDNode *LogicOp, const SDNode *SETCC0, const SDNode *SETCC1) const |
virtual bool | isDesirableToCommuteXorWithShift (const SDNode *N) const |
Return true if it is profitable to combine an XOR of a logical shift to create a logical shift of NOT. | |
virtual bool | isTypeDesirableForOp (unsigned, EVT VT) const |
Return true if the target has native support for the specified value type and it is 'desirable' to use the type for the given node type. | |
virtual bool | isDesirableToTransformToIntegerOp (unsigned, EVT) const |
Return true if it is profitable for dag combiner to transform a floating point op of specified opcode to an equivalent op of an integer type. | |
virtual bool | IsDesirableToPromoteOp (SDValue, EVT &) const |
This method queries the target whether it is beneficial for dag combiner to promote the specified node. | |
virtual bool | supportSwiftError () const |
Return true if the target supports swifterror attribute. | |
virtual bool | supportSplitCSR (MachineFunction *MF) const |
Return true if the target supports that a subset of CSRs for the given machine function is handled explicitly via copies. | |
virtual bool | supportKCFIBundles () const |
Return true if the target supports kcfi operand bundles. | |
virtual bool | supportPtrAuthBundles () const |
Return true if the target supports ptrauth operand bundles. | |
virtual void | initializeSplitCSR (MachineBasicBlock *Entry) const |
Perform necessary initialization to handle a subset of CSRs explicitly via copies. | |
virtual void | insertCopiesSplitCSR (MachineBasicBlock *Entry, const SmallVectorImpl< MachineBasicBlock * > &Exits) const |
Insert explicit copies in entry and exit blocks. | |
virtual SDValue | getNegatedExpression (SDValue Op, SelectionDAG &DAG, bool LegalOps, bool OptForSize, NegatibleCost &Cost, unsigned Depth=0) const |
Return the newly negated expression if the cost is not expensive, and set Cost to indicate whether the negation is cheaper or neutral. | |
SDValue | getCheaperOrNeutralNegatedExpression (SDValue Op, SelectionDAG &DAG, bool LegalOps, bool OptForSize, const NegatibleCost CostThreshold=NegatibleCost::Neutral, unsigned Depth=0) const |
SDValue | getCheaperNegatedExpression (SDValue Op, SelectionDAG &DAG, bool LegalOps, bool OptForSize, unsigned Depth=0) const |
This is the helper function to return the newly negated expression only when the cost is cheaper. | |
SDValue | getNegatedExpression (SDValue Op, SelectionDAG &DAG, bool LegalOps, bool OptForSize, unsigned Depth=0) const |
This is the helper function to return the newly negated expression if the cost is not expensive. | |
virtual bool | splitValueIntoRegisterParts (SelectionDAG &DAG, const SDLoc &DL, SDValue Val, SDValue *Parts, unsigned NumParts, MVT PartVT, std::optional< CallingConv::ID > CC) const |
Target-specific splitting of values into parts that fit a register storing a legal type. | |
virtual bool | checkForPhysRegDependency (SDNode *Def, SDNode *User, unsigned Op, const TargetRegisterInfo *TRI, const TargetInstrInfo *TII, unsigned &PhysReg, int &Cost) const |
Allows the target to handle physreg-carried dependency in target-specific way. | |
virtual SDValue | joinRegisterPartsIntoValue (SelectionDAG &DAG, const SDLoc &DL, const SDValue *Parts, unsigned NumParts, MVT PartVT, EVT ValueVT, std::optional< CallingConv::ID > CC) const |
Target-specific combining of register parts into its original value. | |
virtual SDValue | LowerFormalArguments (SDValue, CallingConv::ID, bool, const SmallVectorImpl< ISD::InputArg > &, const SDLoc &, SelectionDAG &, SmallVectorImpl< SDValue > &) const |
This hook must be implemented to lower the incoming (formal) arguments, described by the Ins array, into the specified DAG. | |
std::pair< SDValue, SDValue > | LowerCallTo (CallLoweringInfo &CLI) const |
This function lowers an abstract call to a function into an actual call. | |
virtual SDValue | LowerCall (CallLoweringInfo &, SmallVectorImpl< SDValue > &) const |
This hook must be implemented to lower calls into the specified DAG. | |
virtual void | HandleByVal (CCState *, unsigned &, Align) const |
Target-specific cleanup for formal ByVal parameters. | |
virtual bool | CanLowerReturn (CallingConv::ID, MachineFunction &, bool, const SmallVectorImpl< ISD::OutputArg > &, LLVMContext &) const |
This hook should be implemented to check whether the return values described by the Outs array can fit into the return registers. | |
virtual SDValue | LowerReturn (SDValue, CallingConv::ID, bool, const SmallVectorImpl< ISD::OutputArg > &, const SmallVectorImpl< SDValue > &, const SDLoc &, SelectionDAG &) const |
This hook must be implemented to lower outgoing return values, described by the Outs array, into the specified DAG. | |
virtual bool | isUsedByReturnOnly (SDNode *, SDValue &) const |
Return true if result of the specified node is used by a return node only. | |
virtual bool | mayBeEmittedAsTailCall (const CallInst *) const |
Return true if the target may be able to emit the call instruction as a tail call. | |
virtual Register | getRegisterByName (const char *RegName, LLT Ty, const MachineFunction &MF) const |
Return the register ID of the name passed in. | |
virtual EVT | getTypeForExtReturn (LLVMContext &Context, EVT VT, ISD::NodeType) const |
Return the type that should be used to zero or sign extend a zeroext/signext integer return value. | |
virtual bool | functionArgumentNeedsConsecutiveRegisters (Type *Ty, CallingConv::ID CallConv, bool isVarArg, const DataLayout &DL) const |
For some targets, an LLVM struct type must be broken down into multiple simple types, but the calling convention specifies that the entire struct must be passed in a block of consecutive registers. | |
virtual bool | shouldSplitFunctionArgumentsAsLittleEndian (const DataLayout &DL) const |
For most targets, an LLVM type must be broken down into multiple smaller types. | |
virtual const MCPhysReg * | getScratchRegisters (CallingConv::ID CC) const |
Returns a 0 terminated array of registers that can be safely used as scratch registers. | |
virtual ArrayRef< MCPhysReg > | getRoundingControlRegisters () const |
Returns a 0 terminated array of rounding control registers that can be attached into strict FP call. | |
virtual SDValue | prepareVolatileOrAtomicLoad (SDValue Chain, const SDLoc &DL, SelectionDAG &DAG) const |
This callback is used to prepare for a volatile or atomic load. | |
virtual void | LowerOperationWrapper (SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG) const |
This callback is invoked by the type legalizer to legalize nodes with an illegal operand type but legal result types. | |
virtual SDValue | LowerOperation (SDValue Op, SelectionDAG &DAG) const |
This callback is invoked for operations that are unsupported by the target, which are registered to use 'custom' lowering, and whose defined values are all legal. | |
virtual void | ReplaceNodeResults (SDNode *, SmallVectorImpl< SDValue > &, SelectionDAG &) const |
This callback is invoked when a node result type is illegal for the target, and the operation was registered to use 'custom' lowering for that result type. | |
virtual const char * | getTargetNodeName (unsigned Opcode) const |
This method returns the name of a target specific DAG node. | |
virtual FastISel * | createFastISel (FunctionLoweringInfo &, const TargetLibraryInfo *) const |
This method returns a target specific FastISel object, or null if the target does not support "fast" ISel. | |
bool | verifyReturnAddressArgumentIsConstant (SDValue Op, SelectionDAG &DAG) const |
virtual void | verifyTargetSDNode (const SDNode *N) const |
Check the given SDNode. Aborts if it is invalid. | |
virtual bool | ExpandInlineAsm (CallInst *) const |
This hook allows the target to expand an inline asm call to be explicit llvm code if it wants to. | |
virtual AsmOperandInfoVector | ParseConstraints (const DataLayout &DL, const TargetRegisterInfo *TRI, const CallBase &Call) const |
Split up the constraint string from the inline assembly value into the specific constraints and their prefixes, and also tie in the associated operand values. | |
virtual ConstraintWeight | getMultipleConstraintMatchWeight (AsmOperandInfo &info, int maIndex) const |
Examine constraint type and operand type and determine a weight value. | |
virtual ConstraintWeight | getSingleConstraintMatchWeight (AsmOperandInfo &info, const char *constraint) const |
Examine constraint string and operand type and determine a weight value. | |
virtual void | ComputeConstraintToUse (AsmOperandInfo &OpInfo, SDValue Op, SelectionDAG *DAG=nullptr) const |
Determines the constraint code and constraint type to use for the specific AsmOperandInfo, setting OpInfo.ConstraintCode and OpInfo.ConstraintType. | |
virtual ConstraintType | getConstraintType (StringRef Constraint) const |
Given a constraint, return the type of constraint it is for this target. | |
ConstraintGroup | getConstraintPreferences (AsmOperandInfo &OpInfo) const |
Given an OpInfo with list of constraints codes as strings, return a sorted Vector of pairs of constraint codes and their types in priority of what we'd prefer to lower them as. | |
virtual std::pair< unsigned, const TargetRegisterClass * > | getRegForInlineAsmConstraint (const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const |
Given a physical register constraint (e.g. {edx}), return the register number and the register class for the register. | |
virtual InlineAsm::ConstraintCode | getInlineAsmMemConstraint (StringRef ConstraintCode) const |
virtual const char * | LowerXConstraint (EVT ConstraintVT) const |
Try to replace an X constraint, which matches anything, with another that has more specific requirements based on the type of the corresponding operand. | |
virtual void | LowerAsmOperandForConstraint (SDValue Op, StringRef Constraint, std::vector< SDValue > &Ops, SelectionDAG &DAG) const |
Lower the specified operand into the Ops vector. | |
virtual SDValue | LowerAsmOutputForConstraint (SDValue &Chain, SDValue &Glue, const SDLoc &DL, const AsmOperandInfo &OpInfo, SelectionDAG &DAG) const |
virtual void | CollectTargetIntrinsicOperands (const CallInst &I, SmallVectorImpl< SDValue > &Ops, SelectionDAG &DAG) const |
SDValue | BuildSDIV (SDNode *N, SelectionDAG &DAG, bool IsAfterLegalization, bool IsAfterLegalTypes, SmallVectorImpl< SDNode * > &Created) const |
Given an ISD::SDIV node expressing a divide by constant, return a DAG expression to select that will generate the same value by multiplying by a magic number. | |
SDValue | BuildUDIV (SDNode *N, SelectionDAG &DAG, bool IsAfterLegalization, bool IsAfterLegalTypes, SmallVectorImpl< SDNode * > &Created) const |
Given an ISD::UDIV node expressing a divide by constant, return a DAG expression to select that will generate the same value by multiplying by a magic number. | |
SDValue | buildSDIVPow2WithCMov (SDNode *N, const APInt &Divisor, SelectionDAG &DAG, SmallVectorImpl< SDNode * > &Created) const |
Build sdiv by power-of-2 with conditional move instructions. Ref: "Hacker's Delight" by Henry Warren, 10-1. If conditional move/branch is preferred, we lower sdiv x, +/-2**k into: bgez x, label; add x, x, 2**k-1; label: sra res, x, k; neg res, res (when the divisor is negative). | |
virtual SDValue | BuildSDIVPow2 (SDNode *N, const APInt &Divisor, SelectionDAG &DAG, SmallVectorImpl< SDNode * > &Created) const |
Targets may override this function to provide custom SDIV lowering for power-of-2 denominators. | |
virtual SDValue | BuildSREMPow2 (SDNode *N, const APInt &Divisor, SelectionDAG &DAG, SmallVectorImpl< SDNode * > &Created) const |
Targets may override this function to provide custom SREM lowering for power-of-2 denominators. | |
virtual unsigned | combineRepeatedFPDivisors () const |
Indicate whether this target prefers to combine FDIVs with the same divisor. | |
virtual SDValue | getSqrtEstimate (SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps, bool &UseOneConstNR, bool Reciprocal) const |
Hooks for building estimates in place of slower divisions and square roots. | |
SDValue | createSelectForFMINNUM_FMAXNUM (SDNode *Node, SelectionDAG &DAG) const |
Try to convert the fminnum/fmaxnum to a compare/select sequence. | |
virtual SDValue | getRecipEstimate (SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps) const |
Return a reciprocal estimate value for the input operand. | |
virtual SDValue | getSqrtInputTest (SDValue Operand, SelectionDAG &DAG, const DenormalMode &Mode) const |
Return a target-dependent comparison result if the input operand is suitable for use with a square root estimate calculation. | |
virtual SDValue | getSqrtResultForDenormInput (SDValue Operand, SelectionDAG &DAG) const |
Return a target-dependent result if the input operand is not suitable for use with a square root estimate calculation. | |
bool | expandMUL_LOHI (unsigned Opcode, EVT VT, const SDLoc &dl, SDValue LHS, SDValue RHS, SmallVectorImpl< SDValue > &Result, EVT HiLoVT, SelectionDAG &DAG, MulExpansionKind Kind, SDValue LL=SDValue(), SDValue LH=SDValue(), SDValue RL=SDValue(), SDValue RH=SDValue()) const |
Expand a MUL or [US]MUL_LOHI of n-bit values into two or four nodes, respectively, each computing an n/2-bit part of the result. | |
bool | expandMUL (SDNode *N, SDValue &Lo, SDValue &Hi, EVT HiLoVT, SelectionDAG &DAG, MulExpansionKind Kind, SDValue LL=SDValue(), SDValue LH=SDValue(), SDValue RL=SDValue(), SDValue RH=SDValue()) const |
Expand a MUL into two nodes. | |
bool | expandDIVREMByConstant (SDNode *N, SmallVectorImpl< SDValue > &Result, EVT HiLoVT, SelectionDAG &DAG, SDValue LL=SDValue(), SDValue LH=SDValue()) const |
Attempt to expand an n-bit div/rem/divrem by constant using a n/2-bit urem by constant and other arithmetic ops. | |
SDValue | expandFunnelShift (SDNode *N, SelectionDAG &DAG) const |
Expand funnel shift. | |
SDValue | expandROT (SDNode *N, bool AllowVectorOps, SelectionDAG &DAG) const |
Expand rotations. | |
void | expandShiftParts (SDNode *N, SDValue &Lo, SDValue &Hi, SelectionDAG &DAG) const |
Expand shift-by-parts. | |
bool | expandFP_TO_SINT (SDNode *N, SDValue &Result, SelectionDAG &DAG) const |
Expand float(f32) to SINT(i64) conversion. | |
bool | expandFP_TO_UINT (SDNode *N, SDValue &Result, SDValue &Chain, SelectionDAG &DAG) const |
Expand float to UINT conversion. | |
bool | expandUINT_TO_FP (SDNode *N, SDValue &Result, SDValue &Chain, SelectionDAG &DAG) const |
Expand UINT(i64) to double(f64) conversion. | |
SDValue | expandFMINNUM_FMAXNUM (SDNode *N, SelectionDAG &DAG) const |
Expand fminnum/fmaxnum into fminnum_ieee/fmaxnum_ieee with quieted inputs. | |
SDValue | expandFMINIMUM_FMAXIMUM (SDNode *N, SelectionDAG &DAG) const |
Expand fminimum/fmaximum into multiple comparison with selects. | |
SDValue | expandFMINIMUMNUM_FMAXIMUMNUM (SDNode *N, SelectionDAG &DAG) const |
Expand fminimumnum/fmaximumnum into multiple comparison with selects. | |
SDValue | expandFP_TO_INT_SAT (SDNode *N, SelectionDAG &DAG) const |
Expand FP_TO_[US]INT_SAT into FP_TO_[US]INT and selects or min/max. | |
SDValue | expandRoundInexactToOdd (EVT ResultVT, SDValue Op, const SDLoc &DL, SelectionDAG &DAG) const |
Truncate Op to ResultVT. | |
SDValue | expandFP_ROUND (SDNode *Node, SelectionDAG &DAG) const |
Expand round(fp) to fp conversion. | |
SDValue | expandIS_FPCLASS (EVT ResultVT, SDValue Op, FPClassTest Test, SDNodeFlags Flags, const SDLoc &DL, SelectionDAG &DAG) const |
Expand check for floating point class. | |
SDValue | expandCTPOP (SDNode *N, SelectionDAG &DAG) const |
Expand CTPOP nodes. | |
SDValue | expandVPCTPOP (SDNode *N, SelectionDAG &DAG) const |
Expand VP_CTPOP nodes. | |
SDValue | expandCTLZ (SDNode *N, SelectionDAG &DAG) const |
Expand CTLZ/CTLZ_ZERO_UNDEF nodes. | |
SDValue | expandVPCTLZ (SDNode *N, SelectionDAG &DAG) const |
Expand VP_CTLZ/VP_CTLZ_ZERO_UNDEF nodes. | |
SDValue | CTTZTableLookup (SDNode *N, SelectionDAG &DAG, const SDLoc &DL, EVT VT, SDValue Op, unsigned NumBitsPerElt) const |
Expand CTTZ via Table Lookup. | |
SDValue | expandCTTZ (SDNode *N, SelectionDAG &DAG) const |
Expand CTTZ/CTTZ_ZERO_UNDEF nodes. | |
SDValue | expandVPCTTZ (SDNode *N, SelectionDAG &DAG) const |
Expand VP_CTTZ/VP_CTTZ_ZERO_UNDEF nodes. | |
SDValue | expandVPCTTZElements (SDNode *N, SelectionDAG &DAG) const |
Expand VP_CTTZ_ELTS/VP_CTTZ_ELTS_ZERO_UNDEF nodes. | |
SDValue | expandABS (SDNode *N, SelectionDAG &DAG, bool IsNegative=false) const |
Expand ABS nodes. | |
SDValue | expandABD (SDNode *N, SelectionDAG &DAG) const |
Expand ABDS/ABDU nodes. | |
SDValue | expandAVG (SDNode *N, SelectionDAG &DAG) const |
Expand vector/scalar AVGCEILS/AVGCEILU/AVGFLOORS/AVGFLOORU nodes. | |
SDValue | expandBSWAP (SDNode *N, SelectionDAG &DAG) const |
Expand BSWAP nodes. | |
SDValue | expandVPBSWAP (SDNode *N, SelectionDAG &DAG) const |
Expand VP_BSWAP nodes. | |
SDValue | expandBITREVERSE (SDNode *N, SelectionDAG &DAG) const |
Expand BITREVERSE nodes. | |
SDValue | expandVPBITREVERSE (SDNode *N, SelectionDAG &DAG) const |
Expand VP_BITREVERSE nodes. | |
std::pair< SDValue, SDValue > | scalarizeVectorLoad (LoadSDNode *LD, SelectionDAG &DAG) const |
Turn load of vector type into a load of the individual elements. | |
SDValue | scalarizeVectorStore (StoreSDNode *ST, SelectionDAG &DAG) const |
std::pair< SDValue, SDValue > | expandUnalignedLoad (LoadSDNode *LD, SelectionDAG &DAG) const |
Expands an unaligned load to 2 half-size loads for an integer, and possibly more for vectors. | |
SDValue | expandUnalignedStore (StoreSDNode *ST, SelectionDAG &DAG) const |
Expands an unaligned store to 2 half-size stores for integer values, and possibly more for vectors. | |
SDValue | IncrementMemoryAddress (SDValue Addr, SDValue Mask, const SDLoc &DL, EVT DataVT, SelectionDAG &DAG, bool IsCompressedMemory) const |
Increments memory address Addr according to the type of the value DataVT that should be stored. | |
SDValue | getVectorElementPointer (SelectionDAG &DAG, SDValue VecPtr, EVT VecVT, SDValue Index) const |
Get a pointer to vector element Index located in memory for a vector of type VecVT starting at a base address of VecPtr. | |
SDValue | getVectorSubVecPointer (SelectionDAG &DAG, SDValue VecPtr, EVT VecVT, EVT SubVecVT, SDValue Index) const |
Get a pointer to a sub-vector of type SubVecVT at index Index located in memory for a vector of type VecVT starting at a base address of VecPtr. | |
SDValue | expandIntMINMAX (SDNode *Node, SelectionDAG &DAG) const |
Method for building the DAG expansion of ISD::[US][MIN|MAX]. | |
SDValue | expandAddSubSat (SDNode *Node, SelectionDAG &DAG) const |
Method for building the DAG expansion of ISD::[US][ADD|SUB]SAT. | |
SDValue | expandCMP (SDNode *Node, SelectionDAG &DAG) const |
Method for building the DAG expansion of ISD::[US]CMP. | |
SDValue | expandShlSat (SDNode *Node, SelectionDAG &DAG) const |
Method for building the DAG expansion of ISD::[US]SHLSAT. | |
SDValue | expandFixedPointMul (SDNode *Node, SelectionDAG &DAG) const |
Method for building the DAG expansion of ISD::[U|S]MULFIX[SAT]. | |
SDValue | expandFixedPointDiv (unsigned Opcode, const SDLoc &dl, SDValue LHS, SDValue RHS, unsigned Scale, SelectionDAG &DAG) const |
Method for building the DAG expansion of ISD::[US]DIVFIX[SAT]. | |
void | expandUADDSUBO (SDNode *Node, SDValue &Result, SDValue &Overflow, SelectionDAG &DAG) const |
Method for building the DAG expansion of ISD::U(ADD|SUB)O. | |
void | expandSADDSUBO (SDNode *Node, SDValue &Result, SDValue &Overflow, SelectionDAG &DAG) const |
Method for building the DAG expansion of ISD::S(ADD|SUB)O. | |
bool | expandMULO (SDNode *Node, SDValue &Result, SDValue &Overflow, SelectionDAG &DAG) const |
Method for building the DAG expansion of ISD::[US]MULO. | |
void | forceExpandWideMUL (SelectionDAG &DAG, const SDLoc &dl, bool Signed, EVT WideVT, const SDValue LL, const SDValue LH, const SDValue RL, const SDValue RH, SDValue &Lo, SDValue &Hi) const |
forceExpandWideMUL - Unconditionally expand a MUL into either a libcall or brute force via a wide multiplication. | |
void | forceExpandWideMUL (SelectionDAG &DAG, const SDLoc &dl, bool Signed, const SDValue LHS, const SDValue RHS, SDValue &Lo, SDValue &Hi) const |
Same as above, but creates the upper halves of each operand by sign/zero-extending the operands. | |
SDValue | expandVecReduce (SDNode *Node, SelectionDAG &DAG) const |
Expand a VECREDUCE_* into an explicit calculation. | |
SDValue | expandVecReduceSeq (SDNode *Node, SelectionDAG &DAG) const |
Expand a VECREDUCE_SEQ_* into an explicit ordered calculation. | |
bool | expandREM (SDNode *Node, SDValue &Result, SelectionDAG &DAG) const |
Expand an SREM or UREM using SDIV/UDIV or SDIVREM/UDIVREM, if legal. | |
SDValue | expandVectorSplice (SDNode *Node, SelectionDAG &DAG) const |
Method for building the DAG expansion of ISD::VECTOR_SPLICE. | |
SDValue | expandVECTOR_COMPRESS (SDNode *Node, SelectionDAG &DAG) const |
Expand a vector VECTOR_COMPRESS into a sequence of extract element, store temporarily, advance store position, before re-loading the final vector. | |
bool | LegalizeSetCCCondCode (SelectionDAG &DAG, EVT VT, SDValue &LHS, SDValue &RHS, SDValue &CC, SDValue Mask, SDValue EVL, bool &NeedInvert, const SDLoc &dl, SDValue &Chain, bool IsSignaling=false) const |
Legalize a SETCC or VP_SETCC with given LHS and RHS and condition code CC on the current target. | |
virtual MachineBasicBlock * | EmitInstrWithCustomInserter (MachineInstr &MI, MachineBasicBlock *MBB) const |
This method should be implemented by targets that mark instructions with the 'usesCustomInserter' flag. | |
virtual void | AdjustInstrPostInstrSelection (MachineInstr &MI, SDNode *Node) const |
This method should be implemented by targets that mark instructions with the 'hasPostISelHook' flag. | |
virtual bool | useLoadStackGuardNode () const |
If this function returns true, SelectionDAGBuilder emits a LOAD_STACK_GUARD node when it is lowering Intrinsic::stackprotector. | |
virtual SDValue | emitStackGuardXorFP (SelectionDAG &DAG, SDValue Val, const SDLoc &DL) const |
virtual SDValue | LowerToTLSEmulatedModel (const GlobalAddressSDNode *GA, SelectionDAG &DAG) const |
Lower TLS global address SDNode for target independent emulated TLS model. | |
virtual SDValue | expandIndirectJTBranch (const SDLoc &dl, SDValue Value, SDValue Addr, int JTI, SelectionDAG &DAG) const |
Expands target specific indirect branch for the case of JumpTable expansion. | |
SDValue | lowerCmpEqZeroToCtlzSrl (SDValue Op, SelectionDAG &DAG) const |
virtual bool | isXAndYEqZeroPreferableToXAndYEqY (ISD::CondCode, EVT) const |
Public Member Functions inherited from llvm::TargetLoweringBase | |
virtual void | markLibCallAttributes (MachineFunction *MF, unsigned CC, ArgListTy &Args) const |
TargetLoweringBase (const TargetMachine &TM) | |
NOTE: The TargetMachine owns TLOF. | |
TargetLoweringBase (const TargetLoweringBase &)=delete | |
TargetLoweringBase & | operator= (const TargetLoweringBase &)=delete |
virtual | ~TargetLoweringBase ()=default |
bool | isStrictFPEnabled () const |
Return true if the target supports strict float operations. | |
const TargetMachine & | getTargetMachine () const |
virtual bool | useSoftFloat () const |
virtual MVT | getPointerTy (const DataLayout &DL, uint32_t AS=0) const |
Return the pointer type for the given address space, defaults to the pointer type from the data layout. | |
virtual MVT | getPointerMemTy (const DataLayout &DL, uint32_t AS=0) const |
Return the in-memory pointer type for the given address space, defaults to the pointer type from the data layout. | |
MVT | getFrameIndexTy (const DataLayout &DL) const |
Return the type for frame index, which is determined by the alloca address space specified through the data layout. | |
MVT | getProgramPointerTy (const DataLayout &DL) const |
Return the type for code pointers, which is determined by the program address space specified through the data layout. | |
virtual MVT | getFenceOperandTy (const DataLayout &DL) const |
Return the type for operands of fence. | |
virtual MVT | getScalarShiftAmountTy (const DataLayout &, EVT) const |
Return the type to use for a scalar shift opcode, given the shifted amount type. | |
EVT | getShiftAmountTy (EVT LHSTy, const DataLayout &DL) const |
Returns the type for the shift amount of a shift opcode. | |
virtual LLVM_READONLY LLT | getPreferredShiftAmountTy (LLT ShiftValueTy) const |
Return the preferred type to use for a shift opcode, given the shifted amount type is ShiftValueTy . | |
virtual MVT | getVectorIdxTy (const DataLayout &DL) const |
Returns the type to be used for the index operand of: ISD::INSERT_VECTOR_ELT, ISD::EXTRACT_VECTOR_ELT, ISD::INSERT_SUBVECTOR, and ISD::EXTRACT_SUBVECTOR. | |
virtual MVT | getVPExplicitVectorLengthTy () const |
Returns the type to be used for the EVL/AVL operand of VP nodes: ISD::VP_ADD, ISD::VP_SUB, etc. | |
virtual MachineMemOperand::Flags | getTargetMMOFlags (const Instruction &I) const |
This callback is used to inspect load/store instructions and add target-specific MachineMemOperand flags to them. | |
virtual MachineMemOperand::Flags | getTargetMMOFlags (const MemSDNode &Node) const |
This callback is used to inspect load/store SDNode. | |
MachineMemOperand::Flags | getLoadMemOperandFlags (const LoadInst &LI, const DataLayout &DL, AssumptionCache *AC=nullptr, const TargetLibraryInfo *LibInfo=nullptr) const |
MachineMemOperand::Flags | getStoreMemOperandFlags (const StoreInst &SI, const DataLayout &DL) const |
MachineMemOperand::Flags | getAtomicMemOperandFlags (const Instruction &AI, const DataLayout &DL) const |
virtual bool | isSelectSupported (SelectSupportKind) const |
virtual bool | shouldExpandGetActiveLaneMask (EVT VT, EVT OpVT) const |
Return true if the @llvm.get.active.lane.mask intrinsic should be expanded using generic code in SelectionDAGBuilder. | |
virtual bool | shouldExpandGetVectorLength (EVT CountVT, unsigned VF, bool IsScalable) const |
virtual bool | shouldExpandCttzElements (EVT VT) const |
Return true if the @llvm.experimental.cttz.elts intrinsic should be expanded using generic code in SelectionDAGBuilder. | |
unsigned | getBitWidthForCttzElements (Type *RetTy, ElementCount EC, bool ZeroIsPoison, const ConstantRange *VScaleRange) const |
Return the minimum number of bits required to hold the maximum possible number of trailing zero vector elements. | |
virtual bool | shouldReassociateReduction (unsigned RedOpc, EVT VT) const |
virtual bool | reduceSelectOfFPConstantLoads (EVT CmpOpVT) const |
Return true if it is profitable to convert a select of FP constants into a constant pool load whose address depends on the select condition. | |
bool | hasMultipleConditionRegisters () const |
Return true if multiple condition registers are available. | |
bool | hasExtractBitsInsn () const |
Return true if the target has BitExtract instructions. | |
virtual TargetLoweringBase::LegalizeTypeAction | getPreferredVectorAction (MVT VT) const |
Return the preferred vector type legalization action. | |
virtual bool | softPromoteHalfType () const |
virtual bool | useFPRegsForHalfType () const |
virtual bool | shouldExpandBuildVectorWithShuffles (EVT, unsigned DefinedValues) const |
virtual bool | isIntDivCheap (EVT VT, AttributeList Attr) const |
Return true if integer divide is usually cheaper than a sequence of several shifts, adds, and multiplies for this target. | |
virtual bool | hasStandaloneRem (EVT VT) const |
Return true if the target can handle a standalone remainder operation. | |
virtual bool | isFsqrtCheap (SDValue X, SelectionDAG &DAG) const |
Return true if SQRT(X) shouldn't be replaced with X*RSQRT(X). | |
int | getRecipEstimateSqrtEnabled (EVT VT, MachineFunction &MF) const |
Return a ReciprocalEstimate enum value for a square root of the given type based on the function's attributes. | |
int | getRecipEstimateDivEnabled (EVT VT, MachineFunction &MF) const |
Return a ReciprocalEstimate enum value for a division of the given type based on the function's attributes. | |
int | getSqrtRefinementSteps (EVT VT, MachineFunction &MF) const |
Return the refinement step count for a square root of the given type based on the function's attributes. | |
int | getDivRefinementSteps (EVT VT, MachineFunction &MF) const |
Return the refinement step count for a division of the given type based on the function's attributes. | |
bool | isSlowDivBypassed () const |
Returns true if target has indicated at least one type should be bypassed. | |
const DenseMap< unsigned int, unsigned int > & | getBypassSlowDivWidths () const |
Returns map of slow types for division or remainder with corresponding fast types. | |
virtual bool | isVScaleKnownToBeAPowerOfTwo () const |
Return true only if vscale must be a power of two. | |
bool | isJumpExpensive () const |
Return true if Flow Control is an expensive operation that should be avoided. | |
virtual CondMergingParams | getJumpConditionMergingParams (Instruction::BinaryOps, const Value *, const Value *) const |
bool | isPredictableSelectExpensive () const |
Return true if selects are only cheaper than branches if the branch is unlikely to be predicted right. | |
virtual bool | fallBackToDAGISel (const Instruction &Inst) const |
virtual bool | isLoadBitCastBeneficial (EVT LoadVT, EVT BitcastVT, const SelectionDAG &DAG, const MachineMemOperand &MMO) const |
Return true if the following transform is beneficial: fold (conv (load x)) -> (load (conv*)x) On architectures that don't natively support some vector loads efficiently, casting the load to a smaller vector of larger types and loading is more efficient, however, this can be undone by optimizations in dag combiner. | |
virtual bool | isStoreBitCastBeneficial (EVT StoreVT, EVT BitcastVT, const SelectionDAG &DAG, const MachineMemOperand &MMO) const |
Return true if the following transform is beneficial: (store (y (conv x)), y*)) -> (store x, (x*)) | |
virtual bool | storeOfVectorConstantIsCheap (bool IsZero, EVT MemVT, unsigned NumElem, unsigned AddrSpace) const |
Return true if it is expected to be cheaper to do a store of vector constant with the given size and type for the address space than to store the individual scalar element constants. | |
virtual bool | mergeStoresAfterLegalization (EVT MemVT) const |
Allow store merging for the specified type after legalization in addition to before legalization. | |
virtual bool | canMergeStoresTo (unsigned AS, EVT MemVT, const MachineFunction &MF) const |
Returns true if it's reasonable to merge stores to MemVT size. | |
virtual bool | isCheapToSpeculateCttz (Type *Ty) const |
Return true if it is cheap to speculate a call to intrinsic cttz. | |
virtual bool | isCheapToSpeculateCtlz (Type *Ty) const |
Return true if it is cheap to speculate a call to intrinsic ctlz. | |
virtual bool | isCtlzFast () const |
Return true if ctlz instruction is fast. | |
virtual bool | isCtpopFast (EVT VT) const |
Return true if ctpop instruction is fast. | |
virtual unsigned | getCustomCtpopCost (EVT VT, ISD::CondCode Cond) const |
Return the maximum number of "x & (x - 1)" operations that can be done instead of deferring to a custom CTPOP. | |
virtual bool | isEqualityCmpFoldedWithSignedCmp () const |
Return true if instruction generated for equality comparison is folded with instruction generated for signed comparison. | |
virtual bool | preferZeroCompareBranch () const |
Return true if the heuristic to prefer icmp eq zero should be used in code gen prepare. | |
virtual bool | isMultiStoresCheaperThanBitsMerge (EVT LTy, EVT HTy) const |
Return true if it is cheaper to split the store of a merged int val from a pair of smaller values into multiple stores. | |
virtual bool | isMaskAndCmp0FoldingBeneficial (const Instruction &AndI) const |
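Return true if the target supports combining a chain like "%andResult = and %val1, #mask; %icmpResult = icmp %andResult, 0" into a single machine instruction of a form like "cc = test %register, #mask". | |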
virtual bool | areTwoSDNodeTargetMMOFlagsMergeable (const MemSDNode &NodeX, const MemSDNode &NodeY) const |
Return true if it is valid to merge the TargetMMOFlags in two SDNodes. | |
virtual bool | convertSetCCLogicToBitwiseLogic (EVT VT) const |
Use bitwise logic to make pairs of compares more efficient. | |
virtual MVT | hasFastEqualityCompare (unsigned NumBits) const |
Return the preferred operand type if the target has a quick way to compare integer values of the given size. | |
virtual bool | hasAndNotCompare (SDValue Y) const |
Return true if the target should transform: (X & Y) == Y --> (~X & Y) == 0, and (X & Y) != Y --> (~X & Y) != 0. | |
virtual bool | hasAndNot (SDValue X) const |
Return true if the target has a bitwise and-not operation: X = ~A & B. This can be used to simplify select or other instructions. | |
virtual bool | hasBitTest (SDValue X, SDValue Y) const |
Return true if the target has a bit-test instruction: (X & (1 << Y)) ==/!= 0. This knowledge can be used to prevent breaking the pattern, or creating it if it could be recognized. | |
virtual bool | shouldFoldMaskToVariableShiftPair (SDValue X) const |
There are two ways to clear extreme bits (either low or high): Mask: x & (-1 << y) (the instcombine canonical form) Shifts: x >> y << y Return true if the variant with 2 variable shifts is preferred. | |
virtual bool | shouldFoldConstantShiftPairToMask (const SDNode *N, CombineLevel Level) const |
Return true if it is profitable to fold a pair of shifts into a mask. | |
virtual bool | shouldTransformSignedTruncationCheck (EVT XVT, unsigned KeptBits) const |
Should we transform the IR-optimal check for whether given truncation down into KeptBits would be truncating or not: (add x, (1 << (KeptBits-1))) srccond (1 << KeptBits) Into its more traditional form: ((x << C) a>> C) dstcond x Return true if we should transform. | |
virtual bool | shouldProduceAndByConstByHoistingConstFromShiftsLHSOfAnd (SDValue X, ConstantSDNode *XC, ConstantSDNode *CC, SDValue Y, unsigned OldShiftOpcode, unsigned NewShiftOpcode, SelectionDAG &DAG) const |
Given the pattern (X & (C l>>/<< Y)) ==/!= 0 return true if it should be transformed into: ((X <</l>> Y) & C) ==/!= 0 WARNING: if 'X' is a constant, the fold may deadlock! FIXME: we could avoid passing XC, but we can't use isConstOrConstSplat() here because it can end up being not linked in. | |
virtual bool | optimizeFMulOrFDivAsShiftAddBitcast (SDNode *N, SDValue FPConst, SDValue IntPow2) const |
virtual unsigned | preferedOpcodeForCmpEqPiecesOfOperand (EVT VT, unsigned ShiftOpc, bool MayTransformRotate, const APInt &ShiftOrRotateAmt, const std::optional< APInt > &AndMask) const |
virtual bool | preferIncOfAddToSubOfNot (EVT VT) const |
These two forms are equivalent: sub y, (xor x, -1) add (add x, 1), y The variant with two add's is IR-canonical. | |
virtual bool | preferABDSToABSWithNSW (EVT VT) const |
virtual bool | preferScalarizeSplat (SDNode *N) const |
virtual bool | preferSextInRegOfTruncate (EVT TruncVT, EVT VT, EVT ExtVT) const |
bool | enableExtLdPromotion () const |
Return true if the target wants to use the optimization that turns ext(promotableInst1(...(promotableInstN(load)))) into promotedInst1(...(promotedInstN(ext(load)))). | |
virtual bool | canCombineStoreAndExtract (Type *VectorTy, Value *Idx, unsigned &Cost) const |
Return true if the target can combine store(extractelement VectorTy, Idx). | |
virtual bool | shallExtractConstSplatVectorElementToStore (Type *VectorTy, unsigned ElemSizeInBits, unsigned &Index) const |
Return true if the target shall perform extract vector element and store given that the vector is known to be splat of constant. | |
virtual bool | shouldSplatInsEltVarIndex (EVT) const |
Return true if inserting a scalar into a variable element of an undef vector is more efficiently handled by splatting the scalar instead. | |
virtual bool | enableAggressiveFMAFusion (EVT VT) const |
Return true if target always benefits from combining into FMA for a given value type. | |
virtual bool | enableAggressiveFMAFusion (LLT Ty) const |
Return true if target always benefits from combining into FMA for a given value type. | |
virtual EVT | getSetCCResultType (const DataLayout &DL, LLVMContext &Context, EVT VT) const |
Return the ValueType of the result of SETCC operations. | |
virtual MVT::SimpleValueType | getCmpLibcallReturnType () const |
Return the ValueType for comparison libcalls. | |
BooleanContent | getBooleanContents (bool isVec, bool isFloat) const |
For targets without i1 registers, this gives the nature of the high-bits of boolean values held in types wider than i1. | |
BooleanContent | getBooleanContents (EVT Type) const |
SDValue | promoteTargetBoolean (SelectionDAG &DAG, SDValue Bool, EVT ValVT) const |
Promote the given target boolean to a target boolean of the given type. | |
Sched::Preference | getSchedulingPreference () const |
Return target scheduling preference. | |
virtual Sched::Preference | getSchedulingPreference (SDNode *) const |
Some scheduler, e.g. hybrid, can switch to different scheduling heuristics for different nodes. | |
virtual const TargetRegisterClass * | getRegClassFor (MVT VT, bool isDivergent=false) const |
Return the register class that should be used for the specified value type. | |
virtual bool | requiresUniformRegister (MachineFunction &MF, const Value *) const |
Allows target to decide about the register class of the specific value that is live outside the defining block. | |
virtual const TargetRegisterClass * | getRepRegClassFor (MVT VT) const |
Return the 'representative' register class for the specified value type. | |
virtual uint8_t | getRepRegClassCostFor (MVT VT) const |
Return the cost of the 'representative' register class for the specified value type. | |
virtual ShiftLegalizationStrategy | preferredShiftLegalizationStrategy (SelectionDAG &DAG, SDNode *N, unsigned ExpansionFactor) const |
bool | isTypeLegal (EVT VT) const |
Return true if the target has native support for the specified value type. | |
const ValueTypeActionImpl & | getValueTypeActions () const |
LegalizeKind | getTypeConversion (LLVMContext &Context, EVT VT) const |
Return pair that represents the legalization kind (first) that needs to happen to EVT (second) in order to type-legalize it. | |
LegalizeTypeAction | getTypeAction (LLVMContext &Context, EVT VT) const |
Return how we should legalize values of this type, either it is already legal (return 'Legal') or we need to promote it to a larger type (return 'Promote'), or we need to expand it into multiple registers of smaller integer type (return 'Expand'). | |
LegalizeTypeAction | getTypeAction (MVT VT) const |
virtual EVT | getTypeToTransformTo (LLVMContext &Context, EVT VT) const |
For types supported by the target, this is an identity function. | |
EVT | getTypeToExpandTo (LLVMContext &Context, EVT VT) const |
For types supported by the target, this is an identity function. | |
unsigned | getVectorTypeBreakdown (LLVMContext &Context, EVT VT, EVT &IntermediateVT, unsigned &NumIntermediates, MVT &RegisterVT) const |
Vector types are broken down into some number of legal first class types. | |
virtual unsigned | getVectorTypeBreakdownForCallingConv (LLVMContext &Context, CallingConv::ID CC, EVT VT, EVT &IntermediateVT, unsigned &NumIntermediates, MVT &RegisterVT) const |
Certain targets such as MIPS require that some types such as vectors are always broken down into scalars in some contexts. | |
virtual bool | getTgtMemIntrinsic (IntrinsicInfo &, const CallInst &, MachineFunction &, unsigned) const |
Given an intrinsic, checks if on the target the intrinsic will need to map to a MemIntrinsicNode (touches memory). | |
virtual bool | isFPImmLegal (const APFloat &, EVT, bool ForCodeSize=false) const |
Returns true if the target can instruction select the specified FP immediate natively. | |
virtual bool | isShuffleMaskLegal (ArrayRef< int >, EVT) const |
Targets can use this to indicate that they only support some VECTOR_SHUFFLE operations, those with specific masks. | |
virtual bool | canOpTrap (unsigned Op, EVT VT) const |
Returns true if the operation can trap for the value type. | |
virtual bool | isVectorClearMaskLegal (ArrayRef< int >, EVT) const |
Similar to isShuffleMaskLegal. | |
virtual LegalizeAction | getCustomOperationAction (SDNode &Op) const |
How to legalize this custom operation? | |
LegalizeAction | getOperationAction (unsigned Op, EVT VT) const |
Return how this operation should be treated: either it is legal, needs to be promoted to a larger size, needs to be expanded to some other code sequence, or the target has a custom expander for it. | |
virtual bool | isSupportedFixedPointOperation (unsigned Op, EVT VT, unsigned Scale) const |
Custom method defined by each target to indicate if an operation which may require a scale is supported natively by the target. | |
LegalizeAction | getFixedPointOperationAction (unsigned Op, EVT VT, unsigned Scale) const |
Some fixed point operations may be natively supported by the target but only for specific scales. | |
LegalizeAction | getStrictFPOperationAction (unsigned Op, EVT VT) const |
bool | isOperationLegalOrCustom (unsigned Op, EVT VT, bool LegalOnly=false) const |
Return true if the specified operation is legal on this target or can be made legal with custom lowering. | |
bool | isOperationLegalOrPromote (unsigned Op, EVT VT, bool LegalOnly=false) const |
Return true if the specified operation is legal on this target or can be made legal using promotion. | |
bool | isOperationLegalOrCustomOrPromote (unsigned Op, EVT VT, bool LegalOnly=false) const |
Return true if the specified operation is legal on this target or can be made legal with custom lowering or using promotion. | |
bool | isOperationCustom (unsigned Op, EVT VT) const |
Return true if the operation uses custom lowering, regardless of whether the type is legal or not. | |
virtual bool | areJTsAllowed (const Function *Fn) const |
Return true if lowering to a jump table is allowed. | |
bool | rangeFitsInWord (const APInt &Low, const APInt &High, const DataLayout &DL) const |
Check whether the range [Low,High] fits in a machine word. | |
virtual bool | isSuitableForJumpTable (const SwitchInst *SI, uint64_t NumCases, uint64_t Range, ProfileSummaryInfo *PSI, BlockFrequencyInfo *BFI) const |
Return true if lowering to a jump table is suitable for a set of case clusters which may contain NumCases cases, Range range of values. | |
virtual MVT | getPreferredSwitchConditionType (LLVMContext &Context, EVT ConditionVT) const |
Returns preferred type for switch condition. | |
bool | isSuitableForBitTests (unsigned NumDests, unsigned NumCmps, const APInt &Low, const APInt &High, const DataLayout &DL) const |
Return true if lowering to a bit test is suitable for a set of case clusters which contains NumDests unique destinations, Low and High as its lowest and highest case values, and expects NumCmps case value comparisons. | |
bool | isOperationExpand (unsigned Op, EVT VT) const |
Return true if the specified operation is illegal on this target or unlikely to be made legal with custom lowering. | |
bool | isOperationLegal (unsigned Op, EVT VT) const |
Return true if the specified operation is legal on this target. | |
LegalizeAction | getLoadExtAction (unsigned ExtType, EVT ValVT, EVT MemVT) const |
Return how this load with extension should be treated: either it is legal, needs to be promoted to a larger size, needs to be expanded to some other code sequence, or the target has a custom expander for it. | |
bool | isLoadExtLegal (unsigned ExtType, EVT ValVT, EVT MemVT) const |
Return true if the specified load with extension is legal on this target. | |
bool | isLoadExtLegalOrCustom (unsigned ExtType, EVT ValVT, EVT MemVT) const |
Return true if the specified load with extension is legal or custom on this target. | |
LegalizeAction | getAtomicLoadExtAction (unsigned ExtType, EVT ValVT, EVT MemVT) const |
Same as getLoadExtAction, but for atomic loads. | |
bool | isAtomicLoadExtLegal (unsigned ExtType, EVT ValVT, EVT MemVT) const |
Return true if the specified atomic load with extension is legal on this target. | |
LegalizeAction | getTruncStoreAction (EVT ValVT, EVT MemVT) const |
Return how this store with truncation should be treated: either it is legal, needs to be promoted to a larger size, needs to be expanded to some other code sequence, or the target has a custom expander for it. | |
bool | isTruncStoreLegal (EVT ValVT, EVT MemVT) const |
Return true if the specified store with truncation is legal on this target. | |
bool | isTruncStoreLegalOrCustom (EVT ValVT, EVT MemVT) const |
Return true if the specified store with truncation is legal or has a custom lowering on this target. | |
virtual bool | canCombineTruncStore (EVT ValVT, EVT MemVT, bool LegalOnly) const |
LegalizeAction | getIndexedLoadAction (unsigned IdxMode, MVT VT) const |
Return how the indexed load should be treated: either it is legal, needs to be promoted to a larger size, needs to be expanded to some other code sequence, or the target has a custom expander for it. | |
bool | isIndexedLoadLegal (unsigned IdxMode, EVT VT) const |
Return true if the specified indexed load is legal on this target. | |
LegalizeAction | getIndexedStoreAction (unsigned IdxMode, MVT VT) const |
Return how the indexed store should be treated: either it is legal, needs to be promoted to a larger size, needs to be expanded to some other code sequence, or the target has a custom expander for it. | |
bool | isIndexedStoreLegal (unsigned IdxMode, EVT VT) const |
Return true if the specified indexed store is legal on this target. | |
LegalizeAction | getIndexedMaskedLoadAction (unsigned IdxMode, MVT VT) const |
Return how the indexed masked load should be treated: either it is legal, needs to be promoted to a larger size, needs to be expanded to some other code sequence, or the target has a custom expander for it. | |
bool | isIndexedMaskedLoadLegal (unsigned IdxMode, EVT VT) const |
Return true if the specified indexed masked load is legal on this target. | |
LegalizeAction | getIndexedMaskedStoreAction (unsigned IdxMode, MVT VT) const |
Return how the indexed masked store should be treated: either it is legal, needs to be promoted to a larger size, needs to be expanded to some other code sequence, or the target has a custom expander for it. | |
bool | isIndexedMaskedStoreLegal (unsigned IdxMode, EVT VT) const |
Return true if the specified indexed masked store is legal on this target. | |
virtual bool | shouldExtendGSIndex (EVT VT, EVT &EltTy) const |
Returns true if the index type for a masked gather/scatter requires extending. | |
virtual bool | shouldRemoveExtendFromGSIndex (SDValue Extend, EVT DataVT) const |
virtual bool | isLegalScaleForGatherScatter (uint64_t Scale, uint64_t ElemSize) const |
LegalizeAction | getCondCodeAction (ISD::CondCode CC, MVT VT) const |
Return how the condition code should be treated: either it is legal, needs to be expanded to some other code sequence, or the target has a custom expander for it. | |
bool | isCondCodeLegal (ISD::CondCode CC, MVT VT) const |
Return true if the specified condition code is legal on this target. | |
bool | isCondCodeLegalOrCustom (ISD::CondCode CC, MVT VT) const |
Return true if the specified condition code is legal or custom on this target. | |
MVT | getTypeToPromoteTo (unsigned Op, MVT VT) const |
If the action for this operation is to promote, this method returns the ValueType to promote to. | |
virtual EVT | getAsmOperandValueType (const DataLayout &DL, Type *Ty, bool AllowUnknown=false) const |
EVT | getValueType (const DataLayout &DL, Type *Ty, bool AllowUnknown=false) const |
Return the EVT corresponding to this LLVM type. | |
EVT | getMemValueType (const DataLayout &DL, Type *Ty, bool AllowUnknown=false) const |
MVT | getSimpleValueType (const DataLayout &DL, Type *Ty, bool AllowUnknown=false) const |
Return the MVT corresponding to this LLVM type. See getValueType. | |
virtual uint64_t | getByValTypeAlignment (Type *Ty, const DataLayout &DL) const |
Return the desired alignment for ByVal or InAlloca aggregate function arguments in the caller parameter area. | |
MVT | getRegisterType (MVT VT) const |
Return the type of registers that this ValueType will eventually require. | |
MVT | getRegisterType (LLVMContext &Context, EVT VT) const |
Return the type of registers that this ValueType will eventually require. | |
virtual unsigned | getNumRegisters (LLVMContext &Context, EVT VT, std::optional< MVT > RegisterVT=std::nullopt) const |
Return the number of registers that this ValueType will eventually require. | |
virtual MVT | getRegisterTypeForCallingConv (LLVMContext &Context, CallingConv::ID CC, EVT VT) const |
Certain combinations of ABIs, Targets and features require that types are legal for some operations and not for other operations. | |
virtual unsigned | getNumRegistersForCallingConv (LLVMContext &Context, CallingConv::ID CC, EVT VT) const |
Certain targets require unusual breakdowns of certain types. | |
virtual Align | getABIAlignmentForCallingConv (Type *ArgTy, const DataLayout &DL) const |
Certain targets have context sensitive alignment requirements, where one type has the alignment requirement of another type. | |
virtual bool | ShouldShrinkFPConstant (EVT) const |
If true, then instruction selection should seek to shrink the FP constant of the specified type to a smaller type in order to save space and / or reduce runtime. | |
virtual bool | shouldReduceLoadWidth (SDNode *Load, ISD::LoadExtType ExtTy, EVT NewVT) const |
Return true if it is profitable to reduce a load to a smaller type. | |
virtual bool | shouldRemoveRedundantExtend (SDValue Op) const |
Return true (the default) if it is profitable to remove a sext_inreg(x) where the sext is redundant, and use x directly. | |
bool | isPaddedAtMostSignificantBitsWhenStored (EVT VT) const |
Indicates if any padding is guaranteed to go at the most significant bits when storing the type to memory and the type size isn't equal to the store size. | |
bool | hasBigEndianPartOrdering (EVT VT, const DataLayout &DL) const |
When splitting a value of the specified type into parts, does the Lo or Hi part come first? This usually follows the endianness, except for ppcf128, where the Hi part always comes first. | |
bool | hasTargetDAGCombine (ISD::NodeType NT) const |
If true, the target has custom DAG combine transformations that it can perform for the specified node. | |
unsigned | getGatherAllAliasesMaxDepth () const |
virtual unsigned | getVaListSizeInBits (const DataLayout &DL) const |
Returns the size of the platform's va_list object. | |
unsigned | getMaxStoresPerMemset (bool OptSize) const |
Get maximum # of store operations permitted for llvm.memset. | |
unsigned | getMaxStoresPerMemcpy (bool OptSize) const |
Get maximum # of store operations permitted for llvm.memcpy. | |
virtual unsigned | getMaxGluedStoresPerMemcpy () const |
Get maximum # of store operations to be glued together. | |
unsigned | getMaxExpandSizeMemcmp (bool OptSize) const |
Get maximum # of load operations permitted for memcmp. | |
unsigned | getMaxStoresPerMemmove (bool OptSize) const |
Get maximum # of store operations permitted for llvm.memmove. | |
virtual bool | allowsMisalignedMemoryAccesses (EVT, unsigned AddrSpace=0, Align Alignment=Align(1), MachineMemOperand::Flags Flags=MachineMemOperand::MONone, unsigned *=nullptr) const |
Determine if the target supports unaligned memory accesses. | |
virtual bool | allowsMisalignedMemoryAccesses (LLT, unsigned AddrSpace=0, Align Alignment=Align(1), MachineMemOperand::Flags Flags=MachineMemOperand::MONone, unsigned *=nullptr) const |
LLT handling variant. | |
bool | allowsMemoryAccessForAlignment (LLVMContext &Context, const DataLayout &DL, EVT VT, unsigned AddrSpace=0, Align Alignment=Align(1), MachineMemOperand::Flags Flags=MachineMemOperand::MONone, unsigned *Fast=nullptr) const |
This function returns true if the memory access is aligned or if the target allows this specific unaligned memory access. | |
bool | allowsMemoryAccessForAlignment (LLVMContext &Context, const DataLayout &DL, EVT VT, const MachineMemOperand &MMO, unsigned *Fast=nullptr) const |
Return true if the memory access of this type is aligned or if the target allows this specific unaligned access for the given MachineMemOperand. | |
virtual bool | allowsMemoryAccess (LLVMContext &Context, const DataLayout &DL, EVT VT, unsigned AddrSpace=0, Align Alignment=Align(1), MachineMemOperand::Flags Flags=MachineMemOperand::MONone, unsigned *Fast=nullptr) const |
Return true if the target supports a memory access of this type for the given address space and alignment. | |
bool | allowsMemoryAccess (LLVMContext &Context, const DataLayout &DL, EVT VT, const MachineMemOperand &MMO, unsigned *Fast=nullptr) const |
Return true if the target supports a memory access of this type for the given MachineMemOperand. | |
bool | allowsMemoryAccess (LLVMContext &Context, const DataLayout &DL, LLT Ty, const MachineMemOperand &MMO, unsigned *Fast=nullptr) const |
LLT handling variant. | |
virtual EVT | getOptimalMemOpType (const MemOp &Op, const AttributeList &) const |
Returns the target specific optimal type for load and store operations as a result of memset, memcpy, and memmove lowering. | |
virtual LLT | getOptimalMemOpLLT (const MemOp &Op, const AttributeList &) const |
LLT returning variant. | |
virtual bool | isSafeMemOpType (MVT) const |
Returns true if it's safe to use load / store of the specified type to expand memcpy / memset inline. | |
virtual unsigned | getMinimumJumpTableEntries () const |
Return lower limit for number of blocks in a jump table. | |
unsigned | getMinimumJumpTableDensity (bool OptForSize) const |
Return lower limit of the density in a jump table. | |
unsigned | getMaximumJumpTableSize () const |
Return upper limit for number of entries in a jump table. | |
virtual bool | isJumpTableRelative () const |
Register | getStackPointerRegisterToSaveRestore () const |
If a physical register, this specifies the register that llvm.savestack/llvm.restorestack should save and restore. | |
virtual Register | getExceptionPointerRegister (const Constant *PersonalityFn) const |
If a physical register, this returns the register that receives the exception address on entry to an EH pad. | |
virtual Register | getExceptionSelectorRegister (const Constant *PersonalityFn) const |
If a physical register, this returns the register that receives the exception typeid on entry to a landing pad. | |
virtual bool | needsFixedCatchObjects () const |
Align | getMinStackArgumentAlignment () const |
Return the minimum stack alignment of an argument. | |
Align | getMinFunctionAlignment () const |
Return the minimum function alignment. | |
Align | getPrefFunctionAlignment () const |
Return the preferred function alignment. | |
virtual Align | getPrefLoopAlignment (MachineLoop *ML=nullptr) const |
Return the preferred loop alignment. | |
virtual unsigned | getMaxPermittedBytesForAlignment (MachineBasicBlock *MBB) const |
Return the maximum amount of bytes allowed to be emitted when padding for alignment. | |
virtual bool | alignLoopsWithOptSize () const |
Should loops be aligned even when the function is marked OptSize (but not MinSize). | |
virtual Value * | getIRStackGuard (IRBuilderBase &IRB) const |
If the target has a standard location for the stack protector guard, returns the address of that location. | |
virtual void | insertSSPDeclarations (Module &M) const |
Inserts necessary declarations for SSP (stack protection) purpose. | |
virtual Value * | getSDagStackGuard (const Module &M) const |
Return the variable that's previously inserted by insertSSPDeclarations, if any, otherwise return nullptr. | |
virtual bool | useStackGuardXorFP () const |
If this function returns true, stack protection checks should XOR the frame pointer (or whichever pointer is used to address locals) into the stack guard value before checking it. | |
virtual Function * | getSSPStackGuardCheck (const Module &M) const |
If the target has a standard stack protection check function that performs validation and error handling, returns the function. | |
virtual Value * | getSafeStackPointerLocation (IRBuilderBase &IRB) const |
Returns the target-specific address of the unsafe stack pointer. | |
virtual bool | hasStackProbeSymbol (const MachineFunction &MF) const |
Returns true if the target has a symbol used to emit stack probes for the given function. | |
virtual bool | hasInlineStackProbe (const MachineFunction &MF) const |
virtual StringRef | getStackProbeSymbolName (const MachineFunction &MF) const |
virtual bool | isFreeAddrSpaceCast (unsigned SrcAS, unsigned DestAS) const |
Returns true if a cast from SrcAS to DestAS is "cheap", such that e.g. we are happy to sink it into basic blocks. | |
virtual bool | shouldAlignPointerArgs (CallInst *, unsigned &, Align &) const |
Return true if the pointer arguments to CI should be aligned by aligning the object whose address is being passed. | |
virtual void | emitAtomicCmpXchgNoStoreLLBalance (IRBuilderBase &Builder) const |
virtual bool | shouldSignExtendTypeInLibCall (EVT Type, bool IsSigned) const |
Returns true if arguments should be sign-extended in lib calls. | |
virtual bool | shouldExtendTypeInLibCall (EVT Type) const |
Returns true if arguments should be extended in lib calls. | |
virtual AtomicExpansionKind | shouldExpandAtomicLoadInIR (LoadInst *LI) const |
Returns how the given (atomic) load should be expanded by the IR-level AtomicExpand pass. | |
virtual AtomicExpansionKind | shouldCastAtomicLoadInIR (LoadInst *LI) const |
Returns how the given (atomic) load should be cast by the IR-level AtomicExpand pass. | |
virtual AtomicExpansionKind | shouldExpandAtomicStoreInIR (StoreInst *SI) const |
Returns how the given (atomic) store should be expanded by the IR-level AtomicExpand pass. | |
virtual AtomicExpansionKind | shouldCastAtomicStoreInIR (StoreInst *SI) const |
Returns how the given (atomic) store should be cast by the IR-level AtomicExpand pass. | |
virtual AtomicExpansionKind | shouldExpandAtomicCmpXchgInIR (AtomicCmpXchgInst *AI) const |
Returns how the given atomic cmpxchg should be expanded by the IR-level AtomicExpand pass. | |
virtual AtomicExpansionKind | shouldExpandAtomicRMWInIR (AtomicRMWInst *RMW) const |
Returns how the IR-level AtomicExpand pass should expand the given AtomicRMW, if at all. | |
virtual AtomicExpansionKind | shouldCastAtomicRMWIInIR (AtomicRMWInst *RMWI) const |
Returns how the given atomicrmw should be cast by the IR-level AtomicExpand pass. | |
virtual LoadInst * | lowerIdempotentRMWIntoFencedLoad (AtomicRMWInst *RMWI) const |
On some platforms, an AtomicRMW that never actually modifies the value (such as fetch_add of 0) can be turned into a fence followed by an atomic load. | |
virtual ISD::NodeType | getExtendForAtomicOps () const |
Returns how the platform's atomic operations are extended (ZERO_EXTEND, SIGN_EXTEND, or ANY_EXTEND). | |
virtual ISD::NodeType | getExtendForAtomicCmpSwapArg () const |
Returns how the platform's atomic compare and swap expects its comparison value to be extended (ZERO_EXTEND, SIGN_EXTEND, or ANY_EXTEND). | |
virtual bool | shouldNormalizeToSelectSequence (LLVMContext &Context, EVT VT) const |
Returns true if we should normalize select(N0&N1, X, Y) => select(N0, select(N1, X, Y), Y) and select(N0|N1, X, Y) => select(N0, X, select(N1, X, Y)) if it is likely that it saves us from materializing N0 and N1 in an integer register. | |
virtual bool | isProfitableToCombineMinNumMaxNum (EVT VT) const |
virtual bool | convertSelectOfConstantsToMath (EVT VT) const |
Return true if a select of constants (select Cond, C1, C2) should be transformed into simple math ops with the condition value. | |
virtual bool | decomposeMulByConstant (LLVMContext &Context, EVT VT, SDValue C) const |
Return true if it is profitable to transform an integer multiplication-by-constant into simpler operations like shifts and adds. | |
virtual bool | isMulAddWithConstProfitable (SDValue AddNode, SDValue ConstNode) const |
Return true if it may be profitable to transform (mul (add x, c1), c2) -> (add (mul x, c2), c1*c2). | |
virtual bool | shouldUseStrictFP_TO_INT (EVT FpVT, EVT IntVT, bool IsSigned) const |
Return true if it is more correct/profitable to use strict FP_TO_INT conversion operations - canonicalizing the FP source value instead of converting all cases and then selecting based on value. | |
bool | isBeneficialToExpandPowI (int64_t Exponent, bool OptForSize) const |
Return true if it is beneficial to expand an @llvm.powi. | |
virtual bool | getAddrModeArguments (IntrinsicInst *, SmallVectorImpl< Value * > &, Type *&) const |
CodeGenPrepare sinks address calculations into the same BB as Load/Store instructions reading the address. | |
virtual bool | isLegalAddressingMode (const DataLayout &DL, const AddrMode &AM, Type *Ty, unsigned AddrSpace, Instruction *I=nullptr) const |
Return true if the addressing mode represented by AM is legal for this target, for a load/store of the specified type. | |
virtual bool | addressingModeSupportsTLS (const GlobalValue &) const |
Returns true if the targets addressing mode can target thread local storage (TLS). | |
virtual int64_t | getPreferredLargeGEPBaseOffset (int64_t MinOffset, int64_t MaxOffset) const |
Return the preferred common base offset. | |
virtual bool | isLegalICmpImmediate (int64_t) const |
Return true if the specified immediate is legal icmp immediate, that is the target has icmp instructions which can compare a register against the immediate without having to materialize the immediate into a register. | |
virtual bool | isLegalAddImmediate (int64_t) const |
Return true if the specified immediate is legal add immediate, that is the target has add instructions which can add a register with the immediate without having to materialize the immediate into a register. | |
virtual bool | isLegalAddScalableImmediate (int64_t) const |
Return true if adding the specified scalable immediate is legal, that is the target has add instructions which can add a register with the immediate (multiplied by vscale) without having to materialize the immediate into a register. | |
virtual bool | isLegalStoreImmediate (int64_t Value) const |
Return true if the specified immediate is legal for the value input of a store instruction. | |
virtual bool | isVectorShiftByScalarCheap (Type *Ty) const |
Return true if it's significantly cheaper to shift a vector by a uniform scalar than by an amount which will vary across each lane. | |
virtual Type * | shouldConvertSplatType (ShuffleVectorInst *SVI) const |
Given a shuffle vector SVI representing a vector splat, return a new scalar type of size equal to SVI's scalar type if the new type is more profitable. | |
virtual bool | shouldConvertPhiType (Type *From, Type *To) const |
Given a set of interconnected phis of type 'From' that are loaded/stored or bitcast to type 'To', return true if the set should be converted to 'To'. | |
virtual bool | isCommutativeBinOp (unsigned Opcode) const |
Returns true if the opcode is a commutative binary operation. | |
virtual bool | isBinOp (unsigned Opcode) const |
Return true if the node is a math/logic binary operator. | |
virtual bool | isTruncateFree (Type *FromTy, Type *ToTy) const |
Return true if it's free to truncate a value of type FromTy to type ToTy. | |
virtual bool | allowTruncateForTailCall (Type *FromTy, Type *ToTy) const |
Return true if a truncation from FromTy to ToTy is permitted when deciding whether a call is in tail position. | |
virtual bool | isTruncateFree (EVT FromVT, EVT ToVT) const |
virtual bool | isTruncateFree (LLT FromTy, LLT ToTy, const DataLayout &DL, LLVMContext &Ctx) const |
virtual bool | isTruncateFree (SDValue Val, EVT VT2) const |
Return true if truncating the specific node Val to type VT2 is free. | |
virtual bool | isProfitableToHoist (Instruction *I) const |
bool | isExtFree (const Instruction *I) const |
Return true if the extension represented by I is free. | |
bool | isExtLoad (const LoadInst *Load, const Instruction *Ext, const DataLayout &DL) const |
Return true if Load and Ext can form an ExtLoad. | |
virtual bool | isZExtFree (Type *FromTy, Type *ToTy) const |
Return true if any actual instruction that defines a value of type FromTy implicitly zero-extends the value to ToTy in the result register. | |
virtual bool | isZExtFree (EVT FromTy, EVT ToTy) const |
virtual bool | isZExtFree (LLT FromTy, LLT ToTy, const DataLayout &DL, LLVMContext &Ctx) const |
virtual bool | isZExtFree (SDValue Val, EVT VT2) const |
Return true if zero-extending the specific node Val to type VT2 is free (either because it's implicitly zero-extended such as ARM ldrb / ldrh or because it's folded such as X86 zero-extending loads). | |
virtual bool | isSExtCheaperThanZExt (EVT FromTy, EVT ToTy) const |
Return true if sign-extension from FromTy to ToTy is cheaper than zero-extension. | |
virtual bool | signExtendConstant (const ConstantInt *C) const |
Return true if this constant should be sign extended when promoting to a larger type. | |
virtual bool | shouldSinkOperands (Instruction *I, SmallVectorImpl< Use * > &Ops) const |
Return true if sinking I's operands to the same basic block as I is profitable, e.g. because the operands can be folded into a target instruction during instruction selection. | |
virtual bool | optimizeExtendOrTruncateConversion (Instruction *I, Loop *L, const TargetTransformInfo &TTI) const |
Try to optimize extending or truncating conversion instructions (like zext, trunc, fptoui, uitofp) for the target. | |
virtual bool | hasPairedLoad (EVT, Align &) const |
Return true if the target supplies and combines to a paired load two loaded values of type LoadedType next to each other in memory. | |
virtual bool | hasVectorBlend () const |
Return true if the target has a vector blend instruction. | |
virtual unsigned | getMaxSupportedInterleaveFactor () const |
Get the maximum supported factor for interleaved memory accesses. | |
virtual bool | lowerInterleavedLoad (LoadInst *LI, ArrayRef< ShuffleVectorInst * > Shuffles, ArrayRef< unsigned > Indices, unsigned Factor) const |
Lower an interleaved load to target specific intrinsics. | |
virtual bool | lowerInterleavedStore (StoreInst *SI, ShuffleVectorInst *SVI, unsigned Factor) const |
Lower an interleaved store to target specific intrinsics. | |
virtual bool | lowerDeinterleaveIntrinsicToLoad (IntrinsicInst *DI, LoadInst *LI, SmallVectorImpl< Instruction * > &DeadInsts) const |
Lower a deinterleave intrinsic to a target specific load intrinsic. | |
virtual bool | lowerInterleaveIntrinsicToStore (IntrinsicInst *II, StoreInst *SI, SmallVectorImpl< Instruction * > &DeadInsts) const |
Lower an interleave intrinsic to a target specific store intrinsic. | |
virtual bool | isFPExtFree (EVT DestVT, EVT SrcVT) const |
Return true if an fpext operation is free (for instance, because single-precision floating-point numbers are implicitly extended to double-precision). | |
virtual bool | isFPExtFoldable (const MachineInstr &MI, unsigned Opcode, LLT DestTy, LLT SrcTy) const |
Return true if an fpext operation input to an Opcode operation is free (for instance, because half-precision floating-point numbers are implicitly extended to float-precision) for an FMA instruction. | |
virtual bool | isFPExtFoldable (const SelectionDAG &DAG, unsigned Opcode, EVT DestVT, EVT SrcVT) const |
Return true if an fpext operation input to an Opcode operation is free (for instance, because half-precision floating-point numbers are implicitly extended to float-precision) for an FMA instruction. | |
virtual bool | isVectorLoadExtDesirable (SDValue ExtVal) const |
Return true if folding a vector load into ExtVal (a sign, zero, or any extend node) is profitable. | |
virtual bool | isFNegFree (EVT VT) const |
Return true if an fneg operation is free to the point where it is never worthwhile to replace it with a bitwise operation. | |
virtual bool | isFAbsFree (EVT VT) const |
Return true if an fabs operation is free to the point where it is never worthwhile to replace it with a bitwise operation. | |
virtual bool | isFMAFasterThanFMulAndFAdd (const MachineFunction &MF, EVT) const |
Return true if an FMA operation is faster than a pair of fmul and fadd instructions. | |
virtual bool | isFMAFasterThanFMulAndFAdd (const MachineFunction &MF, LLT) const |
Return true if an FMA operation is faster than a pair of fmul and fadd instructions. | |
virtual bool | isFMAFasterThanFMulAndFAdd (const Function &F, Type *) const |
IR version. | |
virtual bool | isFMADLegal (const MachineInstr &MI, LLT Ty) const |
Returns true if MI can be combined with another instruction to form TargetOpcode::G_FMAD. | |
virtual bool | isFMADLegal (const SelectionDAG &DAG, const SDNode *N) const |
Returns true if N can be combined with another node to form an ISD::FMAD. | |
virtual bool | generateFMAsInMachineCombiner (EVT VT, CodeGenOptLevel OptLevel) const |
virtual bool | isNarrowingProfitable (EVT SrcVT, EVT DestVT) const |
Return true if it's profitable to narrow operations of type SrcVT to DestVT. | |
virtual bool | shouldFoldSelectWithIdentityConstant (unsigned BinOpcode, EVT VT) const |
Return true if pulling a binary operation into a select with an identity constant is profitable. | |
virtual bool | shouldConvertConstantLoadToIntImm (const APInt &Imm, Type *Ty) const |
Return true if it is beneficial to convert a load of a constant to just the constant itself. | |
virtual bool | isExtractSubvectorCheap (EVT ResVT, EVT SrcVT, unsigned Index) const |
Return true if EXTRACT_SUBVECTOR is cheap for extracting this result type from this source type with this index. | |
virtual bool | shouldScalarizeBinop (SDValue VecOp) const |
Try to convert an extract element of a vector binary operation into an extract element followed by a scalar operation. | |
virtual bool | isExtractVecEltCheap (EVT VT, unsigned Index) const |
Return true if extraction of a scalar element from the given vector type at the given index is cheap. | |
virtual bool | shouldFormOverflowOp (unsigned Opcode, EVT VT, bool MathUsed) const |
Try to convert math with an overflow comparison into the corresponding DAG node operation. | |
virtual bool | aggressivelyPreferBuildVectorSources (EVT VecVT) const |
virtual bool | shouldConsiderGEPOffsetSplit () const |
virtual bool | shouldAvoidTransformToShift (EVT VT, unsigned Amount) const |
Return true if creating a shift of the type by the given amount is not profitable. | |
virtual bool | shouldFoldSelectWithSingleBitTest (EVT VT, const APInt &AndMask) const |
virtual bool | shouldKeepZExtForFP16Conv () const |
Does this target require the clearing of high-order bits in a register passed to the fp16 to fp conversion library function. | |
virtual bool | shouldConvertFpToSat (unsigned Op, EVT FPVT, EVT VT) const |
Should we generate fp_to_si_sat and fp_to_ui_sat from type FPVT to type VT from min(max(fptoi)) saturation patterns. | |
virtual bool | shouldExpandCmpUsingSelects () const |
Should we expand [US]CMP nodes using two selects and two compares, or by doing arithmetic on boolean types. | |
virtual bool | isComplexDeinterleavingSupported () const |
Does this target support complex deinterleaving. | |
virtual bool | isComplexDeinterleavingOperationSupported (ComplexDeinterleavingOperation Operation, Type *Ty) const |
Does this target support complex deinterleaving with the given operation and type. | |
virtual Value * | createComplexDeinterleavingIR (IRBuilderBase &B, ComplexDeinterleavingOperation OperationType, ComplexDeinterleavingRotation Rotation, Value *InputA, Value *InputB, Value *Accumulator=nullptr) const |
Create the IR node for the given complex deinterleaving operation. | |
void | setLibcallName (RTLIB::Libcall Call, const char *Name) |
Rename the default libcall routine name for the specified libcall. | |
void | setLibcallName (ArrayRef< RTLIB::Libcall > Calls, const char *Name) |
const char * | getLibcallName (RTLIB::Libcall Call) const |
Get the libcall routine name for the specified libcall. | |
void | setCmpLibcallCC (RTLIB::Libcall Call, ISD::CondCode CC) |
Override the default CondCode to be used to test the result of the comparison libcall against zero. | |
ISD::CondCode | getCmpLibcallCC (RTLIB::Libcall Call) const |
Get the CondCode that's to be used to test the result of the comparison libcall against zero. | |
void | setLibcallCallingConv (RTLIB::Libcall Call, CallingConv::ID CC) |
Set the CallingConv that should be used for the specified libcall. | |
CallingConv::ID | getLibcallCallingConv (RTLIB::Libcall Call) const |
Get the CallingConv that should be used for the specified libcall. | |
virtual void | finalizeLowering (MachineFunction &MF) const |
Execute target specific actions to finalize target lowering. | |
virtual bool | shouldLocalize (const MachineInstr &MI, const TargetTransformInfo *TTI) const |
Check whether or not MI needs to be moved close to its uses. | |
int | InstructionOpcodeToISD (unsigned Opcode) const |
Get the ISD node that corresponds to the Instruction class opcode. | |
unsigned | getMaxAtomicSizeInBitsSupported () const |
Returns the maximum atomic operation size (in bits) supported by the backend. | |
unsigned | getMaxDivRemBitWidthSupported () const |
Returns the size in bits of the maximum div/rem the backend supports. | |
unsigned | getMaxLargeFPConvertBitWidthSupported () const |
Returns the size in bits of the maximum large fp convert the backend supports. | |
unsigned | getMinCmpXchgSizeInBits () const |
Returns the size of the smallest cmpxchg or ll/sc instruction the backend supports. | |
bool | supportsUnalignedAtomics () const |
Whether the target supports unaligned atomic operations. | |
virtual bool | shouldInsertFencesForAtomic (const Instruction *I) const |
Whether AtomicExpandPass should automatically insert fences and reduce ordering for this atomic. | |
virtual bool | shouldInsertTrailingFenceForAtomicStore (const Instruction *I) const |
Whether AtomicExpandPass should automatically insert a trailing fence without reducing the ordering for this atomic. | |
virtual Value * | emitLoadLinked (IRBuilderBase &Builder, Type *ValueTy, Value *Addr, AtomicOrdering Ord) const |
Perform a load-linked operation on Addr, returning a "Value *" with the corresponding pointee type. | |
virtual Value * | emitStoreConditional (IRBuilderBase &Builder, Value *Val, Value *Addr, AtomicOrdering Ord) const |
Perform a store-conditional operation to Addr. | |
virtual Value * | emitMaskedAtomicRMWIntrinsic (IRBuilderBase &Builder, AtomicRMWInst *AI, Value *AlignedAddr, Value *Incr, Value *Mask, Value *ShiftAmt, AtomicOrdering Ord) const |
Perform a masked atomicrmw using a target-specific intrinsic. | |
virtual void | emitExpandAtomicRMW (AtomicRMWInst *AI) const |
Perform an atomicrmw expansion in a target-specific way. | |
virtual void | emitBitTestAtomicRMWIntrinsic (AtomicRMWInst *AI) const |
Perform a bit test atomicrmw using a target-specific intrinsic. | |
virtual void | emitCmpArithAtomicRMWIntrinsic (AtomicRMWInst *AI) const |
Perform an atomicrmw whose result is only used by comparison, using a target-specific intrinsic. | |
virtual Value * | emitMaskedAtomicCmpXchgIntrinsic (IRBuilderBase &Builder, AtomicCmpXchgInst *CI, Value *AlignedAddr, Value *CmpVal, Value *NewVal, Value *Mask, AtomicOrdering Ord) const |
Perform a masked cmpxchg using a target-specific intrinsic. | |
virtual MachineInstr * | EmitKCFICheck (MachineBasicBlock &MBB, MachineBasicBlock::instr_iterator &MBBI, const TargetInstrInfo *TII) const |
virtual Instruction * | emitLeadingFence (IRBuilderBase &Builder, Instruction *Inst, AtomicOrdering Ord) const |
Inserts in the IR a target-specific intrinsic specifying a fence. | |
virtual Instruction * | emitTrailingFence (IRBuilderBase &Builder, Instruction *Inst, AtomicOrdering Ord) const |
Static Public Member Functions | |
static unsigned | numBitsUnsigned (SDValue Op, SelectionDAG &DAG) |
static unsigned | numBitsSigned (SDValue Op, SelectionDAG &DAG) |
static SDValue | stripBitcast (SDValue Val) |
static bool | shouldFoldFNegIntoSrc (SDNode *FNeg, SDValue FNegSrc) |
static bool | allUsesHaveSourceMods (const SDNode *N, unsigned CostThreshold=4) |
static CCAssignFn * | CCAssignFnForCall (CallingConv::ID CC, bool IsVarArg) |
Selects the correct CCAssignFn for a given CallingConvention value. | |
static CCAssignFn * | CCAssignFnForReturn (CallingConv::ID CC, bool IsVarArg) |
Static Public Member Functions inherited from llvm::TargetLoweringBase | |
static ISD::NodeType | getExtendForContent (BooleanContent Content) |
Protected Member Functions | |
SDValue | LowerEXTRACT_SUBVECTOR (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerCONCAT_VECTORS (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFREM (SDValue Op, SelectionDAG &DAG) const |
Split a vector store into multiple scalar stores. | |
SDValue | LowerFCEIL (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFTRUNC (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFRINT (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFNEARBYINT (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFROUNDEVEN (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFROUND (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFFLOOR (SDValue Op, SelectionDAG &DAG) const |
SDValue | getIsLtSmallestNormal (SelectionDAG &DAG, SDValue Op, SDNodeFlags Flags) const |
SDValue | getIsFinite (SelectionDAG &DAG, SDValue Op, SDNodeFlags Flags) const |
std::pair< SDValue, SDValue > | getScaledLogInput (SelectionDAG &DAG, const SDLoc SL, SDValue Op, SDNodeFlags Flags) const |
If denormal handling is required return the scaled input to FLOG2, and the check for denormal range. | |
SDValue | LowerFLOG2 (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFLOGCommon (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFLOG10 (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFLOGUnsafe (SDValue Op, const SDLoc &SL, SelectionDAG &DAG, bool IsLog10, SDNodeFlags Flags) const |
SDValue | lowerFEXP2 (SDValue Op, SelectionDAG &DAG) const |
SDValue | lowerFEXPUnsafe (SDValue Op, const SDLoc &SL, SelectionDAG &DAG, SDNodeFlags Flags) const |
SDValue | lowerFEXP10Unsafe (SDValue Op, const SDLoc &SL, SelectionDAG &DAG, SDNodeFlags Flags) const |
Emit approx-funcs appropriate lowering for exp10. | |
SDValue | lowerFEXP (SDValue Op, SelectionDAG &DAG) const |
SDValue | lowerCTLZResults (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerCTLZ_CTTZ (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerINT_TO_FP32 (SDValue Op, SelectionDAG &DAG, bool Signed) const |
SDValue | LowerINT_TO_FP64 (SDValue Op, SelectionDAG &DAG, bool Signed) const |
SDValue | LowerUINT_TO_FP (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerSINT_TO_FP (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFP_TO_INT64 (SDValue Op, SelectionDAG &DAG, bool Signed) const |
SDValue | LowerFP_TO_FP16 (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerFP_TO_INT (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerSIGN_EXTEND_INREG (SDValue Op, SelectionDAG &DAG) const |
bool | shouldCombineMemoryType (EVT VT) const |
SDValue | performLoadCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performStoreCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performAssertSZExtCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performIntrinsicWOChainCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | splitBinaryBitConstantOpImpl (DAGCombinerInfo &DCI, const SDLoc &SL, unsigned Opc, SDValue LHS, uint32_t ValLo, uint32_t ValHi) const |
Split the 64-bit value LHS into two 32-bit components, and perform the binary operation Opc to it with the corresponding constant operands. | |
SDValue | performShlCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performSraCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performSrlCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performTruncateCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performMulCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performMulLoHiCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performMulhsCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performMulhuCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performCtlz_CttzCombine (const SDLoc &SL, SDValue Cond, SDValue LHS, SDValue RHS, DAGCombinerInfo &DCI) const |
SDValue | foldFreeOpFromSelect (TargetLowering::DAGCombinerInfo &DCI, SDValue N) const |
SDValue | performSelectCombine (SDNode *N, DAGCombinerInfo &DCI) const |
TargetLowering::NegatibleCost | getConstantNegateCost (const ConstantFPSDNode *C) const |
bool | isConstantCostlierToNegate (SDValue N) const |
bool | isConstantCheaperToNegate (SDValue N) const |
SDValue | performFNegCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performFAbsCombine (SDNode *N, DAGCombinerInfo &DCI) const |
SDValue | performRcpCombine (SDNode *N, DAGCombinerInfo &DCI) const |
virtual SDValue | LowerGlobalAddress (AMDGPUMachineFunction *MFI, SDValue Op, SelectionDAG &DAG) const |
std::pair< SDValue, SDValue > | split64BitValue (SDValue Op, SelectionDAG &DAG) const |
Return 64-bit value Op as two 32-bit integers. | |
SDValue | getLoHalf64 (SDValue Op, SelectionDAG &DAG) const |
SDValue | getHiHalf64 (SDValue Op, SelectionDAG &DAG) const |
std::pair< EVT, EVT > | getSplitDestVTs (const EVT &VT, SelectionDAG &DAG) const |
Split a vector type into two parts. | |
std::pair< SDValue, SDValue > | splitVector (const SDValue &N, const SDLoc &DL, const EVT &LoVT, const EVT &HighVT, SelectionDAG &DAG) const |
Split a vector value into two parts of types LoVT and HiVT. | |
SDValue | SplitVectorLoad (SDValue Op, SelectionDAG &DAG) const |
Split a vector load into 2 loads of half the vector. | |
SDValue | WidenOrSplitVectorLoad (SDValue Op, SelectionDAG &DAG) const |
Widen a suitably aligned v3 load. | |
SDValue | SplitVectorStore (SDValue Op, SelectionDAG &DAG) const |
Split a vector store into 2 stores of half the vector. | |
SDValue | LowerSTORE (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerSDIVREM (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerUDIVREM (SDValue Op, SelectionDAG &DAG) const |
SDValue | LowerDIVREM24 (SDValue Op, SelectionDAG &DAG, bool sign) const |
void | LowerUDIVREM64 (SDValue Op, SelectionDAG &DAG, SmallVectorImpl< SDValue > &Results) const |
void | analyzeFormalArgumentsCompute (CCState &State, const SmallVectorImpl< ISD::InputArg > &Ins) const |
The SelectionDAGBuilder will automatically promote function arguments with illegal types. | |
Protected Member Functions inherited from llvm::TargetLoweringBase | |
void | initActions () |
Initialize all of the actions to default values. | |
Value * | getDefaultSafeStackPointerLocation (IRBuilderBase &IRB, bool UseTLS) const |
void | setBooleanContents (BooleanContent Ty) |
Specify how the target extends the result of integer and floating point boolean values from i1 to a wider type. | |
void | setBooleanContents (BooleanContent IntTy, BooleanContent FloatTy) |
Specify how the target extends the result of integer and floating point boolean values from i1 to a wider type. | |
void | setBooleanVectorContents (BooleanContent Ty) |
Specify how the target extends the result of a vector boolean value from a vector of i1 to a wider type. | |
void | setSchedulingPreference (Sched::Preference Pref) |
Specify the target scheduling preference. | |
void | setMinimumJumpTableEntries (unsigned Val) |
Indicate the minimum number of blocks to generate jump tables. | |
void | setMaximumJumpTableSize (unsigned) |
Indicate the maximum number of entries in jump tables. | |
void | setStackPointerRegisterToSaveRestore (Register R) |
If set to a physical register, this specifies the register that llvm.savestack/llvm.restorestack should save and restore. | |
void | setHasMultipleConditionRegisters (bool hasManyRegs=true) |
Tells the code generator that the target has multiple (allocatable) condition registers that can be used to store the results of comparisons for use by selects and conditional branches. | |
void | setHasExtractBitsInsn (bool hasExtractInsn=true) |
Tells the code generator that the target has BitExtract instructions. | |
void | setJumpIsExpensive (bool isExpensive=true) |
Tells the code generator not to expand logic operations on comparison predicates into separate sequences that increase the amount of flow control. | |
void | addBypassSlowDiv (unsigned int SlowBitWidth, unsigned int FastBitWidth) |
Tells the code generator which bitwidths to bypass. | |
void | addRegisterClass (MVT VT, const TargetRegisterClass *RC) |
Add the specified register class as an available regclass for the specified value type. | |
virtual std::pair< const TargetRegisterClass *, uint8_t > | findRepresentativeClass (const TargetRegisterInfo *TRI, MVT VT) const |
Return the largest legal super-reg register class of the register class for the specified type and its associated "cost". | |
void | computeRegisterProperties (const TargetRegisterInfo *TRI) |
Once all of the register classes are added, this allows us to compute derived properties we expose. | |
void | setOperationAction (unsigned Op, MVT VT, LegalizeAction Action) |
Indicate that the specified operation does not work with the specified type and indicate what to do about it. | |
void | setOperationAction (ArrayRef< unsigned > Ops, MVT VT, LegalizeAction Action) |
void | setOperationAction (ArrayRef< unsigned > Ops, ArrayRef< MVT > VTs, LegalizeAction Action) |
void | setLoadExtAction (unsigned ExtType, MVT ValVT, MVT MemVT, LegalizeAction Action) |
Indicate that the specified load with extension does not work with the specified type and indicate what to do about it. | |
void | setLoadExtAction (ArrayRef< unsigned > ExtTypes, MVT ValVT, MVT MemVT, LegalizeAction Action) |
void | setLoadExtAction (ArrayRef< unsigned > ExtTypes, MVT ValVT, ArrayRef< MVT > MemVTs, LegalizeAction Action) |
void | setAtomicLoadExtAction (unsigned ExtType, MVT ValVT, MVT MemVT, LegalizeAction Action) |
Let target indicate that an extending atomic load of the specified type is legal. | |
void | setAtomicLoadExtAction (ArrayRef< unsigned > ExtTypes, MVT ValVT, MVT MemVT, LegalizeAction Action) |
void | setAtomicLoadExtAction (ArrayRef< unsigned > ExtTypes, MVT ValVT, ArrayRef< MVT > MemVTs, LegalizeAction Action) |
void | setTruncStoreAction (MVT ValVT, MVT MemVT, LegalizeAction Action) |
Indicate that the specified truncating store does not work with the specified type and indicate what to do about it. | |
void | setIndexedLoadAction (ArrayRef< unsigned > IdxModes, MVT VT, LegalizeAction Action) |
Indicate that the specified indexed load does or does not work with the specified type and indicate what to do about it. | |
void | setIndexedLoadAction (ArrayRef< unsigned > IdxModes, ArrayRef< MVT > VTs, LegalizeAction Action) |
void | setIndexedStoreAction (ArrayRef< unsigned > IdxModes, MVT VT, LegalizeAction Action) |
Indicate that the specified indexed store does or does not work with the specified type and indicate what to do about it. | |
void | setIndexedStoreAction (ArrayRef< unsigned > IdxModes, ArrayRef< MVT > VTs, LegalizeAction Action) |
void | setIndexedMaskedLoadAction (unsigned IdxMode, MVT VT, LegalizeAction Action) |
Indicate that the specified indexed masked load does or does not work with the specified type and indicate what to do about it. | |
void | setIndexedMaskedStoreAction (unsigned IdxMode, MVT VT, LegalizeAction Action) |
Indicate that the specified indexed masked store does or does not work with the specified type and indicate what to do about it. | |
void | setCondCodeAction (ArrayRef< ISD::CondCode > CCs, MVT VT, LegalizeAction Action) |
Indicate that the specified condition code is or isn't supported on the target and indicate what to do about it. | |
void | setCondCodeAction (ArrayRef< ISD::CondCode > CCs, ArrayRef< MVT > VTs, LegalizeAction Action) |
void | AddPromotedToType (unsigned Opc, MVT OrigVT, MVT DestVT) |
If Opc/OrigVT is specified as being promoted, the promotion code defaults to trying a larger integer/fp until it can find one that works. | |
void | setOperationPromotedToType (unsigned Opc, MVT OrigVT, MVT DestVT) |
Convenience method to set an operation to Promote and specify the type in a single call. | |
void | setOperationPromotedToType (ArrayRef< unsigned > Ops, MVT OrigVT, MVT DestVT) |
void | setTargetDAGCombine (ArrayRef< ISD::NodeType > NTs) |
Targets should invoke this method for each target independent node that they want to provide a custom DAG combiner for by implementing the PerformDAGCombine virtual method. | |
void | setMinFunctionAlignment (Align Alignment) |
Set the target's minimum function alignment. | |
void | setPrefFunctionAlignment (Align Alignment) |
Set the target's preferred function alignment. | |
void | setPrefLoopAlignment (Align Alignment) |
Set the target's preferred loop alignment. | |
void | setMaxBytesForAlignment (unsigned MaxBytes) |
void | setMinStackArgumentAlignment (Align Alignment) |
Set the minimum stack alignment of an argument. | |
void | setMaxAtomicSizeInBitsSupported (unsigned SizeInBits) |
Set the maximum atomic operation size supported by the backend. | |
void | setMaxDivRemBitWidthSupported (unsigned SizeInBits) |
Set the size in bits of the maximum div/rem the backend supports. | |
void | setMaxLargeFPConvertBitWidthSupported (unsigned SizeInBits) |
Set the size in bits of the maximum fp convert the backend supports. | |
void | setMinCmpXchgSizeInBits (unsigned SizeInBits) |
Sets the minimum cmpxchg or ll/sc size supported by the backend. | |
void | setSupportsUnalignedAtomics (bool UnalignedSupported) |
Sets whether unaligned atomic operations are supported. | |
virtual bool | isExtFreeImpl (const Instruction *I) const |
Return true if the extension represented by I is free. | |
bool | isLegalRC (const TargetRegisterInfo &TRI, const TargetRegisterClass &RC) const |
Return true if the value types that can be represented by the specified register class are all legal. | |
MachineBasicBlock * | emitPatchPoint (MachineInstr &MI, MachineBasicBlock *MBB) const |
Replace/modify any TargetFrameIndex operands with a target-dependent sequence of memory operands that is recognized by PrologEpilogInserter. | |
Static Protected Member Functions | |
static bool | allowApproxFunc (const SelectionDAG &DAG, SDNodeFlags Flags) |
static bool | needsDenormHandlingF32 (const SelectionDAG &DAG, SDValue Src, SDNodeFlags Flags) |
static EVT | getEquivalentMemType (LLVMContext &Context, EVT VT) |
Additional Inherited Members | |
Protected Attributes inherited from llvm::TargetLoweringBase | |
unsigned | GatherAllAliasesMaxDepth |
Depth that GatherAllAliases should continue looking for chain dependencies when trying to find a more preferable chain. | |
unsigned | MaxStoresPerMemset |
Specify maximum number of store instructions per memset call. | |
unsigned | MaxStoresPerMemsetOptSize |
Likewise for functions with the OptSize attribute. | |
unsigned | MaxStoresPerMemcpy |
Specify maximum number of store instructions per memcpy call. | |
unsigned | MaxStoresPerMemcpyOptSize |
Likewise for functions with the OptSize attribute. | |
unsigned | MaxGluedStoresPerMemcpy = 0 |
Specify max number of store instructions to glue in inlined memcpy. | |
unsigned | MaxLoadsPerMemcmp |
Specify maximum number of load instructions per memcmp call. | |
unsigned | MaxLoadsPerMemcmpOptSize |
Likewise for functions with the OptSize attribute. | |
unsigned | MaxStoresPerMemmove |
Specify maximum number of store instructions per memmove call. | |
unsigned | MaxStoresPerMemmoveOptSize |
Likewise for functions with the OptSize attribute. | |
bool | PredictableSelectIsExpensive |
Tells the code generator that select is more expensive than a branch if the branch is usually predicted right. | |
bool | EnableExtLdPromotion |
bool | IsStrictFPEnabled |
Definition at line 27 of file AMDGPUISelLowering.h.
Enumerator | |
---|---|
FIRST_IMPLICIT | |
PRIVATE_BASE | |
SHARED_BASE | |
QUEUE_PTR |
Definition at line 373 of file AMDGPUISelLowering.h.
AMDGPUTargetLowering::AMDGPUTargetLowering | ( | const TargetMachine & | TM, |
const AMDGPUSubtarget & | STI | ||
) |
Definition at line 61 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ADD, llvm::TargetLoweringBase::addBypassSlowDiv(), llvm::ISD::ADDC, llvm::ISD::ADDE, llvm::TargetLoweringBase::AddPromotedToType(), AMDGPUBypassSlowDiv, llvm::ISD::AND, llvm::ISD::AssertSext, llvm::ISD::AssertZext, llvm::ISD::ATOMIC_LOAD, llvm::ISD::ATOMIC_STORE, llvm::ISD::BITCAST, llvm::ISD::BR_JT, llvm::ISD::BRIND, llvm::ISD::BSWAP, llvm::ISD::CONCAT_VECTORS, llvm::ISD::Constant, llvm::ISD::ConstantFP, llvm::ISD::CTLZ, llvm::ISD::CTLZ_ZERO_UNDEF, llvm::ISD::CTPOP, llvm::ISD::CTTZ, llvm::ISD::CTTZ_ZERO_UNDEF, llvm::TargetLoweringBase::Custom, llvm::ISD::DYNAMIC_STACKALLOC, llvm::TargetLoweringBase::Expand, llvm::ISD::EXTLOAD, llvm::ISD::EXTRACT_SUBVECTOR, llvm::ISD::FABS, llvm::ISD::FADD, llvm::ISD::FCANONICALIZE, llvm::ISD::FCEIL, llvm::ISD::FCOPYSIGN, llvm::ISD::FCOS, llvm::ISD::FDIV, llvm::ISD::FEXP, llvm::ISD::FEXP10, llvm::ISD::FEXP2, llvm::ISD::FFLOOR, llvm::ISD::FLOG, llvm::ISD::FLOG10, llvm::ISD::FLOG2, llvm::ISD::FMA, llvm::ISD::FMAXNUM, llvm::ISD::FMINNUM, llvm::ISD::FMUL, llvm::ISD::FNEARBYINT, llvm::ISD::FNEG, llvm::ISD::FP16_TO_FP, llvm::ISD::FP_TO_FP16, llvm::ISD::FP_TO_SINT, llvm::ISD::FP_TO_UINT, llvm::ISD::FPOW, llvm::ISD::FREM, llvm::ISD::FRINT, llvm::ISD::FROUND, llvm::ISD::FROUNDEVEN, llvm::ISD::FSHR, llvm::ISD::FSIN, llvm::ISD::FSQRT, llvm::ISD::FSUB, llvm::ISD::FTRUNC, llvm::TargetLoweringBase::GatherAllAliasesMaxDepth, llvm::AMDGPUSubtarget::has16BitInsts(), llvm::MVT::integer_fixedlen_vector_valuetypes(), llvm::MVT::integer_valuetypes(), llvm::ISD::INTRINSIC_WO_CHAIN, llvm::ISD::IS_FPCLASS, llvm::IRSimilarity::Legal, llvm::ISD::LLRINT, llvm::ISD::LLROUND, llvm::ISD::LOAD, llvm::ISD::LRINT, llvm::ISD::LROUND, llvm::TargetLoweringBase::MaxGluedStoresPerMemcpy, llvm::TargetLoweringBase::MaxStoresPerMemcpy, llvm::TargetLoweringBase::MaxStoresPerMemcpyOptSize, llvm::TargetLoweringBase::MaxStoresPerMemmove, llvm::TargetLoweringBase::MaxStoresPerMemmoveOptSize, llvm::TargetLoweringBase::MaxStoresPerMemset, 
llvm::TargetLoweringBase::MaxStoresPerMemsetOptSize, llvm::ISD::MUL, llvm::ISD::MULHS, llvm::ISD::MULHU, llvm::ISD::OR, llvm::TargetLoweringBase::PredictableSelectIsExpensive, llvm::TargetLoweringBase::Promote, llvm::Sched::RegPressure, llvm::ISD::ROTL, llvm::ISD::ROTR, llvm::ISD::SDIV, llvm::ISD::SDIVREM, llvm::ISD::SELECT, llvm::ISD::SELECT_CC, llvm::ISD::SETCC, llvm::TargetLoweringBase::setHasMultipleConditionRegisters(), llvm::TargetLoweringBase::setJumpIsExpensive(), llvm::TargetLoweringBase::setLoadExtAction(), llvm::TargetLoweringBase::setMaxAtomicSizeInBitsSupported(), llvm::TargetLoweringBase::setMaxDivRemBitWidthSupported(), llvm::TargetLoweringBase::setMaxLargeFPConvertBitWidthSupported(), llvm::TargetLoweringBase::setMinCmpXchgSizeInBits(), llvm::TargetLoweringBase::setOperationAction(), llvm::TargetLoweringBase::setSchedulingPreference(), llvm::TargetLoweringBase::setSupportsUnalignedAtomics(), llvm::TargetLoweringBase::setTargetDAGCombine(), llvm::TargetLoweringBase::setTruncStoreAction(), llvm::ISD::SEXTLOAD, llvm::ISD::SHL, llvm::ISD::SINT_TO_FP, llvm::ISD::SMAX, llvm::ISD::SMIN, llvm::ISD::SMUL_LOHI, llvm::ISD::SRA, llvm::ISD::SREM, llvm::ISD::SRL, llvm::ISD::STORE, llvm::ISD::SUB, llvm::ISD::SUBC, llvm::ISD::SUBE, llvm::ISD::TRUNCATE, llvm::ISD::UDIV, llvm::ISD::UDIVREM, llvm::ISD::UINT_TO_FP, llvm::ISD::UMAX, llvm::ISD::UMIN, llvm::ISD::UMUL_LOHI, llvm::ISD::UREM, llvm::ISD::VECTOR_SHUFFLE, llvm::ISD::VSELECT, llvm::ISD::XOR, and llvm::ISD::ZEXTLOAD.
SDValue AMDGPUTargetLowering::addTokenForArgument | ( | SDValue | Chain, |
SelectionDAG & | DAG, | ||
MachineFrameInfo & | MFI, | ||
int | ClobberedFI | ||
) | const |
Definition at line 1288 of file AMDGPUISelLowering.cpp.
References llvm::SelectionDAG::getEntryNode(), llvm::SDValue::getNode(), llvm::SelectionDAG::getNode(), llvm::MachineFrameInfo::getObjectOffset(), llvm::MachineFrameInfo::getObjectSize(), llvm::SmallVectorTemplateBase< T, bool >::push_back(), llvm::ISD::TokenFactor, and llvm::SDNode::uses().
Referenced by llvm::SITargetLowering::LowerCall().
Reimplemented from llvm::TargetLoweringBase.
Definition at line 965 of file AMDGPUISelLowering.cpp.
|
staticprotected |
Definition at line 2571 of file AMDGPUISelLowering.cpp.
References llvm::SelectionDAG::getTarget(), llvm::TargetMachine::Options, and Options.
Referenced by lowerFEXP().
|
static |
Definition at line 757 of file AMDGPUISelLowering.cpp.
References assert(), CostThreshold, hasSourceMods(), N, and opMustUseVOP3Encoding().
Referenced by foldFreeOpFromSelect(), getNegatedExpression(), and shouldFoldFNegIntoSrc().
|
protected |
The SelectionDAGBuilder will automatically promote function arguments with illegal types.
However, this does not work for the AMDGPU targets since the function arguments are stored in memory as these illegal types. In order to handle this properly we need to get the original type sizes from the LLVM IR Function and fix up the ISD::InputArg values before passing them to AnalyzeFormalArguments(). When the SelectionDAGBuilder computes the Ins, it takes care of splitting input values across multiple registers. Each item in the Ins array represents a single value that will be stored in registers. Ins[x].VT is the value type of the value that will be stored in the register, so whatever SDNode we lower the argument to needs to be this type.
In order to correctly lower the arguments we need to know the size of each argument. Since Ins[x].VT gives us the size of the register that will hold the value, we need to look at Ins[x].ArgVT to see the 'real' type for the original function argument so that we can deduce the correct memory type to use for Ins[x]. In most cases the correct memory type will be Ins[x].ArgVT. However, this will not always be the case. If, for example, we have a kernel argument of type v8i8, this argument will be split into 8 parts and each part will be represented by its own item in the Ins array. For each part the Ins[x].ArgVT will be the v8i8, which is the full type of the argument before it was split. From this, we deduce that the memory type for each individual part is i8. We pass the memory type as LocVT to the calling convention analysis function and the register type (Ins[x].VT) as the ValVT.
Definition at line 1147 of file AMDGPUISelLowering.cpp.
References llvm::CCState::addLoc(), llvm::alignTo(), llvm::Function::args(), assert(), CC, llvm::ComputeValueVTs(), DL, llvm::CCValAssign::Full, llvm::AMDGPUSubtarget::get(), llvm::Function::getCallingConv(), llvm::CCState::getContext(), llvm::Module::getContext(), llvm::CCValAssign::getCustomMem(), llvm::Function::getDataLayout(), llvm::MachineFunction::getFunction(), llvm::EVT::getIntegerVT(), llvm::CCState::getMachineFunction(), llvm::TargetLoweringBase::getNumRegistersForCallingConv(), llvm::GlobalValue::getParent(), llvm::EVT::getPow2VectorType(), llvm::TargetLoweringBase::getRegisterTypeForCallingConv(), llvm::EVT::getRoundIntegerType(), llvm::EVT::getScalarType(), llvm::MVT::getScalarType(), llvm::EVT::getSimpleVT(), llvm::EVT::getStoreSize(), llvm::EVT::getStoreSizeInBits(), llvm::EVT::getVectorNumElements(), llvm::MVT::getVectorNumElements(), llvm::EVT::getVectorVT(), llvm::EVT::isExtended(), llvm::MVT::isFloatingPoint(), llvm::MVT::isInteger(), llvm::EVT::isPow2VectorType(), llvm::EVT::isSimple(), llvm::EVT::isVector(), llvm::MVT::isVector(), llvm_unreachable, and llvm::SmallVectorBase< Size_T >::size().
Referenced by llvm::R600TargetLowering::LowerFormalArguments(), and llvm::SITargetLowering::LowerFormalArguments().
|
static |
Selects the correct CCAssignFn for a given CallingConvention value.
Definition at line 1278 of file AMDGPUISelLowering.cpp.
References CC, and llvm::AMDGPUCallLowering::CCAssignFnForCall().
Referenced by getAssignFnsForCC(), llvm::SITargetLowering::isEligibleForTailCallOptimization(), llvm::SITargetLowering::LowerCall(), llvm::AMDGPUCallLowering::lowerFormalArguments(), and llvm::SITargetLowering::LowerFormalArguments().
|
static |
Definition at line 1283 of file AMDGPUISelLowering.cpp.
References CC, and llvm::AMDGPUCallLowering::CCAssignFnForReturn().
Referenced by llvm::SITargetLowering::CanLowerReturn(), llvm::AMDGPUCallLowering::lowerCall(), llvm::SITargetLowering::LowerCallResult(), and llvm::SITargetLowering::LowerReturn().
SDValue AMDGPUTargetLowering::combineFMinMaxLegacy | ( | const SDLoc & | DL, |
EVT | VT, | ||
SDValue | LHS, | ||
SDValue | RHS, | ||
SDValue | True, | ||
SDValue | False, | ||
SDValue | CC, | ||
DAGCombinerInfo & | DCI | ||
) | const |
Generate Min/Max node.
Definition at line 1661 of file AMDGPUISelLowering.cpp.
References CC, combineFMinMaxLegacyImpl(), llvm::TargetLowering::DAGCombinerInfo::DAG, DL, llvm::ISD::FNEG, llvm::SelectionDAG::getNode(), llvm::ConstantFPSDNode::getValueAPF(), LHS, llvm::neg(), peekFNeg(), and RHS.
Referenced by performSelectCombine().
SDValue AMDGPUTargetLowering::combineFMinMaxLegacyImpl | ( | const SDLoc & | DL, |
EVT | VT, | ||
SDValue | LHS, | ||
SDValue | RHS, | ||
SDValue | True, | ||
SDValue | False, | ||
SDValue | CC, | ||
DAGCombinerInfo & | DCI | ||
) | const |
Definition at line 1592 of file AMDGPUISelLowering.cpp.
References llvm::AfterLegalizeDAG, CC, llvm::TargetLowering::DAGCombinerInfo::DAG, DL, llvm::AMDGPUISD::FMAX_LEGACY, llvm::AMDGPUISD::FMIN_LEGACY, llvm::TargetLowering::DAGCombinerInfo::getDAGCombineLevel(), llvm::SelectionDAG::getNode(), llvm::TargetLowering::DAGCombinerInfo::isCalledByLegalizer(), LHS, llvm_unreachable, RHS, llvm::ISD::SETCC_INVALID, llvm::ISD::SETEQ, llvm::ISD::SETFALSE, llvm::ISD::SETFALSE2, llvm::ISD::SETGE, llvm::ISD::SETGT, llvm::ISD::SETLE, llvm::ISD::SETLT, llvm::ISD::SETNE, llvm::ISD::SETO, llvm::ISD::SETOEQ, llvm::ISD::SETOGE, llvm::ISD::SETOGT, llvm::ISD::SETOLE, llvm::ISD::SETOLT, llvm::ISD::SETONE, llvm::ISD::SETTRUE, llvm::ISD::SETTRUE2, llvm::ISD::SETUEQ, llvm::ISD::SETUGE, llvm::ISD::SETUGT, llvm::ISD::SETULE, llvm::ISD::SETULT, llvm::ISD::SETUNE, and llvm::ISD::SETUO.
Referenced by combineFMinMaxLegacy().
|
overridevirtual |
Determine which of the bits specified in Mask are known to be either zero or one and return them in the KnownZero and KnownOne bitsets.
Reimplemented from llvm::TargetLowering.
Reimplemented in llvm::SITargetLowering.
Definition at line 5619 of file AMDGPUISelLowering.cpp.
References llvm::AMDGPUISD::BFE_I32, llvm::AMDGPUISD::BFE_U32, llvm::BitWidth, llvm::AMDGPUISD::BORROW, llvm::AMDGPUISD::BUFFER_LOAD_UBYTE, llvm::AMDGPUISD::BUFFER_LOAD_USHORT, llvm::AMDGPUISD::CARRY, llvm::SelectionDAG::computeKnownBits(), llvm::countl_zero(), llvm::KnownBits::countMaxActiveBits(), llvm::KnownBits::countMaxSignificantBits(), llvm::KnownBits::countMinTrailingZeros(), llvm::Depth, llvm::AMDGPUISD::FP_TO_FP16, llvm::KnownBits::getBitWidth(), llvm::SelectionDAG::getDataLayout(), llvm::MachineFunction::getFunction(), llvm::APInt::getHighBitsSet(), llvm::SelectionDAG::getMachineFunction(), llvm::AMDGPUSubtarget::getMaxWorkitemID(), llvm::APInt::getZExtValue(), llvm::ConstantSDNode::getZExtValue(), I, llvm::ISD::INTRINSIC_WO_CHAIN, llvm::KnownBits::isNegative(), llvm::KnownBits::isNonNegative(), llvm::KnownBits::isStrictlyPositive(), llvm::KnownBits::isUnknown(), llvm::AMDGPUISD::LDS, llvm::Log2(), llvm::AMDGPUISD::MUL_I24, llvm::AMDGPUISD::MUL_U24, llvm::KnownBits::One, llvm::AMDGPUISD::PERM, llvm::KnownBits::resetAll(), llvm::APInt::setBitsFrom(), llvm::APInt::setHighBits(), llvm::APInt::setLowBits(), llvm::AMDGPUISD::SMAX3, llvm::AMDGPUISD::SMED3, llvm::AMDGPUISD::SMIN3, llvm::KnownBits::trunc(), llvm::AMDGPUISD::UMAX3, llvm::AMDGPUISD::UMED3, llvm::AMDGPUISD::UMIN3, workitemIntrinsicDim(), and llvm::KnownBits::Zero.
Referenced by llvm::SITargetLowering::computeKnownBitsForTargetNode().
|
overridevirtual |
This method can be implemented by targets that want to expose additional information about sign bits to GlobalISel combiners.
The DemandedElts argument allows us to only collect the minimum sign bits that are shared by the requested vector elements.
Reimplemented from llvm::TargetLowering.
Definition at line 5845 of file AMDGPUISelLowering.cpp.
References Analysis, llvm::Depth, MI, and MRI.
|
overridevirtual |
This method can be implemented by targets that want to expose additional information about sign bits to the DAG Combiner.
The DemandedElts argument allows us to only collect the minimum sign bits that are shared by the requested vector elements.
Reimplemented from llvm::TargetLowering.
Definition at line 5784 of file AMDGPUISelLowering.cpp.
References llvm::AMDGPUISD::BFE_I32, llvm::AMDGPUISD::BFE_U32, llvm::AMDGPUISD::BORROW, llvm::AMDGPUISD::BUFFER_LOAD_BYTE, llvm::AMDGPUISD::BUFFER_LOAD_SHORT, llvm::AMDGPUISD::BUFFER_LOAD_UBYTE, llvm::AMDGPUISD::BUFFER_LOAD_USHORT, llvm::AMDGPUISD::CARRY, llvm::SelectionDAG::ComputeNumSignBits(), llvm::Depth, llvm::AMDGPUISD::FP_TO_FP16, llvm::ConstantSDNode::getZExtValue(), llvm::isNullConstant(), llvm::AMDGPUISD::SMAX3, llvm::AMDGPUISD::SMED3, llvm::AMDGPUISD::SMIN3, llvm::AMDGPUISD::UMAX3, llvm::AMDGPUISD::UMED3, and llvm::AMDGPUISD::UMIN3.
|
inline |
Definition at line 342 of file AMDGPUISelLowering.h.
References CreateLiveInRegister(), llvm::SelectionDAG::getEntryNode(), and Reg.
SDValue AMDGPUTargetLowering::CreateLiveInRegister | ( | SelectionDAG & | DAG, |
const TargetRegisterClass * | RC, | ||
Register | Reg, | ||
EVT | VT, | ||
const SDLoc & | SL, | ||
bool | RawReg = false |
||
) | const |
Helper function that adds Reg to the LiveIn list of the DAG's MachineFunction.
Returns a RegisterSDNode representing Reg if RawReg is true, otherwise a copy from the register.
Definition at line 5282 of file AMDGPUISelLowering.cpp.
References llvm::SelectionDAG::getCopyFromReg(), llvm::SelectionDAG::getEntryNode(), llvm::SelectionDAG::getMachineFunction(), llvm::MachineFunction::getRegInfo(), llvm::SelectionDAG::getRegister(), and MRI.
Referenced by CreateLiveInRegister(), CreateLiveInRegisterRaw(), and loadInputValue().
|
inline |
Definition at line 349 of file AMDGPUISelLowering.h.
References CreateLiveInRegister(), llvm::SelectionDAG::getEntryNode(), and Reg.
Referenced by llvm::R600TargetLowering::LowerOperation().
|
protected |
Definition at line 4534 of file AMDGPUISelLowering.cpp.
References llvm::TargetLowering::DAGCombinerInfo::AddToWorklist(), allUsesHaveSourceMods(), llvm::TargetLoweringBase::Cheaper, Cond, llvm::TargetLowering::DAGCombinerInfo::DAG, distributeOpThroughSelect(), llvm::ISD::FABS, llvm::ISD::FMUL, llvm::ISD::FNEG, fnegFoldsIntoOp(), getConstantNegateCost(), llvm::SDValue::getNode(), llvm::SelectionDAG::getNode(), llvm::SDValue::getOpcode(), llvm::SDValue::hasOneUse(), llvm::ConstantFPSDNode::isNegative(), LHS, N, RHS, llvm::ISD::SELECT, selectSupportsSourceMods(), and std::swap().
Referenced by performSelectCombine().
|
protected |
Definition at line 4670 of file AMDGPUISelLowering.cpp.
References llvm::CallingConv::C, llvm::TargetLoweringBase::Cheaper, llvm::TargetLoweringBase::Expensive, llvm::AMDGPUSubtarget::hasInv2PiInlineImm(), isInv2Pi(), and llvm::TargetLoweringBase::Neutral.
Referenced by foldFreeOpFromSelect(), isConstantCheaperToNegate(), and isConstantCostlierToNegate().
|
staticprotected |
Definition at line 40 of file AMDGPUISelLowering.cpp.
References llvm::EVT::getIntegerVT(), llvm::EVT::getStoreSizeInBits(), and llvm::EVT::getVectorVT().
Referenced by performLoadCombine(), performStoreCombine(), and llvm::SITargetLowering::ReplaceNodeResults().
|
inlineoverridevirtual |
Return the type for operands of fence.
TODO: Let fence operands be of i32 type and remove this.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 387 of file AMDGPUISelLowering.h.
|
protected |
Definition at line 1722 of file AMDGPUISelLowering.cpp.
References llvm::ISD::BITCAST, llvm::ISD::EXTRACT_VECTOR_ELT, llvm::SelectionDAG::getConstant(), and llvm::SelectionDAG::getNode().
Referenced by LowerFTRUNC(), performSraCombine(), and performSrlCombine().
uint32_t AMDGPUTargetLowering::getImplicitParameterOffset | ( | const MachineFunction & | MF, |
const ImplicitParameter | Param | ||
) | const |
Helper function that returns the byte offset of the given type of implicit parameter.
Definition at line 5393 of file AMDGPUISelLowering.cpp.
References llvm::AMDGPUMachineFunction::getExplicitKernArgSize(), getImplicitParameterOffset(), and llvm::MachineFunction::getInfo().
Referenced by llvm::AMDGPULegalizerInfo::getImplicitArgPtr(), getImplicitParameterOffset(), llvm::AMDGPULegalizerInfo::legalizeTrapHsaQueuePtr(), and llvm::R600TargetLowering::LowerOperation().
uint32_t AMDGPUTargetLowering::getImplicitParameterOffset | ( | const uint64_t | ExplicitKernArgSize, |
const ImplicitParameter | Param | ||
) | const |
Definition at line 5374 of file AMDGPUISelLowering.cpp.
References llvm::alignTo(), FIRST_IMPLICIT, llvm::AMDGPUSubtarget::getAlignmentForImplicitArgPtr(), llvm::AMDGPUSubtarget::getExplicitKernelArgOffset(), llvm_unreachable, PRIVATE_BASE, llvm::AMDGPU::ImplicitArg::PRIVATE_BASE_OFFSET, QUEUE_PTR, llvm::AMDGPU::ImplicitArg::QUEUE_PTR_OFFSET, SHARED_BASE, and llvm::AMDGPU::ImplicitArg::SHARED_BASE_OFFSET.
|
protected |
Definition at line 2606 of file AMDGPUISelLowering.cpp.
References llvm::ISD::FABS, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::EVT::getFltSemantics(), llvm::APFloat::getInf(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), and llvm::ISD::SETOLT.
Referenced by LowerFLOGCommon().
|
protected |
Definition at line 2588 of file AMDGPUISelLowering.cpp.
References llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::EVT::getFltSemantics(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::APFloat::getSmallestNormalized(), and llvm::ISD::SETOLT.
|
protected |
Definition at line 1714 of file AMDGPUISelLowering.cpp.
References llvm::ISD::BITCAST, llvm::ISD::EXTRACT_VECTOR_ELT, llvm::SelectionDAG::getConstant(), and llvm::SelectionDAG::getNode().
|
overridevirtual |
Return the newly negated expression if the cost is not expensive, and set Cost to indicate whether the negation is cheaper or neutral.
Reimplemented from llvm::TargetLowering.
Definition at line 909 of file AMDGPUISelLowering.cpp.
References allUsesHaveSourceMods(), llvm::Depth, llvm::ISD::FMA, llvm::ISD::FMAD, getNegatedExpression(), llvm::TargetLowering::getNegatedExpression(), llvm::SelectionDAG::getNode(), and llvm::AMDGPUISD::RCP.
Referenced by getNegatedExpression().
|
overridevirtual |
Return a reciprocal estimate value for the input operand.
Enabled is a ReciprocalEstimate enum with value either 'Unspecified' or 'Enabled' as set by a potential default override attribute. If RefinementSteps is 'Unspecified', the number of Newton-Raphson refinement iterations required to generate a sufficient (though not necessarily IEEE-754 compliant) estimate is returned in that parameter. A target may choose to implement its own refinement within this function. If that's true, then return '0' as the number of RefinementSteps to avoid any further refinement of the estimate. An empty SDValue return means no estimate sequence can be created.
Reimplemented from llvm::TargetLowering.
Definition at line 5585 of file AMDGPUISelLowering.cpp.
References llvm::SelectionDAG::getNode(), llvm::SDValue::getValueType(), and llvm::AMDGPUISD::RCP.
|
protected |
If denormal handling is required, return the scaled input to FLOG2 and the check for denormal range.
Otherwise, return null values.
Definition at line 2623 of file AMDGPUISelLowering.cpp.
References llvm::ISD::FMUL, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::APFloat::getSmallestNormalized(), llvm::APFloatBase::IEEEsingle(), needsDenormHandlingF32(), llvm::ISD::SELECT, and llvm::ISD::SETOLT.
Referenced by LowerFLOG2(), LowerFLOGCommon(), and LowerFLOGUnsafe().
|
protected |
Split a vector type into two parts.
The first part is a power of two vector. The second part is whatever is left over, and is a scalar if it would otherwise be a 1-vector.
Definition at line 1734 of file AMDGPUISelLowering.cpp.
References llvm::SelectionDAG::getContext(), llvm::EVT::getVectorElementType(), llvm::EVT::getVectorNumElements(), llvm::EVT::getVectorVT(), and llvm::PowerOf2Ceil().
Referenced by SplitVectorLoad(), and SplitVectorStore().
|
overridevirtual |
Hooks for building estimates in place of slower divisions and square roots.
Return either a square root or its reciprocal estimate value for the input operand. Enabled is a ReciprocalEstimate enum with value either 'Unspecified' or 'Enabled' as set by a potential default override attribute. If RefinementSteps is 'Unspecified', the number of Newton-Raphson refinement iterations required to generate a sufficient (though not necessarily IEEE-754 compliant) estimate is returned in that parameter. The boolean UseOneConstNR output is used to select a Newton-Raphson algorithm implementation that uses either one or two constants. The boolean Reciprocal is used to select whether the estimate is for the square root of the input operand or the reciprocal of its square root. A target may choose to implement its own refinement within this function. If that's true, then return '0' as the number of RefinementSteps to avoid any further refinement of the estimate. An empty SDValue return means no estimate sequence can be created.
Reimplemented from llvm::TargetLowering.
Definition at line 5567 of file AMDGPUISelLowering.cpp.
References llvm::SelectionDAG::getNode(), llvm::SDValue::getValueType(), and llvm::AMDGPUISD::RSQ.
This method returns the name of a target specific DAG node.
Reimplemented from llvm::TargetLowering.
Definition at line 5401 of file AMDGPUISelLowering.cpp.
References llvm::AMDGPUISD::FIRST_MEM_OPCODE_NUMBER, llvm::AMDGPUISD::FIRST_NUMBER, llvm::AMDGPUISD::LAST_AMDGPU_ISD_NUMBER, LDS, and NODE_NAME_CASE.
|
overridevirtual |
Return the type that should be used to zero or sign extend a zeroext/signext integer return value.
FIXME: Some C calling conventions require the return type to be promoted, but this is not true all the time, e.g. i1/i8/i16 on x86/x86_64. It is also not necessary for non-C calling conventions. The frontend should handle this and include all of the necessary information.
Reimplemented from llvm::TargetLowering.
Definition at line 783 of file AMDGPUISelLowering.cpp.
References assert(), llvm::EVT::getIntegerVT(), llvm::EVT::getSizeInBits(), llvm::EVT::isVector(), and Size.
|
overridevirtual |
Returns the type to be used for the index operand of: ISD::INSERT_VECTOR_ELT, ISD::EXTRACT_VECTOR_ELT, ISD::INSERT_SUBVECTOR, and ISD::EXTRACT_SUBVECTOR.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 794 of file AMDGPUISelLowering.cpp.
Return true if it is cheap to speculate a call to intrinsic ctlz.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 885 of file AMDGPUISelLowering.cpp.
Return true if it is cheap to speculate a call to intrinsic cttz.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 881 of file AMDGPUISelLowering.cpp.
Definition at line 4686 of file AMDGPUISelLowering.cpp.
References llvm::CallingConv::C, llvm::TargetLoweringBase::Cheaper, getConstantNegateCost(), llvm::isConstOrConstSplatFP(), and N.
Definition at line 4680 of file AMDGPUISelLowering.cpp.
References llvm::CallingConv::C, llvm::TargetLoweringBase::Expensive, getConstantNegateCost(), llvm::isConstOrConstSplatFP(), and N.
Referenced by performFNegCombine().
|
overridevirtual |
Return true if it is profitable to move this shift by a constant amount through its operand, adjusting any immediate operands as necessary to preserve semantics.
This transformation may not be desirable if it disrupts a particularly auspicious target-specific tree (e.g. bitfield extraction in AArch64). By default, it returns true.
N | the shift node |
Level | the current DAGCombine legalization level. |
Reimplemented from llvm::TargetLowering.
Definition at line 1030 of file AMDGPUISelLowering.cpp.
References llvm::AfterLegalizeTypes, assert(), LHS, N, llvm::ISD::OR, RHS, llvm::ISD::SHL, llvm::ISD::SRA, llvm::ISD::SRL, and llvm::ISD::ZEXTLOAD.
Return true if an fabs operation is free to the point where it is never worthwhile to replace it with a bitwise operation.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 944 of file AMDGPUISelLowering.cpp.
References assert(), llvm::AMDGPUSubtarget::has16BitInsts(), and llvm::EVT::isFloatingPoint().
Return true if an fneg operation is free to the point where it is never worthwhile to replace it with a bitwise operation.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 952 of file AMDGPUISelLowering.cpp.
References assert(), llvm::EVT::getScalarType(), and llvm::EVT::isFloatingPoint().
Referenced by llvm::GCNTTIImpl::getArithmeticInstrCost().
|
overridevirtual |
Returns true if the target can instruction select the specified FP immediate natively.
If false, the legalizer will materialize the FP immediate as a load from a constant pool.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 804 of file AMDGPUISelLowering.cpp.
References llvm::EVT::getScalarType(), and llvm::AMDGPUSubtarget::has16BitInsts().
|
inlineoverridevirtual |
Return true if SQRT(X) shouldn't be replaced with X*RSQRT(X).
Reimplemented from llvm::TargetLoweringBase.
Definition at line 293 of file AMDGPUISelLowering.h.
|
overridevirtual |
If SNaN is false, returns true if Op is known to never be any NaN. If SNaN is true, returns true if Op is known to never be a signaling NaN.
Reimplemented from llvm::TargetLowering.
Reimplemented in llvm::SITargetLowering.
Definition at line 5882 of file AMDGPUISelLowering.cpp.
References llvm::AMDGPUISD::COS_HW, llvm::AMDGPUISD::CVT_F32_UBYTE0, llvm::AMDGPUISD::CVT_F32_UBYTE1, llvm::AMDGPUISD::CVT_F32_UBYTE2, llvm::AMDGPUISD::CVT_F32_UBYTE3, llvm::AMDGPUISD::CVT_PKRTZ_F16_F32, llvm::Depth, llvm::AMDGPUISD::DIV_FIXUP, llvm::AMDGPUISD::DIV_FMAS, llvm::AMDGPUISD::DIV_SCALE, llvm::ISD::FLDEXP, llvm::AMDGPUISD::FMAD_FTZ, llvm::AMDGPUISD::FMAX3, llvm::AMDGPUISD::FMAX_LEGACY, llvm::AMDGPUISD::FMAXIMUM3, llvm::AMDGPUISD::FMED3, llvm::AMDGPUISD::FMIN3, llvm::AMDGPUISD::FMIN_LEGACY, llvm::AMDGPUISD::FMINIMUM3, llvm::AMDGPUISD::FMUL_LEGACY, llvm::AMDGPUISD::FRACT, llvm::ISD::INTRINSIC_WO_CHAIN, llvm::SelectionDAG::isKnownNeverNaN(), llvm::AMDGPUISD::RCP, llvm::AMDGPUISD::RCP_LEGACY, llvm::AMDGPUISD::RSQ, llvm::AMDGPUISD::RSQ_CLAMP, and llvm::AMDGPUISD::SIN_HW.
Referenced by llvm::SITargetLowering::isKnownNeverNaNForTargetNode().
|
finalvirtual |
Return true if the following transform is beneficial: fold (conv (load x)) -> (load (conv*)x). On architectures that don't natively support some vector loads efficiently, casting the load to a smaller vector of larger types and loading is more efficient; however, this can be undone by optimizations in the DAG combiner.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 857 of file AMDGPUISelLowering.cpp.
References llvm::TargetLoweringBase::allowsMemoryAccessForAlignment(), assert(), llvm::CallingConv::Fast, llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::EVT::getScalarSizeInBits(), llvm::EVT::getScalarType(), and llvm::EVT::getSizeInBits().
Return true if it's profitable to narrow operations of type SrcVT to DestVT.
e.g. on x86, it's profitable to narrow from i32 to i8 but not from i32 to i16.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 1020 of file AMDGPUISelLowering.cpp.
References llvm::EVT::getSizeInBits().
|
overridevirtual |
Reimplemented from llvm::TargetLowering.
Reimplemented in llvm::SITargetLowering.
Definition at line 5996 of file AMDGPUISelLowering.cpp.
References MRI.
Reimplemented from llvm::TargetLowering.
Definition at line 889 of file AMDGPUISelLowering.cpp.
References llvm::AMDGPUAS::CONSTANT_ADDRESS_32BIT, llvm::ISD::EntryToken, llvm::ISD::INTRINSIC_WO_CHAIN, llvm::AMDGPU::isIntrinsicAlwaysUniform(), llvm::ISD::LOAD, N, llvm::AMDGPUISD::SETCC, and llvm::ISD::TokenFactor.
|
overridevirtual |
Reimplemented from llvm::TargetLoweringBase.
Definition at line 798 of file AMDGPUISelLowering.cpp.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 977 of file AMDGPUISelLowering.cpp.
References llvm::EVT::getSizeInBits().
Return true if it's free to truncate a value of type FromTy to type ToTy.
e.g. On x86 it's free to truncate an i32 value in register EAX to i16 by referencing its sub-register AX. Targets must return false when FromTy <= ToTy.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 986 of file AMDGPUISelLowering.cpp.
References llvm::Type::getScalarSizeInBits(), and llvm::AMDGPUSubtarget::has16BitInsts().
Reimplemented from llvm::TargetLoweringBase.
Definition at line 1008 of file AMDGPUISelLowering.cpp.
Return true if any actual instruction that defines a value of type FromTy implicitly zero-extends the value to ToTy in the result register.
The function should return true when it is likely that the truncate can be freely folded with an instruction defining a value of FromTy. If the defining instruction is unknown (because you're looking at a function argument, PHI, etc.) then the target may require an explicit truncate, which is not necessarily free, but this function does not deal with those cases. Targets must return false when FromTy >= ToTy.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 998 of file AMDGPUISelLowering.cpp.
References llvm::Type::getScalarSizeInBits(), and llvm::AMDGPUSubtarget::has16BitInsts().
SDValue AMDGPUTargetLowering::loadInputValue | ( | SelectionDAG & | DAG, |
const TargetRegisterClass * | RC, | ||
EVT | VT, | ||
const SDLoc & | SL, | ||
const ArgDescriptor & | Arg | ||
) | const |
Definition at line 5353 of file AMDGPUISelLowering.cpp.
References llvm::ISD::AND, assert(), CreateLiveInRegister(), llvm::SelectionDAG::getConstant(), llvm::ArgDescriptor::getMask(), llvm::SelectionDAG::getNode(), llvm::ArgDescriptor::getRegister(), llvm::SelectionDAG::getShiftAmountConstant(), llvm::ArgDescriptor::getStackOffset(), llvm::ArgDescriptor::isMasked(), llvm::ArgDescriptor::isRegister(), loadStackInputValue(), and llvm::ISD::SRL.
Referenced by llvm::SITargetLowering::passSpecialInputs().
SDValue AMDGPUTargetLowering::loadStackInputValue | ( | SelectionDAG & | DAG, |
EVT | VT, | ||
const SDLoc & | SL, | ||
int64_t | Offset | ||
) | const |
Similar to CreateLiveInRegister, except the value may be loaded from a stack slot rather than passed in a register.
Definition at line 5318 of file AMDGPUISelLowering.cpp.
References llvm::SelectionDAG::getEntryNode(), llvm::SelectionDAG::getFrameIndex(), llvm::MachineFunction::getFrameInfo(), llvm::SelectionDAG::getLoad(), llvm::SelectionDAG::getMachineFunction(), getOrCreateFixedStackObject(), llvm::MachinePointerInfo::getStack(), llvm::EVT::getStoreSize(), llvm::MachineMemOperand::MODereferenceable, llvm::MachineMemOperand::MOInvariant, llvm::Offset, and Ptr.
Referenced by loadInputValue().
|
overridevirtual |
This hook must be implemented to lower calls into the specified DAG.
The outgoing arguments to the call are described by the Outs array, and the values to be returned by the call are described by the Ins array. The implementation should fill in the InVals array with legal-type return values from the call, and return the resulting token chain value.
Reimplemented from llvm::TargetLowering.
Reimplemented in llvm::SITargetLowering.
Definition at line 1349 of file AMDGPUISelLowering.cpp.
References lowerUnhandledCall().
|
protected |
Definition at line 1504 of file AMDGPUISelLowering.cpp.
References llvm::ISD::BITCAST, llvm::SelectionDAG::ExtractVectorElements(), llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getNode(), llvm::DWARFExpression::Operation::getNumOperands(), llvm::EVT::getSizeInBits(), llvm::EVT::getVectorElementType(), and llvm::EVT::getVectorVT().
Referenced by LowerOperation().
|
protected |
Definition at line 3143 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ADD, assert(), llvm::ISD::CTLZ_ZERO_UNDEF, llvm::ISD::CTTZ_ZERO_UNDEF, llvm::AMDGPUISD::FFBH_U32, llvm::AMDGPUISD::FFBL_B32, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getNode(), llvm::Hi, isCtlzOpc(), isCttzOpc(), llvm::Lo, split64BitValue(), llvm::ISD::UADDSAT, llvm::ISD::UMIN, and llvm::ISD::ZERO_EXTEND.
Referenced by LowerOperation().
|
protected |
Definition at line 3113 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ANY_EXTEND, assert(), llvm::ISD::CTLZ_ZERO_UNDEF, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getNode(), isCtlzOpc(), llvm::ISD::SHL, llvm::ISD::SUB, llvm::ISD::TRUNCATE, and llvm::ISD::ZERO_EXTEND.
Referenced by ReplaceNodeResults().
|
protected |
Definition at line 1902 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ADD, llvm::ISD::AND, llvm::SelectionDAG::ComputeNumSignBits(), DL, llvm::ISD::FABS, llvm::ISD::FMA, llvm::ISD::FMAD, llvm::AMDGPUISD::FMAD_FTZ, llvm::ISD::FMUL, llvm::ISD::FNEG, llvm::SIModeRegisterDefaults::FP32Denormals, llvm::ISD::FP_TO_SINT, llvm::ISD::FP_TO_UINT, llvm::ISD::FTRUNC, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::MachineFunction::getInfo(), llvm::EVT::getIntegerVT(), llvm::SelectionDAG::getMachineFunction(), llvm::SelectionDAG::getMergeValues(), llvm::SIMachineFunctionInfo::getMode(), llvm::SelectionDAG::getNode(), llvm::DenormalMode::getPreserveSign(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::EVT::getSizeInBits(), llvm::SelectionDAG::getValueType(), llvm::AMDGPUSubtarget::hasMadMacF32Insts(), llvm::AMDGPUSubtarget::isGCN(), LHS, llvm::ISD::MUL, llvm::ISD::OR, llvm::AMDGPUISD::RCP, RHS, llvm::ISD::SELECT, llvm::ISD::SETOGE, llvm::ISD::SIGN_EXTEND_INREG, llvm::ISD::SINT_TO_FP, llvm::ISD::SRA, llvm::ISD::SUB, llvm::ISD::UINT_TO_FP, and llvm::ISD::XOR.
Referenced by LowerSDIVREM(), and LowerUDIVREM().
SDValue AMDGPUTargetLowering::LowerDYNAMIC_STACKALLOC | ( | SDValue | Op, |
SelectionDAG & | DAG | ||
) | const |
Definition at line 1354 of file AMDGPUISelLowering.cpp.
References llvm::LLVMContext::diagnose(), llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getContext(), getDebugLoc(), llvm::MachineFunction::getFunction(), llvm::SelectionDAG::getMachineFunction(), and llvm::SelectionDAG::getMergeValues().
Referenced by llvm::SITargetLowering::LowerDYNAMIC_STACKALLOC(), and LowerOperation().
|
protected |
Definition at line 1539 of file AMDGPUISelLowering.cpp.
References assert(), llvm::ISD::BITCAST, llvm::SelectionDAG::ExtractVectorElements(), llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getNode(), llvm::EVT::getScalarSizeInBits(), llvm::EVT::getVectorNumElements(), and llvm::EVT::getVectorVT().
Referenced by LowerOperation().
|
protected |
Definition at line 2361 of file AMDGPUISelLowering.cpp.
References llvm::Add, llvm::And, llvm::ISD::AND, llvm::ISD::FADD, llvm::ISD::FTRUNC, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::ISD::SELECT, llvm::ISD::SETOGT, and llvm::ISD::SETONE.
Referenced by LowerOperation().
|
protected |
Definition at line 2972 of file AMDGPUISelLowering.cpp.
References A, allowApproxFunc(), llvm::ISD::AND, assert(), llvm::ISD::BITCAST, llvm::CallingConv::C, CC, CH, llvm::AMDGPUISD::EXP, llvm::ISD::FADD, llvm::ISD::FEXP10, llvm::ISD::FLDEXP, llvm::ISD::FMA, llvm::ISD::FMUL, llvm::ISD::FNEG, llvm::ISD::FP_EXTEND, llvm::ISD::FP_ROUND, llvm::ISD::FP_TO_SINT, llvm::ISD::FROUNDEVEN, llvm::ISD::FSUB, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::APFloat::getInf(), getMad(), llvm::SelectionDAG::getNode(), llvm::EVT::getScalarType(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::SelectionDAG::getTargetConstant(), llvm::TargetLoweringBase::getTargetMachine(), llvm::AMDGPUSubtarget::hasFastFMAF32(), llvm::APFloatBase::IEEEsingle(), llvm::EVT::isVector(), llvm::numbers::log2ef, lowerFEXP10Unsafe(), lowerFEXPUnsafe(), llvm::TargetMachine::Options, Options, llvm::ISD::SELECT, llvm::SDNodeFlags::setAllowContract(), llvm::ISD::SETOGT, llvm::ISD::SETOLT, and X.
Referenced by LowerOperation(), and ReplaceNodeResults().
|
protected |
Emit approx-funcs appropriate lowering for exp10.
inf/nan should still be handled correctly.
Definition at line 2920 of file AMDGPUISelLowering.cpp.
References llvm::AMDGPUISD::EXP, llvm::ISD::FADD, llvm::ISD::FEXP2, llvm::ISD::FMUL, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), needsDenormHandlingF32(), llvm::ISD::SELECT, llvm::ISD::SETOLT, and X.
Referenced by lowerFEXP().
|
protected |
Definition at line 2829 of file AMDGPUISelLowering.cpp.
References assert(), llvm::AMDGPUISD::EXP, llvm::ISD::FADD, llvm::ISD::FMUL, llvm::ISD::FP_EXTEND, llvm::ISD::FP_ROUND, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::SelectionDAG::getTargetConstant(), llvm::AMDGPUSubtarget::has16BitInsts(), needsDenormHandlingF32(), llvm::ISD::SELECT, and llvm::ISD::SETOLT.
Referenced by LowerOperation(), and ReplaceNodeResults().
|
protected |
Definition at line 2880 of file AMDGPUISelLowering.cpp.
References llvm::AMDGPUISD::EXP, llvm::ISD::FADD, llvm::ISD::FEXP2, llvm::ISD::FMUL, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::numbers::log2e, llvm::Mul, needsDenormHandlingF32(), llvm::ISD::SELECT, llvm::ISD::SETOLT, and X.
Referenced by lowerFEXP().
|
protected |
Definition at line 2522 of file AMDGPUISelLowering.cpp.
References llvm::Add, llvm::And, llvm::ISD::AND, llvm::ISD::FADD, llvm::ISD::FTRUNC, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::ISD::SELECT, llvm::ISD::SETOLT, and llvm::ISD::SETONE.
Referenced by LowerOperation().
|
protected |
Definition at line 2784 of file AMDGPUISelLowering.cpp.
References LowerFLOGCommon().
|
protected |
Definition at line 2646 of file AMDGPUISelLowering.cpp.
References assert(), llvm::ISD::FP_EXTEND, llvm::ISD::FP_ROUND, llvm::ISD::FSUB, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getNode(), getScaledLogInput(), llvm::SelectionDAG::getTargetConstant(), llvm::AMDGPUSubtarget::has16BitInsts(), llvm::AMDGPUISD::LOG, llvm::Log2(), and llvm::ISD::SELECT.
Referenced by LowerOperation(), and ReplaceNodeResults().
|
protected |
Definition at line 2687 of file AMDGPUISelLowering.cpp.
References llvm::ISD::AND, assert(), llvm::ISD::BITCAST, llvm::CallingConv::C, CC, CH, DL, llvm::ISD::FADD, llvm::ISD::FLOG, llvm::ISD::FLOG10, llvm::ISD::FMA, llvm::ISD::FMUL, llvm::ISD::FNEG, llvm::ISD::FP_EXTEND, llvm::ISD::FP_ROUND, llvm::ISD::FSUB, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getConstantFP(), getIsFinite(), getMad(), llvm::SelectionDAG::getNode(), getScaledLogInput(), llvm::SelectionDAG::getTargetConstant(), llvm::TargetLoweringBase::getTargetMachine(), llvm::AMDGPUSubtarget::has16BitInsts(), llvm::AMDGPUSubtarget::hasFastFMAF32(), llvm::AMDGPUISD::LOG, LowerFLOGUnsafe(), llvm::TargetMachine::Options, Options, llvm::ISD::SELECT, X, and Y.
Referenced by LowerFLOG10(), LowerOperation(), and ReplaceNodeResults().
|
protected |
Definition at line 2790 of file AMDGPUISelLowering.cpp.
References llvm::ISD::FADD, llvm::ISD::FLOG2, llvm::ISD::FMA, llvm::ISD::FMUL, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getNode(), getScaledLogInput(), llvm::AMDGPUSubtarget::hasFastFMAF32(), llvm::numbers::ln10, llvm::numbers::ln2, llvm::AMDGPUISD::LOG, llvm::Mul, and llvm::ISD::SELECT.
Referenced by LowerFLOGCommon().
|
protected |
Definition at line 2475 of file AMDGPUISelLowering.cpp.
References llvm::ISD::FROUNDEVEN, and llvm::SelectionDAG::getNode().
Referenced by LowerOperation().
|
protected |
Definition at line 3518 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ADD, llvm::ISD::AND, assert(), B, llvm::ISD::BITCAST, D, DL, llvm::AMDGPUISD::FP_TO_FP16, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSelectCC(), llvm::SDValue::getSimpleValueType(), llvm::TargetLoweringBase::getTargetMachine(), llvm::SDValue::getValueType(), llvm::SelectionDAG::getZExtOrTrunc(), I, N, Options, llvm::ISD::OR, llvm::ISD::SETEQ, llvm::ISD::SETGT, llvm::ISD::SETLT, llvm::ISD::SETNE, llvm::ISD::SHL, llvm::ISD::SMAX, llvm::ISD::SMIN, llvm::ISD::SRL, and llvm::ISD::SUB.
Referenced by LowerOperation().
|
protected |
Definition at line 3617 of file AMDGPUISelLowering.cpp.
References DL, llvm::ISD::FP16_TO_FP, llvm::ISD::FP_EXTEND, llvm::ISD::FP_TO_SINT, llvm::SelectionDAG::getNode(), LowerFP_TO_INT64(), llvm::ISD::SIGN_EXTEND, llvm::ISD::TRUNCATE, and llvm::ISD::ZERO_EXTEND.
Referenced by LowerOperation(), and llvm::SITargetLowering::LowerOperation().
|
protected |
Definition at line 3443 of file AMDGPUISelLowering.cpp.
References assert(), llvm::ISD::BITCAST, llvm::ISD::FABS, llvm::ISD::FFLOOR, llvm::ISD::FMA, llvm::ISD::FMUL, llvm::ISD::FP_TO_SINT, llvm::ISD::FP_TO_UINT, llvm::ISD::FTRUNC, llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getNode(), llvm::Hi, llvm::Lo, llvm::Mul, Signed, llvm::ISD::SRA, llvm::ISD::SUB, and llvm::ISD::XOR.
Referenced by LowerFP_TO_INT().
|
protected |
Split a vector store into multiple scalar stores.
Definition at line 2347 of file AMDGPUISelLowering.cpp.
References llvm::ISD::FDIV, llvm::ISD::FMA, llvm::ISD::FNEG, llvm::ISD::FTRUNC, llvm::SelectionDAG::getNode(), X, and Y.
Referenced by LowerOperation().
|
protected |
Definition at line 2484 of file AMDGPUISelLowering.cpp.
References llvm::ISD::FROUNDEVEN, and llvm::SelectionDAG::getNode().
Referenced by LowerOperation().
|
protected |
Definition at line 2495 of file AMDGPUISelLowering.cpp.
References llvm::ISD::FABS, llvm::ISD::FADD, llvm::ISD::FCOPYSIGN, llvm::ISD::FSUB, llvm::ISD::FTRUNC, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::ISD::SELECT, llvm::ISD::SETOGE, and X.
Referenced by LowerOperation().
|
protected |
Definition at line 2447 of file AMDGPUISelLowering.cpp.
References assert(), Cond, llvm::ISD::FABS, llvm::ISD::FADD, llvm::ISD::FCOPYSIGN, llvm::ISD::FSUB, llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSelect(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::APFloatBase::IEEEdouble(), and llvm::ISD::SETOGT.
Referenced by LowerOperation().
|
protected |
Definition at line 2401 of file AMDGPUISelLowering.cpp.
References llvm::ISD::AND, assert(), llvm::ISD::BITCAST, extractF64Exponent(), llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), getHiHalf64(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getNOT(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), llvm::Hi, llvm::ISD::SELECT, llvm::ISD::SETGT, llvm::ISD::SETLT, and llvm::ISD::SRA.
Referenced by LowerOperation().
|
protectedvirtual |
Definition at line 1453 of file AMDGPUISelLowering.cpp.
References llvm::Address, llvm::AMDGPUMachineFunction::allocateLDSGlobal(), assert(), llvm::LLVMContext::diagnose(), DL, llvm::DS_Warning, G, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getEntryNode(), llvm::MachineFunction::getFunction(), llvm::AMDGPUMachineFunction::getLDSAbsoluteAddress(), llvm::SelectionDAG::getMachineFunction(), llvm::Value::getName(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getRoot(), llvm::SelectionDAG::getUNDEF(), llvm::AMDGPUMachineFunction::isModuleEntryFunction(), llvm::AMDGPUAS::LOCAL_ADDRESS, llvm::Offset, llvm::AMDGPUAS::REGION_ADDRESS, llvm::SelectionDAG::setRoot(), llvm::ISD::TokenFactor, llvm::ISD::TRAP, and Trap.
|
protected |
Definition at line 3203 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ADD, llvm::ISD::BITCAST, llvm::ISD::CTLZ, llvm::AMDGPUISD::FFBH_I32, llvm::ISD::FLDEXP, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getNode(), llvm::Hi, llvm::AMDGPUSubtarget::isGCN(), llvm::Lo, llvm::ISD::OR, llvm::ISD::SHL, Signed, llvm::ISD::SINT_TO_FP, split64BitValue(), llvm::ISD::SRA, llvm::ISD::SUB, llvm::ISD::TRUNCATE, llvm::ISD::UINT_TO_FP, llvm::ISD::UMIN, and llvm::ISD::XOR.
Referenced by LowerSINT_TO_FP(), and LowerUINT_TO_FP().
|
protected |
Definition at line 3329 of file AMDGPUISelLowering.cpp.
References llvm::ISD::FADD, llvm::ISD::FLDEXP, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getNode(), llvm::Hi, llvm::Lo, Signed, llvm::ISD::SINT_TO_FP, split64BitValue(), and llvm::ISD::UINT_TO_FP.
Referenced by LowerSINT_TO_FP(), and LowerUINT_TO_FP().
|
overridevirtual |
This callback is invoked for operations that are unsupported by the target, which are registered to use 'custom' lowering, and whose defined values are all legal.
If the target has no operations that require custom lowering, it need not implement this. The default implementation of this aborts.
Reimplemented from llvm::TargetLowering.
Reimplemented in llvm::R600TargetLowering, and llvm::SITargetLowering.
Definition at line 1365 of file AMDGPUISelLowering.cpp.
References llvm::ISD::CONCAT_VECTORS, llvm::ISD::CTLZ, llvm::ISD::CTLZ_ZERO_UNDEF, llvm::ISD::CTTZ, llvm::ISD::CTTZ_ZERO_UNDEF, llvm::ISD::DYNAMIC_STACKALLOC, llvm::errs(), llvm::ISD::EXTRACT_SUBVECTOR, llvm::ISD::FCEIL, llvm::ISD::FEXP, llvm::ISD::FEXP10, llvm::ISD::FEXP2, llvm::ISD::FFLOOR, llvm::ISD::FLOG, llvm::ISD::FLOG10, llvm::ISD::FLOG2, llvm::ISD::FNEARBYINT, llvm::ISD::FP_TO_FP16, llvm::ISD::FP_TO_SINT, llvm::ISD::FP_TO_UINT, llvm::ISD::FREM, llvm::ISD::FRINT, llvm::ISD::FROUND, llvm::ISD::FROUNDEVEN, llvm::ISD::FTRUNC, llvm_unreachable, LowerCONCAT_VECTORS(), LowerCTLZ_CTTZ(), LowerDYNAMIC_STACKALLOC(), LowerEXTRACT_SUBVECTOR(), LowerFCEIL(), lowerFEXP(), lowerFEXP2(), LowerFFLOOR(), LowerFLOG2(), LowerFLOGCommon(), LowerFNEARBYINT(), LowerFP_TO_FP16(), LowerFP_TO_INT(), LowerFREM(), LowerFRINT(), LowerFROUND(), LowerFROUNDEVEN(), LowerFTRUNC(), LowerSDIVREM(), LowerSIGN_EXTEND_INREG(), LowerSINT_TO_FP(), LowerUDIVREM(), LowerUINT_TO_FP(), llvm::DWARFExpression::Operation::print(), llvm::ISD::SDIVREM, llvm::ISD::SIGN_EXTEND_INREG, llvm::ISD::SINT_TO_FP, llvm::ISD::UDIVREM, and llvm::ISD::UINT_TO_FP.
Referenced by llvm::R600TargetLowering::LowerOperation(), and llvm::SITargetLowering::LowerOperation().
|
overridevirtual |
This hook must be implemented to lower outgoing return values, described by the Outs array, into the specified DAG.
The implementation should return the resulting token chain value.
Reimplemented from llvm::TargetLowering.
Reimplemented in llvm::SITargetLowering.
Definition at line 1261 of file AMDGPUISelLowering.cpp.
References DL, llvm::AMDGPUISD::ENDPGM, and llvm::SelectionDAG::getNode().
Referenced by llvm::SITargetLowering::LowerReturn().
|
protected |
Definition at line 2286 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ADD, llvm::SelectionDAG::ComputeNumSignBits(), DL, llvm::ISD::EXTRACT_ELEMENT, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getContext(), llvm::EVT::getHalfSizedIntegerVT(), llvm::SelectionDAG::getMergeValues(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSelectCC(), llvm::SDValue::getValue(), llvm::SelectionDAG::getVTList(), LHS, LowerDIVREM24(), RHS, llvm::ISD::SDIVREM, llvm::ISD::SETLT, llvm::ISD::SIGN_EXTEND, llvm::ISD::SUB, llvm::ISD::UDIVREM, and llvm::ISD::XOR.
Referenced by LowerOperation(), and llvm::R600TargetLowering::ReplaceNodeResults().
|
protected |
Definition at line 3661 of file AMDGPUISelLowering.cpp.
References assert(), DL, llvm::SelectionDAG::ExtractVectorElements(), llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getNode(), llvm::EVT::getScalarType(), llvm::MVT::getScalarType(), llvm::SelectionDAG::getValueType(), llvm::MVT::getVectorNumElements(), I, llvm::MVT::isVector(), and llvm::ISD::SIGN_EXTEND_INREG.
Referenced by LowerOperation().
|
protected |
Definition at line 3394 of file AMDGPUISelLowering.cpp.
References assert(), DL, llvm::ISD::FP_ROUND, llvm::SelectionDAG::getIntPtrConstant(), llvm::SelectionDAG::getNode(), llvm::AMDGPUSubtarget::has16BitInsts(), LowerINT_TO_FP32(), LowerINT_TO_FP64(), llvm::ISD::SIGN_EXTEND, and llvm::ISD::SINT_TO_FP.
Referenced by LowerOperation().
|
protected |
|
protected |
Definition at line 2231 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ADD, Cond, DL, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getMergeValues(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSetCC(), llvm::TargetLoweringBase::getSetCCResultType(), LowerDIVREM24(), LowerUDIVREM64(), llvm::ISD::MUL, llvm::ISD::MULHU, Results, llvm::ISD::SELECT, llvm::ISD::SETUGE, llvm::ISD::SUB, llvm::AMDGPUISD::URECIP, X, and Y.
Referenced by LowerOperation().
|
protected |
Definition at line 2017 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ADD, llvm::ISD::AND, assert(), llvm::ISD::BITCAST, DL, llvm::ISD::FMA, llvm::ISD::FMAD, llvm::AMDGPUISD::FMAD_FTZ, llvm::ISD::FMUL, llvm::SIModeRegisterDefaults::FP32Denormals, llvm::ISD::FP_TO_UINT, llvm::ISD::FTRUNC, llvm::SelectionDAG::getBitcast(), llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::EVT::getHalfSizedIntegerVT(), llvm::APInt::getHighBitsSet(), llvm::MachineFunction::getInfo(), llvm::SelectionDAG::getMachineFunction(), llvm::SIMachineFunctionInfo::getMode(), llvm::SelectionDAG::getNode(), llvm::DenormalMode::getPreserveSign(), llvm::SelectionDAG::getSelectCC(), llvm::EVT::getSizeInBits(), llvm::SDValue::getValue(), llvm::SelectionDAG::getVTList(), llvm::AMDGPUSubtarget::hasMadMacF32Insts(), llvm::TargetLoweringBase::isTypeLegal(), LHS, llvm::SelectionDAG::MaskedValueIsZero(), llvm::ISD::MUL, llvm::ISD::MULHU, llvm::ISD::OR, llvm::AMDGPUISD::RCP, Results, RHS, llvm::ISD::SETEQ, llvm::ISD::SETNE, llvm::ISD::SETUGE, llvm::ISD::SHL, llvm::SelectionDAG::SplitScalar(), llvm::ISD::SRL, llvm::ISD::SUB, llvm::ISD::UADDO_CARRY, llvm::ISD::UDIV, llvm::ISD::UDIVREM, llvm::ISD::UINT_TO_FP, llvm::ISD::UREM, llvm::ISD::USUBO_CARRY, and llvm::ISD::ZERO_EXTEND.
Referenced by LowerUDIVREM(), and llvm::R600TargetLowering::ReplaceNodeResults().
|
protected |
Definition at line 3348 of file AMDGPUISelLowering.cpp.
References assert(), DL, llvm::ISD::FP_ROUND, llvm::SelectionDAG::getIntPtrConstant(), llvm::SelectionDAG::getNode(), llvm::AMDGPUSubtarget::has16BitInsts(), LowerINT_TO_FP32(), LowerINT_TO_FP64(), llvm::ISD::UINT_TO_FP, and llvm::ISD::ZERO_EXTEND.
Referenced by LowerOperation().
SDValue AMDGPUTargetLowering::lowerUnhandledCall | ( | CallLoweringInfo & | CLI, |
SmallVectorImpl< SDValue > & | InVals, | ||
StringRef | Reason | ||
) | const |
Definition at line 1322 of file AMDGPUISelLowering.cpp.
References llvm::TargetLowering::CallLoweringInfo::Callee, llvm::TargetLowering::CallLoweringInfo::DAG, llvm::LLVMContext::diagnose(), llvm::TargetLowering::CallLoweringInfo::DL, G, llvm::SelectionDAG::getContext(), llvm::SDLoc::getDebugLoc(), llvm::SelectionDAG::getEntryNode(), llvm::MachineFunction::getFunction(), llvm::SelectionDAG::getMachineFunction(), llvm::SelectionDAG::getUNDEF(), llvm::TargetLowering::CallLoweringInfo::Ins, llvm::TargetLowering::CallLoweringInfo::IsTailCall, llvm::SmallVectorTemplateBase< T, bool >::push_back(), and llvm::ISD::InputArg::VT.
Referenced by LowerCall(), and llvm::SITargetLowering::LowerCall().
Definition at line 630 of file AMDGPUISelLowering.cpp.
References llvm::TargetLoweringBase::getTargetMachine(), and Options.
Referenced by performFNegCombine().
|
inlineoverridevirtual |
Allow store merging for the specified type after legalization in addition to before legalization.
This may transform stores that do not exist earlier (for example, stores created from intrinsics).
Reimplemented from llvm::TargetLoweringBase.
Definition at line 291 of file AMDGPUISelLowering.h.
|
staticprotected |
Definition at line 2579 of file AMDGPUISelLowering.cpp.
References llvm::MachineFunction::getDenormalMode(), llvm::SelectionDAG::getMachineFunction(), llvm::APFloatBase::IEEEsingle(), llvm::DenormalMode::Input, llvm::DenormalMode::PreserveSign, and valueIsKnownNeverF32Denorm().
Referenced by getScaledLogInput(), lowerFEXP10Unsafe(), lowerFEXP2(), and lowerFEXPUnsafe().
|
static |
Definition at line 55 of file AMDGPUISelLowering.cpp.
References llvm::SelectionDAG::ComputeMaxSignificantBits().
Referenced by isI24().
|
static |
Definition at line 51 of file AMDGPUISelLowering.cpp.
References llvm::SelectionDAG::computeKnownBits(), and llvm::KnownBits::countMaxActiveBits().
Referenced by isU24().
|
protected |
Definition at line 3904 of file AMDGPUISelLowering.cpp.
References llvm::EVT::bitsGE(), llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::SelectionDAG::getNode(), llvm::SDValue::getOpcode(), llvm::SDValue::getOperand(), N, and llvm::ISD::TRUNCATE.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 4477 of file AMDGPUISelLowering.cpp.
References Cond, llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::AMDGPUISD::FFBH_U32, llvm::AMDGPUISD::FFBL_B32, llvm::isAllOnesConstant(), isCtlzOpc(), isCttzOpc(), llvm::isNullConstant(), LHS, RHS, llvm::ISD::SETEQ, and llvm::ISD::SETNE.
Referenced by performSelectCombine().
|
overridevirtual |
This method will be invoked for all target nodes and for any target-independent nodes that the target has registered to invoke it for.
The semantics are as follows: Return Value: SDValue.Val == 0 - No change was made; SDValue.Val == N - N was replaced, is dead, and is already handled; otherwise - N should be replaced by the returned Operand.
In addition, methods provided by DAGCombinerInfo may be used to perform more complex transformations.
Reimplemented from llvm::TargetLowering.
Reimplemented in llvm::R600TargetLowering, and llvm::SITargetLowering.
Definition at line 5035 of file AMDGPUISelLowering.cpp.
References llvm::APFloat::add(), llvm::AfterLegalizeDAG, assert(), llvm::ISD::AssertSext, llvm::ISD::AssertZext, llvm::AMDGPUISD::BFE_I32, llvm::AMDGPUISD::BFE_U32, llvm::ISD::BITCAST, llvm::ISD::BUILD_VECTOR, llvm::CallingConv::C, llvm::TargetLowering::DAGCombinerInfo::CommitTargetLoweringOpt(), llvm::SelectionDAG::ComputeNumSignBits(), llvm::TargetLowering::DAGCombinerInfo::DAG, DL, llvm::ISD::FABS, llvm::AMDGPUISD::FMAD_FTZ, llvm::ISD::FNEG, llvm::APInt::getBitsSet(), llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getConstantFP(), llvm::SelectionDAG::getContext(), llvm::TargetLowering::DAGCombinerInfo::getDAGCombineLevel(), llvm::EVT::getIntegerVT(), llvm::SelectionDAG::getNode(), llvm::EVT::getSizeInBits(), llvm::SelectionDAG::getTargetLoweringInfo(), llvm::ConstantFPSDNode::getValueAPF(), llvm::SelectionDAG::getValueType(), llvm::EVT::getVectorElementType(), llvm::EVT::getVectorNumElements(), llvm::SelectionDAG::getZeroExtendInReg(), llvm::APInt::getZExtValue(), llvm::ConstantSDNode::getZExtValue(), llvm::SDValue::hasOneUse(), llvm::AMDGPUSubtarget::hasSDWA(), llvm::Hi_32(), I, llvm::ISD::INTRINSIC_WO_CHAIN, llvm::TargetLowering::DAGCombinerInfo::isBeforeLegalize(), llvm::TargetLowering::DAGCombinerInfo::isBeforeLegalizeOps(), llvm::TargetLoweringBase::isOperationLegal(), llvm::EVT::isVector(), llvm::Lo_32(), llvm::ISD::LOAD, llvm::ISD::MUL, llvm::AMDGPUISD::MUL_I24, llvm::AMDGPUISD::MUL_U24, llvm::AMDGPUISD::MULHI_I24, llvm::AMDGPUISD::MULHI_U24, llvm::ISD::MULHS, llvm::ISD::MULHU, llvm::APFloat::multiply(), N, llvm::Offset, performAssertSZExtCombine(), performFAbsCombine(), performFNegCombine(), performIntrinsicWOChainCombine(), performLoadCombine(), performMulCombine(), performMulhsCombine(), performMulhuCombine(), performMulLoHiCombine(), performRcpCombine(), performSelectCombine(), performShlCombine(), performSraCombine(), performSrlCombine(), performStoreCombine(), performTruncateCombine(), 
llvm::SmallVectorTemplateBase< T, bool >::push_back(), llvm::AMDGPUISD::RCP, llvm::AMDGPUISD::RCP_IFLAG, llvm::APFloatBase::rmNearestTiesToEven, llvm::ISD::SELECT, llvm::ISD::SHL, llvm::TargetLowering::ShrinkDemandedConstant(), llvm::ISD::SIGN_EXTEND_INREG, Signed, llvm::TargetLowering::SimplifyDemandedBits(), simplifyMul24(), llvm::ISD::SMUL_LOHI, llvm::ISD::SRA, llvm::ISD::SRL, llvm::ISD::STORE, llvm::ISD::TRUNCATE, and llvm::ISD::UMUL_LOHI.
Referenced by llvm::R600TargetLowering::PerformDAGCombine(), and llvm::SITargetLowering::PerformDAGCombine().
|
protected |
Definition at line 4998 of file AMDGPUISelLowering.cpp.
References llvm::ISD::AND, assert(), llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::ISD::FP16_TO_FP, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getNode(), llvm::SDValue::getOpcode(), llvm::SDValue::getOperand(), llvm::AMDGPUSubtarget::has16BitInsts(), llvm::SDValue::hasOneUse(), and N.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 4736 of file AMDGPUISelLowering.cpp.
References llvm::TargetLowering::DAGCombinerInfo::AddToWorklist(), llvm::SmallVectorTemplateCommon< T, typename >::back(), llvm::ISD::BITCAST, llvm::ISD::BUILD_VECTOR, llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::ISD::FADD, llvm::ISD::FCANONICALIZE, llvm::ISD::FMA, llvm::ISD::FMAD, llvm::AMDGPUISD::FMAX_LEGACY, llvm::ISD::FMAXIMUM, llvm::ISD::FMAXNUM, llvm::ISD::FMAXNUM_IEEE, llvm::AMDGPUISD::FMED3, llvm::AMDGPUISD::FMIN_LEGACY, llvm::ISD::FMINIMUM, llvm::ISD::FMINNUM, llvm::ISD::FMINNUM_IEEE, llvm::ISD::FMUL, llvm::AMDGPUISD::FMUL_LEGACY, llvm::ISD::FNEARBYINT, llvm::ISD::FNEG, fnegFoldsIntoOp(), llvm::ISD::FP16_TO_FP, llvm::ISD::FP_EXTEND, llvm::ISD::FP_ROUND, llvm::ISD::FRINT, llvm::ISD::FROUNDEVEN, llvm::ISD::FSIN, llvm::ISD::FTRUNC, llvm::SelectionDAG::getConstant(), llvm::SDNode::getFlags(), llvm::SDValue::getNode(), llvm::SelectionDAG::getNode(), llvm::SDValue::getNumOperands(), llvm::SDValue::getOpcode(), llvm::SDValue::getOperand(), llvm::SDNode::getOperand(), llvm::EVT::getSizeInBits(), llvm::SDValue::getValueType(), llvm::SDValue::hasOneUse(), I, inverseMinMax(), isConstantCostlierToNegate(), LHS, mayIgnoreSignedZero(), N, llvm::SDNode::ops(), llvm::AMDGPUISD::RCP, llvm::AMDGPUISD::RCP_IFLAG, llvm::AMDGPUISD::RCP_LEGACY, llvm::SelectionDAG::ReplaceAllUsesWith(), RHS, llvm::ISD::SELECT, shouldFoldFNegIntoSrc(), llvm::AMDGPUISD::SIN_HW, llvm::SDNode::uses(), and llvm::ISD::XOR.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 3927 of file AMDGPUISelLowering.cpp.
References llvm::TargetLowering::DAGCombinerInfo::DAG, N, peekFPSignOps(), simplifyMul24(), and llvm::SelectionDAG::UpdateNodeOperands().
Referenced by PerformDAGCombine().
|
protected |
Definition at line 3794 of file AMDGPUISelLowering.cpp.
References llvm::TargetLoweringBase::allowsMisalignedMemoryAccesses(), llvm::ISD::BITCAST, llvm::TargetLowering::DAGCombinerInfo::CombineTo(), llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::TargetLowering::expandUnalignedLoad(), llvm::MemSDNode::getAddressSpace(), llvm::MemSDNode::getAlign(), llvm::LoadSDNode::getBasePtr(), llvm::MemSDNode::getChain(), llvm::SelectionDAG::getContext(), getEquivalentMemType(), llvm::MachineMemOperand::getFlags(), llvm::SelectionDAG::getLoad(), llvm::MemSDNode::getMemOperand(), llvm::MemSDNode::getMemoryVT(), llvm::SelectionDAG::getMergeValues(), llvm::SelectionDAG::getNode(), llvm::EVT::getStoreSize(), llvm::SDValue::getValue(), hasVolatileUser(), llvm::TargetLowering::DAGCombinerInfo::isBeforeLegalize(), llvm::ISD::isNormalLoad(), llvm::MemSDNode::isSimple(), llvm::TargetLoweringBase::isTypeLegal(), llvm::EVT::isVector(), N, shouldCombineMemoryType(), Size, and SplitVectorLoad().
Referenced by PerformDAGCombine().
|
protected |
Definition at line 4256 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ADD, llvm::all_of(), llvm::ISD::ANY_EXTEND, assert(), llvm::EVT::bitsLE(), llvm::TargetLowering::DAGCombinerInfo::DAG, DL, getAddOneOp(), getMul24(), llvm::SelectionDAG::getNode(), llvm::SDValue::getOpcode(), llvm::SDValue::getOperand(), llvm::EVT::getScalarType(), llvm::SelectionDAG::getSExtOrTrunc(), llvm::EVT::getSizeInBits(), llvm::SelectionDAG::getZExtOrTrunc(), llvm::AMDGPUSubtarget::has16BitInsts(), llvm::AMDGPUSubtarget::hasMulI24(), llvm::AMDGPUSubtarget::hasMulU24(), isI24(), isU24(), llvm::EVT::isVector(), llvm::Mul, llvm::ISD::MUL, N, and Size.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 4384 of file AMDGPUISelLowering.cpp.
References llvm::TargetLowering::DAGCombinerInfo::AddToWorklist(), llvm::TargetLowering::DAGCombinerInfo::DAG, DL, llvm::SDValue::getNode(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSExtOrTrunc(), llvm::AMDGPUSubtarget::hasMulI24(), llvm::AMDGPUSubtarget::hasSMulHi(), isI24(), llvm::EVT::isVector(), llvm::AMDGPUISD::MULHI_I24, and N.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 4417 of file AMDGPUISelLowering.cpp.
References llvm::TargetLowering::DAGCombinerInfo::AddToWorklist(), llvm::TargetLowering::DAGCombinerInfo::DAG, DL, llvm::SDValue::getNode(), llvm::SelectionDAG::getNode(), llvm::EVT::getSizeInBits(), llvm::SelectionDAG::getZExtOrTrunc(), llvm::AMDGPUSubtarget::hasMulU24(), llvm::AMDGPUSubtarget::hasSMulHi(), isU24(), llvm::EVT::isVector(), llvm::AMDGPUISD::MULHI_U24, and N.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 4341 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ANY_EXTEND, llvm::TargetLowering::DAGCombinerInfo::CombineTo(), llvm::TargetLowering::DAGCombinerInfo::DAG, DL, llvm::SelectionDAG::getNode(), llvm::SDValue::getOpcode(), llvm::SDValue::getOperand(), llvm::SelectionDAG::getSExtOrTrunc(), llvm::SelectionDAG::getZExtOrTrunc(), llvm::AMDGPUSubtarget::hasMulI24(), llvm::AMDGPUSubtarget::hasMulU24(), llvm::Hi, isI24(), isU24(), llvm::Lo, llvm::AMDGPUISD::MUL_I24, llvm::AMDGPUISD::MUL_U24, llvm::AMDGPUISD::MULHI_I24, llvm::AMDGPUISD::MULHI_U24, and N.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 5023 of file AMDGPUISelLowering.cpp.
References llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::SelectionDAG::getConstantFP(), llvm::APFloat::getSemantics(), and N.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 4611 of file AMDGPUISelLowering.cpp.
References CC, combineFMinMaxLegacy(), Cond, llvm::TargetLowering::DAGCombinerInfo::DAG, foldFreeOpFromSelect(), llvm::get(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getSetCC(), llvm::AMDGPUSubtarget::hasFminFmaxLegacy(), llvm::SelectionDAG::isConstantValueOfAnyType(), LHS, N, performCtlz_CttzCombine(), RHS, llvm::ISD::SELECT, and llvm::ISD::SETCC.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 3986 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ANY_EXTEND, llvm::ISD::BITCAST, llvm::ISD::BUILD_VECTOR, llvm::SelectionDAG::computeKnownBits(), llvm::KnownBits::countMinLeadingZeros(), llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getZExtOrTrunc(), llvm::TargetLoweringBase::isOperationLegal(), LHS, llvm::Lo, N, RHS, llvm::ISD::SHL, llvm::ISD::SIGN_EXTEND, llvm::ISD::TRUNCATE, X, and llvm::ISD::ZERO_EXTEND.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 4054 of file AMDGPUISelLowering.cpp.
References llvm::ISD::BITCAST, llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getConstant(), getHiHalf64(), llvm::SelectionDAG::getNode(), llvm::Hi, N, RHS, and llvm::ISD::SRA.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 4089 of file AMDGPUISelLowering.cpp.
References llvm::ISD::AND, llvm::ISD::BITCAST, llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getConstant(), getHiHalf64(), llvm::SelectionDAG::getNode(), llvm::Hi, LHS, N, RHS, and llvm::ISD::SRL.
Referenced by PerformDAGCombine().
|
protected |
Definition at line 3847 of file AMDGPUISelLowering.cpp.
References llvm::TargetLoweringBase::allowsMisalignedMemoryAccesses(), llvm::ISD::BITCAST, llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::TargetLowering::expandUnalignedStore(), llvm::MemSDNode::getAddressSpace(), llvm::MemSDNode::getAlign(), llvm::StoreSDNode::getBasePtr(), llvm::MemSDNode::getChain(), llvm::SelectionDAG::getContext(), getEquivalentMemType(), llvm::MachineMemOperand::getFlags(), llvm::MemSDNode::getMemOperand(), llvm::MemSDNode::getMemoryVT(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getStore(), llvm::EVT::getStoreSize(), llvm::StoreSDNode::getValue(), llvm::SDValue::hasOneUse(), llvm::TargetLowering::DAGCombinerInfo::isBeforeLegalize(), llvm::ISD::isNormalStore(), llvm::MemSDNode::isSimple(), llvm::TargetLoweringBase::isTypeLegal(), llvm::EVT::isVector(), N, llvm::SelectionDAG::ReplaceAllUsesOfValueWith(), shouldCombineMemoryType(), Size, and SplitVectorStore().
Referenced by PerformDAGCombine().
|
protected |
Definition at line 4137 of file AMDGPUISelLowering.cpp.
References llvm::TargetLowering::DAGCombinerInfo::AddToWorklist(), llvm::ISD::BITCAST, llvm::ISD::BUILD_VECTOR, llvm::EVT::changeTypeToInteger(), llvm::SelectionDAG::computeKnownBits(), llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::EVT::getFixedSizeInBits(), llvm::KnownBits::getMaxValue(), llvm::SDValue::getNode(), llvm::SelectionDAG::getNode(), llvm::SDValue::getOpcode(), llvm::SDValue::getOperand(), llvm::EVT::getScalarSizeInBits(), llvm::TargetLoweringBase::getShiftAmountTy(), llvm::SDValue::getValueType(), llvm::EVT::getVectorNumElements(), llvm::EVT::getVectorVT(), llvm::SelectionDAG::getZExtOrTrunc(), llvm::isConstOrConstSplat(), llvm::EVT::isFloatingPoint(), llvm::EVT::isVector(), N, llvm::ISD::SHL, llvm::ISD::SRA, llvm::ISD::SRL, stripBitcast(), llvm::ISD::TRUNCATE, and llvm::APInt::ule().
Referenced by PerformDAGCombine().
|
pure virtual |
Implemented in llvm::SITargetLowering.
|
overridevirtual |
This callback is invoked when a node result type is illegal for the target, and the operation was registered to use 'custom' lowering for that result type.
The target places new result values for the node in Results (their number and types must exactly match those of the original return values of the node), or leaves Results empty, which indicates that the node is not to be custom lowered after all.
If the target has no operations that require custom lowering, it need not implement this. The default implementation aborts.
Reimplemented from llvm::TargetLowering.
Reimplemented in llvm::R600TargetLowering, and llvm::SITargetLowering.
Definition at line 1413 of file AMDGPUISelLowering.cpp.
References llvm::ISD::CTLZ, llvm::ISD::CTLZ_ZERO_UNDEF, llvm::ISD::FEXP, llvm::ISD::FEXP10, llvm::ISD::FEXP2, llvm::ISD::FLOG, llvm::ISD::FLOG10, llvm::ISD::FLOG2, lowerCTLZResults(), lowerFEXP(), lowerFEXP2(), LowerFLOG2(), LowerFLOGCommon(), N, Results, and llvm::ISD::SIGN_EXTEND_INREG.
Referenced by llvm::R600TargetLowering::ReplaceNodeResults(), and llvm::SITargetLowering::ReplaceNodeResults().
|
inlineoverridevirtual |
Returns how the given (atomic) load should be cast by the IR-level AtomicExpand pass.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 235 of file AMDGPUISelLowering.h.
References llvm::TargetLoweringBase::None.
|
inlineoverridevirtual |
Returns how the given atomicrmw should be cast by the IR-level AtomicExpand pass.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 243 of file AMDGPUISelLowering.h.
References llvm::TargetLoweringBase::None.
|
inlineoverridevirtual |
Returns how the given (atomic) store should be cast by the IR-level AtomicExpand pass.
For instance AtomicExpansionKind::CastToInteger will try to cast the operands to integer values.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 239 of file AMDGPUISelLowering.h.
References llvm::TargetLoweringBase::None.
Definition at line 3773 of file AMDGPUISelLowering.cpp.
References llvm::EVT::getScalarType(), llvm::EVT::getStoreSize(), llvm::EVT::isByteSized(), llvm::TargetLoweringBase::isTypeLegal(), llvm::EVT::isVector(), and Size.
Referenced by performLoadCombine(), and performStoreCombine().
Definition at line 4717 of file AMDGPUISelLowering.cpp.
References allUsesHaveSourceMods(), fnegFoldsIntoOp(), llvm::SDValue::getNode(), llvm::SDValue::hasOneUse(), and N.
Referenced by performFNegCombine().
|
overridevirtual |
Return true if it is profitable to reduce a load to a smaller type.
Example: (i16 (trunc (i32 (load x)))) -> i16 load x
Reimplemented from llvm::TargetLoweringBase.
Definition at line 817 of file AMDGPUISelLowering.cpp.
References llvm::AMDGPUAS::CONSTANT_ADDRESS, llvm::AMDGPUAS::CONSTANT_ADDRESS_32BIT, llvm::MemSDNode::getAddressSpace(), llvm::getAlign(), llvm::MemSDNode::getMemOperand(), llvm::EVT::getStoreSizeInBits(), llvm::AMDGPUAS::GLOBAL_ADDRESS, llvm::MemSDNode::isInvariant(), llvm::AMDGPUInstrInfo::isUniformMMO(), N, and llvm::TargetLoweringBase::shouldReduceLoadWidth().
If true, then instruction selection should seek to shrink the FP constant of the specified type to a smaller type in order to save space and / or reduce runtime.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 812 of file AMDGPUISelLowering.cpp.
References llvm::EVT::getScalarType().
|
overridevirtual |
Whether it is profitable to sink the operands of an Instruction I to the basic block of I.
This helps using several modifiers (like abs and neg) more often.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 6004 of file AMDGPUISelLowering.cpp.
References llvm::any_of(), llvm::SmallVectorBase< Size_T >::empty(), I, llvm::PatternMatch::m_FAbs(), llvm::PatternMatch::m_FNeg(), llvm::PatternMatch::m_Value(), llvm::PatternMatch::match(), and llvm::SmallVectorTemplateBase< T, bool >::push_back().
|
protected |
Return 64-bit value Op as two 32-bit integers.
Definition at line 1700 of file AMDGPUISelLowering.cpp.
References llvm::ISD::BITCAST, llvm::ISD::EXTRACT_VECTOR_ELT, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getNode(), llvm::Hi, and llvm::Lo.
Referenced by LowerCTLZ_CTTZ(), LowerINT_TO_FP32(), LowerINT_TO_FP64(), and splitBinaryBitConstantOpImpl().
|
protected |
Split the 64-bit value LHS into two 32-bit components, and perform the binary operation Opc on it with the corresponding constant operands.
Definition at line 3963 of file AMDGPUISelLowering.cpp.
References llvm::TargetLowering::DAGCombinerInfo::AddToWorklist(), llvm::ISD::BITCAST, llvm::TargetLowering::DAGCombinerInfo::DAG, llvm::SelectionDAG::getBuildVector(), llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getNode(), llvm::Hi, LHS, llvm::Lo, and split64BitValue().
|
protected |
Split a vector value into two parts of types LoVT and HiVT.
HiVT could be scalar.
Definition at line 1749 of file AMDGPUISelLowering.cpp.
References assert(), DL, llvm::ISD::EXTRACT_SUBVECTOR, llvm::ISD::EXTRACT_VECTOR_ELT, llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getVectorIdxConstant(), llvm::EVT::getVectorNumElements(), llvm::Hi, llvm::EVT::isVector(), llvm::Lo, and N.
Referenced by SplitVectorLoad(), and SplitVectorStore().
|
protected |
Split a vector load into 2 loads of half the vector.
Definition at line 1764 of file AMDGPUISelLowering.cpp.
References llvm::commonAlignment(), llvm::ISD::CONCAT_VECTORS, llvm::SelectionDAG::getExtLoad(), llvm::TypeSize::getFixed(), llvm::SelectionDAG::getMergeValues(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getObjectPtrOffset(), getSplitDestVTs(), llvm::EVT::getStoreSize(), llvm::SelectionDAG::getUNDEF(), llvm::SDValue::getValue(), llvm::SelectionDAG::getVectorIdxConstant(), llvm::EVT::getVectorNumElements(), llvm::MachinePointerInfo::getWithOffset(), llvm::Hi, llvm::ISD::INSERT_SUBVECTOR, llvm::ISD::INSERT_VECTOR_ELT, llvm::EVT::isVector(), llvm::Lo, llvm::TargetLowering::scalarizeVectorLoad(), Size, splitVector(), and llvm::ISD::TokenFactor.
Referenced by performLoadCombine(), and WidenOrSplitVectorLoad().
|
protected |
Split a vector store into 2 stores of half the vector.
Definition at line 1858 of file AMDGPUISelLowering.cpp.
References llvm::commonAlignment(), llvm::SelectionDAG::getNode(), llvm::SelectionDAG::getObjectPtrOffset(), getSplitDestVTs(), llvm::EVT::getStoreSize(), llvm::SelectionDAG::getTruncStore(), llvm::SDValue::getValueType(), llvm::EVT::getVectorNumElements(), llvm::MachinePointerInfo::getWithOffset(), llvm::Hi, llvm::Lo, llvm::TargetLowering::scalarizeVectorStore(), Size, splitVector(), and llvm::ISD::TokenFactor.
Referenced by performStoreCombine().
|
overridevirtual |
Return true if it is expected to be cheaper to do a store of a vector constant with the given size and type for the address space than to store the individual scalar element constants.
Reimplemented from llvm::TargetLoweringBase.
Definition at line 959 of file AMDGPUISelLowering.cpp.
SDValue AMDGPUTargetLowering::storeStackInputValue | ( | SelectionDAG & | DAG, |
const SDLoc & | SL, | ||
SDValue | Chain, | ||
SDValue | ArgVal, | ||
int64_t | Offset | ||
) | const |
Definition at line 5334 of file AMDGPUISelLowering.cpp.
References llvm::ISD::ADD, llvm::SelectionDAG::getConstant(), llvm::SelectionDAG::getCopyFromReg(), llvm::MachineFunction::getInfo(), llvm::SelectionDAG::getMachineFunction(), llvm::SelectionDAG::getNode(), llvm::MachinePointerInfo::getStack(), llvm::SelectionDAG::getStore(), Info, llvm::MachineMemOperand::MODereferenceable, llvm::Offset, and Ptr.
Referenced by llvm::SITargetLowering::passSpecialInputs().
Definition at line 184 of file AMDGPUISelLowering.h.
References llvm::ISD::BITCAST, llvm::SDValue::getOpcode(), and llvm::SDValue::getOperand().
Referenced by findMemSDNode(), and performTruncateCombine().
|
protected |
Widen a suitably aligned v3 load.
For all other cases, split the input vector load.
Definition at line 1824 of file AMDGPUISelLowering.cpp.
References assert(), llvm::ISD::EXTRACT_SUBVECTOR, llvm::SelectionDAG::getContext(), llvm::SelectionDAG::getDataLayout(), llvm::SelectionDAG::getExtLoad(), llvm::SelectionDAG::getMergeValues(), llvm::SelectionDAG::getNode(), llvm::SDValue::getValue(), llvm::EVT::getVectorElementType(), llvm::SelectionDAG::getVectorIdxConstant(), llvm::EVT::getVectorNumElements(), llvm::EVT::getVectorVT(), llvm::MachinePointerInfo::isDereferenceable(), and SplitVectorLoad().