doxygen/NVPTXISelLowering_8h_source.html

//===-- NVPTXISelLowering.h - NVPTX DAG Lowering Interface ------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file defines the interfaces that NVPTX uses to lower LLVM code into a

// selection DAG.

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_NVPTX_NVPTXISELLOWERING_H

#define LLVM_LIB_TARGET_NVPTX_NVPTXISELLOWERING_H


#include "NVPTX.h"

#include "llvm/CodeGen/SelectionDAG.h"

#include "llvm/CodeGen/TargetLowering.h"


namespace llvm {

/// Target-specific SelectionDAG node opcodes for the NVPTX backend.
namespace NVPTXISD {

/// NVPTX DAG node kinds.
///
/// Only FIRST_NUMBER, LoadV2 and LAST_MEMORY_OPCODE have explicit
/// initializers; every other enumerator takes the previous value plus one.
/// Inserting, removing or reordering enumerators therefore renumbers all the
/// ones that follow.
enum NodeType : unsigned {

  // Start the numbering from where ISD NodeType finishes.

  FIRST_NUMBER = ISD::BUILTIN_OP_END,

  Wrapper,

  CALL,

  RET_GLUE,

  LOAD_PARAM, // NOTE: a distinct enumerator from LoadParam further below.

  DeclareParam,

  DeclareScalarParam,

  DeclareRetParam,

  DeclareRet,

  DeclareScalarRet,

  PrintCall,

  PrintConvergentCall,

  PrintCallUni,

  PrintConvergentCallUni,

  CallArgBegin,

  CallArg,

  LastCallArg,

  CallArgEnd,

  CallVoid,

  CallVal,

  CallSymbol,

  Prototype,

  MoveParam,

  PseudoUseParam,

  RETURN,

  CallSeqBegin,

  CallSeqEnd,

  CallPrototype,

  ProxyReg,

  FSHL_CLAMP,

  FSHR_CLAMP,

  MUL_WIDE_SIGNED,

  MUL_WIDE_UNSIGNED,

  SETP_F16X2,

  SETP_BF16X2,

  BFE,

  BFI,

  PRMT,

  FCOPYSIGN,

  DYNAMIC_STACKALLOC,

  STACKRESTORE,

  STACKSAVE,

  BrxStart,

  BrxItem,

  BrxEnd,

  Dummy,


  // Range markers: FIRST_MEMORY_OPCODE takes the next sequential value after
  // Dummy, and LoadV2 is pinned to that same value, so the contiguous range
  // [FIRST_MEMORY_OPCODE, LAST_MEMORY_OPCODE] is exactly LoadV2..StoreRetvalV4.
  // NOTE(review): presumably these are the opcodes whose nodes carry a memory
  // operand -- confirm against the users of the two markers.
  FIRST_MEMORY_OPCODE,

  LoadV2 = FIRST_MEMORY_OPCODE,

  LoadV4,

  LDUV2, // LDU.v2

  LDUV4, // LDU.v4

  StoreV2,

  StoreV4,

  LoadParam,

  LoadParamV2,

  LoadParamV4,

  StoreParam,

  StoreParamV2,

  StoreParamV4,

  StoreParamS32, // to sext and store a <32bit value, not used currently

  StoreParamU32, // to zext and store a <32bit value, not used currently

  StoreRetval,

  StoreRetvalV2,

  StoreRetvalV4,

  // Must alias the last enumerator of the range; update this initializer if
  // an opcode is ever appended after StoreRetvalV4.
  LAST_MEMORY_OPCODE = StoreRetvalV4,

};

} // namespace NVPTXISD


class NVPTXSubtarget;


//===--------------------------------------------------------------------===//

// TargetLowering Implementation

//===--------------------------------------------------------------------===//

/// NVPTX implementation of the TargetLowering interface: the hooks used to
/// lower LLVM code into a selection DAG for this target. Most members are
/// only declared here and defined out of line; the members with inline bodies
/// below return fixed answers or simple type computations.
class NVPTXTargetLowering : public TargetLowering {

public:

  /// Builds the lowering object from the target machine \p TM and the
  /// subtarget \p STI.
  explicit NVPTXTargetLowering(const NVPTXTargetMachine &TM,

                               const NVPTXSubtarget &STI);

  /// TargetLowering callback invoked for operations that are unsupported by
  /// the target.
  SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;


  SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const;


  /// Returns the name of a target-specific DAG node.
  const char *getTargetNodeName(unsigned Opcode) const override;


  /// Given an intrinsic, checks whether on this target it needs to map to a
  /// MemIntrinsicNode.
  bool getTgtMemIntrinsic(IntrinsicInfo &Info, const CallInst &I,

                          MachineFunction &MF,

                          unsigned Intrinsic) const override;


  Align getFunctionArgumentAlignment(const Function *F, Type *Ty, unsigned Idx,

                                     const DataLayout &DL) const;


  /// getFunctionParamOptimizedAlign - since function arguments are passed via

  /// .param space, we may want to increase their alignment in a way that

  /// ensures that we can effectively vectorize their loads & stores. We can

  /// increase alignment only if the function has internal or private

  /// linkage, as for other linkage types callers may already rely on default

  /// alignment. To allow using 128-bit vectorized loads/stores, this function

  /// ensures that alignment is 16 or greater.

  Align getFunctionParamOptimizedAlign(const Function *F, Type *ArgTy,

                                       const DataLayout &DL) const;


  /// Helper for computing alignment of a device function byval parameter.

  Align getFunctionByValParamAlign(const Function *F, Type *ArgTy,

                                   Align InitialAlign,

                                   const DataLayout &DL) const;


  // Helper for getting a function parameter name. Name is composed from

  // its index and the function name. Negative index corresponds to special

  // parameter (unsized array) used for passing variable arguments.

  std::string getParamName(const Function *F, int Idx) const;


  /// isLegalAddressingMode - Return true if the addressing mode represented

  /// by AM is legal for this target, for a load/store of the specified type.

  /// Used to guide target-specific optimizations, like loop strength

  /// reduction (LoopStrengthReduce.cpp) and memory optimization for

  /// address mode (CodeGenPrepare.cpp).

  bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM, Type *Ty,

                             unsigned AS,

                             Instruction *I = nullptr) const override;


  /// Reports a truncation as free only when both types are integers, the
  /// source is 64 bits wide and the destination is 32 bits wide; every other
  /// combination returns false.
  bool isTruncateFree(Type *SrcTy, Type *DstTy) const override {

    // Truncating 64-bit to 32-bit is free in SASS.

    if (!SrcTy->isIntegerTy() || !DstTy->isIntegerTy())

      return false;

    return SrcTy->getPrimitiveSizeInBits() == 64 &&

           DstTy->getPrimitiveSizeInBits() == 32;

  }


  /// Result type of a SETCC: i1 for non-vector \p VT, otherwise a vector of
  /// i1 with the same number of elements as \p VT. \p DL is not consulted.
  EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Ctx,

                         EVT VT) const override {

    if (VT.isVector())

      return EVT::getVectorVT(Ctx, MVT::i1, VT.getVectorNumElements());

    return MVT::i1;

  }


  /// Given a constraint letter, returns the type of constraint it is for this
  /// target.
  ConstraintType getConstraintType(StringRef Constraint) const override;

  std::pair<unsigned, const TargetRegisterClass *>

  getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI,

                               StringRef Constraint, MVT VT) const override;


  /// Lowers the incoming (formal) arguments described by \p Ins.
  SDValue LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv,

                               bool isVarArg,

                               const SmallVectorImpl<ISD::InputArg> &Ins,

                               const SDLoc &dl, SelectionDAG &DAG,

                               SmallVectorImpl<SDValue> &InVals) const override;


  /// Lowers a call into the DAG described by \p CLI.
  SDValue LowerCall(CallLoweringInfo &CLI,

                    SmallVectorImpl<SDValue> &InVals) const override;


  SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerSTACKSAVE(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerSTACKRESTORE(SDValue Op, SelectionDAG &DAG) const;


  // NOTE(review): the unnamed Type*, ArgListTy and OutputArg parameters are
  // presumably the return type, the call arguments and the outgoing argument
  // descriptors -- confirm against the definition in NVPTXISelLowering.cpp.
  std::string

  getPrototype(const DataLayout &DL, Type *, const ArgListTy &,

               const SmallVectorImpl<ISD::OutputArg> &, MaybeAlign retAlignment,

               std::optional<std::pair<unsigned, const APInt &>> VAInfo,

               const CallBase &CB, unsigned UniqueCallSite) const;


  /// Lowers the outgoing return values described by \p Outs.
  SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,

                      const SmallVectorImpl<ISD::OutputArg> &Outs,

                      const SmallVectorImpl<SDValue> &OutVals, const SDLoc &dl,

                      SelectionDAG &DAG) const override;


  /// Lowers the specified operand into the \p Ops vector.
  void LowerAsmOperandForConstraint(SDValue Op, StringRef Constraint,

                                    std::vector<SDValue> &Ops,

                                    SelectionDAG &DAG) const override;


  // Public raw pointer to the target machine.
  // NOTE(review): presumably initialized from the constructor's TM argument;
  // confirm in the .cpp before relying on it being non-null.
  const NVPTXTargetMachine *nvTM;


  // PTX always uses 32-bit shift amounts

  MVT getScalarShiftAmountTy(const DataLayout &, EVT) const override {

    return MVT::i32;

  }


  /// Returns the preferred vector type legalization action for \p VT.
  TargetLoweringBase::LegalizeTypeAction

  getPreferredVectorAction(MVT VT) const override;


  // Get the degree of precision we want from 32-bit floating point division

  // operations.

  //

  //  0 - Use ptx div.approx

  //  1 - Use ptx div.full (approximate, but less so than div.approx)

  //  2 - Use IEEE-compliant div instructions, if available.

  int getDivF32Level() const;


  // Get whether we should use a precise or approximate 32-bit floating point

  // sqrt instruction.

  bool usePrecSqrtF32() const;


  // Get whether we should use instructions that flush floating-point denormals

  // to sign-preserving zero.

  bool useF32FTZ(const MachineFunction &MF) const;


  /// Hook for building estimates in place of slower square roots.
  SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled,

                          int &ExtraSteps, bool &UseOneConst,

                          bool Reciprocal) const override;


  // Always answers 2.
  // NOTE(review): presumably the minimum number of FDIVs sharing a divisor
  // before they are combined -- confirm against the TargetLowering docs.
  unsigned combineRepeatedFPDivisors() const override { return 2; }


  bool allowFMA(MachineFunction &MF, CodeGenOptLevel OptLevel) const;

  bool allowUnsafeFPMath(MachineFunction &MF) const;


  // Unconditionally reports FMA as faster than a separate fmul + fadd; the
  // function and value type arguments are ignored.
  bool isFMAFasterThanFMulAndFAdd(const MachineFunction &MF,

                                  EVT) const override {

    return true;

  }


  // The default is the same as pointer type, but brx.idx only accepts i32

  MVT getJumpTableRegTy(const DataLayout &) const override { return MVT::i32; }


  /// Returns the entry encoding for a jump table in the current function.
  unsigned getJumpTableEncoding() const override;


  // Unconditionally requests aggressive FMA fusion; VT is ignored.
  bool enableAggressiveFMAFusion(EVT VT) const override { return true; }


  // The default is to transform llvm.ctlz(x, false) (where false indicates that

  // x == 0 is not undefined behavior) into a branch that checks whether x is 0

  // and avoids calling ctlz in that case.  We have a dedicated ctlz

  // instruction, so we say that ctlz is cheap to speculate.

  bool isCheapToSpeculateCtlz(Type *Ty) const override { return true; }


  // Atomic loads are never cast by the IR-level AtomicExpand pass.
  AtomicExpansionKind shouldCastAtomicLoadInIR(LoadInst *LI) const override {

    return AtomicExpansionKind::None;

  }


  // Atomic stores are never cast by the IR-level AtomicExpand pass.
  AtomicExpansionKind shouldCastAtomicStoreInIR(StoreInst *SI) const override {

    return AtomicExpansionKind::None;

  }


  /// Returns how the IR-level AtomicExpand pass should expand the given
  /// AtomicRMW, if at all.
  AtomicExpansionKind

  shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;


  bool aggressivelyPreferBuildVectorSources(EVT VecVT) const override {

    // There's rarely any point of packing something into a vector type if we

    // already have the source data.

    return true;

  }


private:

  // Held by reference, so the subtarget object must outlive this lowering
  // object.
  const NVPTXSubtarget &STI; // cache the subtarget here

  SDValue getParamSymbol(SelectionDAG &DAG, int idx, EVT) const;


  // Per-operation lowering helpers.
  // NOTE(review): presumably dispatched from LowerOperation -- confirm in
  // NVPTXISelLowering.cpp.
  SDValue LowerBITCAST(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerFCOPYSIGN(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerFROUND(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerFROUND32(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerFROUND64(SDValue Op, SelectionDAG &DAG) const;


  SDValue PromoteBinOpIfF32FTZ(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerFP_ROUND(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerFP_EXTEND(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerLOAD(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerLOADi1(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerSTOREi1(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerSTOREVector(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerShiftRightParts(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerShiftLeftParts(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerSelect(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerBR_JT(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerVAARG(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerVASTART(SDValue Op, SelectionDAG &DAG) const;


  SDValue LowerCopyToReg_128(SDValue Op, SelectionDAG &DAG) const;

  // The overrides below are private in this class; they stay callable through
  // a TargetLowering reference or pointer because access is checked against
  // the static type used at the call site.
  unsigned getNumRegisters(LLVMContext &Context, EVT VT,

                           std::optional<MVT> RegisterVT) const override;

  bool

  splitValueIntoRegisterParts(SelectionDAG &DAG, const SDLoc &DL, SDValue Val,

                              SDValue *Parts, unsigned NumParts, MVT PartVT,

                              std::optional<CallingConv::ID> CC) const override;


  void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue> &Results,

                          SelectionDAG &DAG) const override;

  SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;


  // Call-site counterpart of getFunctionArgumentAlignment: takes the call
  // (CallBase) instead of the callee Function.
  Align getArgumentAlignment(const CallBase *CB, Type *Ty, unsigned Idx,

                             const DataLayout &DL) const;

};


} // namespace llvm


#endif

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

Results
Function Alias Analysis Results
Definition: AliasAnalysis.cpp:731

Info
Analysis containing CSE Info
Definition: CSEInfo.cpp:27

Idx
Returns the sub type a function will return at a given Idx. Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx.
Definition: DeadArgumentElimination.cpp:353

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

TRI
unsigned const TargetRegisterInfo * TRI
Definition: MachineSink.cpp:2029

NVPTX.h

CC
auto CC
Definition: RISCVRedundantCopyElimination.cpp:79

SelectionDAG.h

TargetLowering.h
This file describes how to lower LLVM code to machine code.

llvm::AtomicRMWInst
an instruction that atomically reads a memory location, combines it with another value,...
Definition: Instructions.h:704

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst). Holds everything related to callin...
Definition: InstrTypes.h:1112

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1479

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:32

llvm::DataLayout
A parsed version of the target data layout string, and methods for querying it.
Definition: DataLayout.h:63

llvm::Function
Definition: Function.h:63

llvm::Instruction
Definition: Instruction.h:68

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67

llvm::LoadInst
An instruction for reading from memory.
Definition: Instructions.h:176

llvm::MVT
Machine Value Type.
Definition: MachineValueType.h:35

llvm::MachineFunction
Definition: MachineFunction.h:267

llvm::NVPTXSubtarget
Definition: NVPTXSubtarget.h:30

llvm::NVPTXTargetLowering
Definition: NVPTXISelLowering.h:99

llvm::NVPTXTargetLowering::enableAggressiveFMAFusion
bool enableAggressiveFMAFusion(EVT VT) const override
Return true if target always benefits from combining into FMA for a given value type.
Definition: NVPTXISelLowering.h:238

llvm::NVPTXTargetLowering::getConstraintType
ConstraintType getConstraintType(StringRef Constraint) const override
getConstraintType - Given a constraint letter, return the type of constraint it is for this target.
Definition: NVPTXISelLowering.cpp:4386

llvm::NVPTXTargetLowering::LowerOperation
SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override
This callback is invoked for operations that are unsupported by the target, which are registered to u...
Definition: NVPTXISelLowering.cpp:2649

llvm::NVPTXTargetLowering::nvTM
const NVPTXTargetMachine * nvTM
Definition: NVPTXISelLowering.h:193

llvm::NVPTXTargetLowering::LowerGlobalAddress
SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const
Definition: NVPTXISelLowering.cpp:1139

llvm::NVPTXTargetLowering::getJumpTableRegTy
MVT getJumpTableRegTy(const DataLayout &) const override
Definition: NVPTXISelLowering.h:234

llvm::NVPTXTargetLowering::useF32FTZ
bool useF32FTZ(const MachineFunction &MF) const
Definition: NVPTXISelLowering.cpp:133

llvm::NVPTXTargetLowering::LowerSTACKSAVE
SDValue LowerSTACKSAVE(SDValue Op, SelectionDAG &DAG) const
Definition: NVPTXISelLowering.cpp:2061

llvm::NVPTXTargetLowering::combineRepeatedFPDivisors
unsigned combineRepeatedFPDivisors() const override
Indicate whether this target prefers to combine FDIVs with the same divisor.
Definition: NVPTXISelLowering.h:223

llvm::NVPTXTargetLowering::getFunctionArgumentAlignment
Align getFunctionArgumentAlignment(const Function *F, Type *Ty, unsigned Idx, const DataLayout &DL) const
Definition: NVPTXISelLowering.cpp:1266

llvm::NVPTXTargetLowering::getSqrtEstimate
SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, int &ExtraSteps, bool &UseOneConst, bool Reciprocal) const override
Hooks for building estimates in place of slower divisions and square roots.
Definition: NVPTXISelLowering.cpp:1089

llvm::NVPTXTargetLowering::LowerReturn
SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg, const SmallVectorImpl< ISD::OutputArg > &Outs, const SmallVectorImpl< SDValue > &OutVals, const SDLoc &dl, SelectionDAG &DAG) const override
This hook must be implemented to lower outgoing return values, described by the Outs array,...
Definition: NVPTXISelLowering.cpp:3304

llvm::NVPTXTargetLowering::LowerFormalArguments
SDValue LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv, bool isVarArg, const SmallVectorImpl< ISD::InputArg > &Ins, const SDLoc &dl, SelectionDAG &DAG, SmallVectorImpl< SDValue > &InVals) const override
This hook must be implemented to lower the incoming (formal) arguments, described by the Ins array,...
Definition: NVPTXISelLowering.cpp:3079

llvm::NVPTXTargetLowering::shouldCastAtomicLoadInIR
AtomicExpansionKind shouldCastAtomicLoadInIR(LoadInst *LI) const override
Returns how the given (atomic) load should be cast by the IR-level AtomicExpand pass.
Definition: NVPTXISelLowering.h:246

llvm::NVPTXTargetLowering::shouldCastAtomicStoreInIR
AtomicExpansionKind shouldCastAtomicStoreInIR(StoreInst *SI) const override
Returns how the given (atomic) store should be cast by the IR-level AtomicExpand pass into.
Definition: NVPTXISelLowering.h:250

llvm::NVPTXTargetLowering::LowerAsmOperandForConstraint
void LowerAsmOperandForConstraint(SDValue Op, StringRef Constraint, std::vector< SDValue > &Ops, SelectionDAG &DAG) const override
Lower the specified operand into the Ops vector.
Definition: NVPTXISelLowering.cpp:3426

llvm::NVPTXTargetLowering::LowerSTACKRESTORE
SDValue LowerSTACKRESTORE(SDValue Op, SelectionDAG &DAG) const
Definition: NVPTXISelLowering.cpp:2038

llvm::NVPTXTargetLowering::aggressivelyPreferBuildVectorSources
bool aggressivelyPreferBuildVectorSources(EVT VecVT) const override
Definition: NVPTXISelLowering.h:257

llvm::NVPTXTargetLowering::isTruncateFree
bool isTruncateFree(Type *SrcTy, Type *DstTy) const override
Return true if it's free to truncate a value of type FromTy to type ToTy.
Definition: NVPTXISelLowering.h:145

llvm::NVPTXTargetLowering::getParamName
std::string getParamName(const Function *F, int Idx) const
Definition: NVPTXISelLowering.cpp:4326

llvm::NVPTXTargetLowering::getPreferredVectorAction
TargetLoweringBase::LegalizeTypeAction getPreferredVectorAction(MVT VT) const override
Return the preferred vector type legalization action.
Definition: NVPTXISelLowering.cpp:1082

llvm::NVPTXTargetLowering::getPrototype
std::string getPrototype(const DataLayout &DL, Type *, const ArgListTy &, const SmallVectorImpl< ISD::OutputArg > &, MaybeAlign retAlignment, std::optional< std::pair< unsigned, const APInt & > > VAInfo, const CallBase &CB, unsigned UniqueCallSite) const
Definition: NVPTXISelLowering.cpp:1152

llvm::NVPTXTargetLowering::getFunctionParamOptimizedAlign
Align getFunctionParamOptimizedAlign(const Function *F, Type *ArgTy, const DataLayout &DL) const
getFunctionParamOptimizedAlign - since function arguments are passed via .param space,...
Definition: NVPTXISelLowering.cpp:4279

llvm::NVPTXTargetLowering::LowerDYNAMIC_STACKALLOC
SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const
Definition: NVPTXISelLowering.cpp:2007

llvm::NVPTXTargetLowering::getScalarShiftAmountTy
MVT getScalarShiftAmountTy(const DataLayout &, EVT) const override
Return the type to use for a scalar shift opcode, given the shifted amount type.
Definition: NVPTXISelLowering.h:196

llvm::NVPTXTargetLowering::getSetCCResultType
EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Ctx, EVT VT) const override
Return the ValueType of the result of SETCC operations.
Definition: NVPTXISelLowering.h:153

llvm::NVPTXTargetLowering::getRegForInlineAsmConstraint
std::pair< unsigned, const TargetRegisterClass * > getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const override
Given a physical register constraint (e.g.
Definition: NVPTXISelLowering.cpp:4408

llvm::NVPTXTargetLowering::isLegalAddressingMode
bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM, Type *Ty, unsigned AS, Instruction *I=nullptr) const override
isLegalAddressingMode - Return true if the addressing mode represented by AM is legal for this target...
Definition: NVPTXISelLowering.cpp:4345

llvm::NVPTXTargetLowering::shouldExpandAtomicRMWInIR
AtomicExpansionKind shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override
Returns how the IR-level AtomicExpand pass should expand the given AtomicRMW, if at all.
Definition: NVPTXISelLowering.cpp:5522

llvm::NVPTXTargetLowering::isCheapToSpeculateCtlz
bool isCheapToSpeculateCtlz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic ctlz.
Definition: NVPTXISelLowering.h:244

llvm::NVPTXTargetLowering::getFunctionByValParamAlign
Align getFunctionByValParamAlign(const Function *F, Type *ArgTy, Align InitialAlign, const DataLayout &DL) const
Helper for computing alignment of a device function byval parameter.
Definition: NVPTXISelLowering.cpp:4300

llvm::NVPTXTargetLowering::getTgtMemIntrinsic
bool getTgtMemIntrinsic(IntrinsicInfo &Info, const CallInst &I, MachineFunction &MF, unsigned Intrinsic) const override
Given an intrinsic, checks if on the target the intrinsic will need to map to a MemIntrinsicNode (tou...
Definition: NVPTXISelLowering.cpp:3439

llvm::NVPTXTargetLowering::getTargetNodeName
const char * getTargetNodeName(unsigned Opcode) const override
This method returns the name of a target specific DAG node.
Definition: NVPTXISelLowering.cpp:1003

llvm::NVPTXTargetLowering::allowFMA
bool allowFMA(MachineFunction &MF, CodeGenOptLevel OptLevel) const
Definition: NVPTXISelLowering.cpp:4443

llvm::NVPTXTargetLowering::usePrecSqrtF32
bool usePrecSqrtF32() const
Definition: NVPTXISelLowering.cpp:123

llvm::NVPTXTargetLowering::getJumpTableEncoding
unsigned getJumpTableEncoding() const override
Return the entry encoding for a jump table in the current function.
Definition: NVPTXISelLowering.cpp:2766

llvm::NVPTXTargetLowering::isFMAFasterThanFMulAndFAdd
bool isFMAFasterThanFMulAndFAdd(const MachineFunction &MF, EVT) const override
Return true if an FMA operation is faster than a pair of fmul and fadd instructions.
Definition: NVPTXISelLowering.h:228

llvm::NVPTXTargetLowering::allowUnsafeFPMath
bool allowUnsafeFPMath(MachineFunction &MF) const
Definition: NVPTXISelLowering.cpp:4460

llvm::NVPTXTargetLowering::getDivF32Level
int getDivF32Level() const
Definition: NVPTXISelLowering.cpp:110

llvm::NVPTXTargetLowering::LowerCall
SDValue LowerCall(CallLoweringInfo &CLI, SmallVectorImpl< SDValue > &InVals) const override
This hook must be implemented to lower calls into the specified DAG.
Definition: NVPTXISelLowering.cpp:1411

llvm::NVPTXTargetMachine
NVPTXTargetMachine.
Definition: NVPTXTargetMachine.h:25

llvm::SDLoc
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Definition: SelectionDAGNodes.h:1182

llvm::SDNode
Represents one node in the SelectionDAG.
Definition: SelectionDAGNodes.h:496

llvm::SDValue
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
Definition: SelectionDAGNodes.h:145

llvm::SelectionDAG
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
Definition: SelectionDAG.h:228

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:573

llvm::StoreInst
An instruction for storing to memory.
Definition: Instructions.h:292

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:51

llvm::TargetLoweringBase::Enabled
@ Enabled
Definition: TargetLowering.h:576

llvm::TargetLoweringBase::LegalizeTypeAction
LegalizeTypeAction
This enum indicates whether a type is legal for a target, and if not, what action should be used to...
Definition: TargetLowering.h:209

llvm::TargetLoweringBase::AtomicExpansionKind
AtomicExpansionKind
Enum that specifies what an atomic load/AtomicRMWInst is expanded to, if at all.
Definition: TargetLowering.h:253

llvm::TargetLoweringBase::AtomicExpansionKind::None
@ None

llvm::TargetLoweringBase::ArgListTy
std::vector< ArgListEntry > ArgListTy
Definition: TargetLowering.h:329

llvm::TargetLowering
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
Definition: TargetLowering.h:3780

llvm::TargetLowering::ConstraintType
ConstraintType
Definition: TargetLowering.h:4950

llvm::TargetRegisterInfo
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
Definition: TargetRegisterInfo.h:235

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition: Type.h:237

llvm::Type::getPrimitiveSizeInBits
TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.

unsigned

llvm::ISD::BUILTIN_OP_END
@ BUILTIN_OP_END
BUILTIN_OP_END - This must be the last enum value in this list.
Definition: ISDOpcodes.h:1494

llvm::NVPTXISD::NodeType
NodeType
Definition: NVPTXISelLowering.h:23

llvm::NVPTXISD::Prototype
@ Prototype
Definition: NVPTXISelLowering.h:46

llvm::NVPTXISD::PrintConvergentCallUni
@ PrintConvergentCallUni
Definition: NVPTXISelLowering.h:38

llvm::NVPTXISD::LastCallArg
@ LastCallArg
Definition: NVPTXISelLowering.h:41

llvm::NVPTXISD::LOAD_PARAM
@ LOAD_PARAM
Definition: NVPTXISelLowering.h:29

llvm::NVPTXISD::CallArg
@ CallArg
Definition: NVPTXISelLowering.h:40

llvm::NVPTXISD::DeclareRetParam
@ DeclareRetParam
Definition: NVPTXISelLowering.h:32

llvm::NVPTXISD::STACKSAVE
@ STACKSAVE
Definition: NVPTXISelLowering.h:66

llvm::NVPTXISD::PRMT
@ PRMT
Definition: NVPTXISelLowering.h:62

llvm::NVPTXISD::StoreParamS32
@ StoreParamS32
Definition: NVPTXISelLowering.h:85

llvm::NVPTXISD::MoveParam
@ MoveParam
Definition: NVPTXISelLowering.h:47

llvm::NVPTXISD::CALL
@ CALL
Definition: NVPTXISelLowering.h:27

llvm::NVPTXISD::CallSymbol
@ CallSymbol
Definition: NVPTXISelLowering.h:45

llvm::NVPTXISD::BrxItem
@ BrxItem
Definition: NVPTXISelLowering.h:68

llvm::NVPTXISD::LoadParamV2
@ LoadParamV2
Definition: NVPTXISelLowering.h:80

llvm::NVPTXISD::PrintConvergentCall
@ PrintConvergentCall
Definition: NVPTXISelLowering.h:36

llvm::NVPTXISD::StoreV2
@ StoreV2
Definition: NVPTXISelLowering.h:77

llvm::NVPTXISD::RETURN
@ RETURN
Definition: NVPTXISelLowering.h:49

llvm::NVPTXISD::CallSeqBegin
@ CallSeqBegin
Definition: NVPTXISelLowering.h:50

llvm::NVPTXISD::FIRST_NUMBER
@ FIRST_NUMBER
Definition: NVPTXISelLowering.h:25

llvm::NVPTXISD::StoreRetval
@ StoreRetval
Definition: NVPTXISelLowering.h:87

llvm::NVPTXISD::StoreRetvalV2
@ StoreRetvalV2
Definition: NVPTXISelLowering.h:88

llvm::NVPTXISD::LDUV2
@ LDUV2
Definition: NVPTXISelLowering.h:75

llvm::NVPTXISD::MUL_WIDE_SIGNED
@ MUL_WIDE_SIGNED
Definition: NVPTXISelLowering.h:56

llvm::NVPTXISD::FSHL_CLAMP
@ FSHL_CLAMP
Definition: NVPTXISelLowering.h:54

llvm::NVPTXISD::SETP_F16X2
@ SETP_F16X2
Definition: NVPTXISelLowering.h:58

llvm::NVPTXISD::ProxyReg
@ ProxyReg
Definition: NVPTXISelLowering.h:53

llvm::NVPTXISD::LAST_MEMORY_OPCODE
@ LAST_MEMORY_OPCODE
Definition: NVPTXISelLowering.h:90

llvm::NVPTXISD::StoreV4
@ StoreV4
Definition: NVPTXISelLowering.h:78

llvm::NVPTXISD::CallVal
@ CallVal
Definition: NVPTXISelLowering.h:44

llvm::NVPTXISD::BrxEnd
@ BrxEnd
Definition: NVPTXISelLowering.h:69

llvm::NVPTXISD::LoadParamV4
@ LoadParamV4
Definition: NVPTXISelLowering.h:81

llvm::NVPTXISD::Dummy
@ Dummy
Definition: NVPTXISelLowering.h:70

llvm::NVPTXISD::PrintCall
@ PrintCall
Definition: NVPTXISelLowering.h:35

llvm::NVPTXISD::CallPrototype
@ CallPrototype
Definition: NVPTXISelLowering.h:52

llvm::NVPTXISD::DeclareScalarRet
@ DeclareScalarRet
Definition: NVPTXISelLowering.h:34

llvm::NVPTXISD::DYNAMIC_STACKALLOC
@ DYNAMIC_STACKALLOC
Definition: NVPTXISelLowering.h:64

llvm::NVPTXISD::LoadV2
@ LoadV2
Definition: NVPTXISelLowering.h:73

llvm::NVPTXISD::CallArgEnd
@ CallArgEnd
Definition: NVPTXISelLowering.h:42

llvm::NVPTXISD::StoreRetvalV4
@ StoreRetvalV4
Definition: NVPTXISelLowering.h:89

llvm::NVPTXISD::BrxStart
@ BrxStart
Definition: NVPTXISelLowering.h:67

llvm::NVPTXISD::StoreParamV4
@ StoreParamV4
Definition: NVPTXISelLowering.h:84

llvm::NVPTXISD::CallArgBegin
@ CallArgBegin
Definition: NVPTXISelLowering.h:39

llvm::NVPTXISD::BFI
@ BFI
Definition: NVPTXISelLowering.h:61

llvm::NVPTXISD::StoreParamV2
@ StoreParamV2
Definition: NVPTXISelLowering.h:83

llvm::NVPTXISD::FIRST_MEMORY_OPCODE
@ FIRST_MEMORY_OPCODE
Definition: NVPTXISelLowering.h:72

llvm::NVPTXISD::STACKRESTORE
@ STACKRESTORE
Definition: NVPTXISelLowering.h:65

llvm::NVPTXISD::Wrapper
@ Wrapper
Definition: NVPTXISelLowering.h:26

llvm::NVPTXISD::SETP_BF16X2
@ SETP_BF16X2
Definition: NVPTXISelLowering.h:59

llvm::NVPTXISD::DeclareParam
@ DeclareParam
Definition: NVPTXISelLowering.h:30

llvm::NVPTXISD::LDUV4
@ LDUV4
Definition: NVPTXISelLowering.h:76

llvm::NVPTXISD::CallVoid
@ CallVoid
Definition: NVPTXISelLowering.h:43

llvm::NVPTXISD::StoreParam
@ StoreParam
Definition: NVPTXISelLowering.h:82

llvm::NVPTXISD::StoreParamU32
@ StoreParamU32
Definition: NVPTXISelLowering.h:86

llvm::NVPTXISD::PrintCallUni
@ PrintCallUni
Definition: NVPTXISelLowering.h:37

llvm::NVPTXISD::DeclareRet
@ DeclareRet
Definition: NVPTXISelLowering.h:33

llvm::NVPTXISD::FSHR_CLAMP
@ FSHR_CLAMP
Definition: NVPTXISelLowering.h:55

llvm::NVPTXISD::DeclareScalarParam
@ DeclareScalarParam
Definition: NVPTXISelLowering.h:31

llvm::NVPTXISD::CallSeqEnd
@ CallSeqEnd
Definition: NVPTXISelLowering.h:51

llvm::NVPTXISD::BFE
@ BFE
Definition: NVPTXISelLowering.h:60

llvm::NVPTXISD::RET_GLUE
@ RET_GLUE
Definition: NVPTXISelLowering.h:28

llvm::NVPTXISD::FCOPYSIGN
@ FCOPYSIGN
Definition: NVPTXISelLowering.h:63

llvm::NVPTXISD::PseudoUseParam
@ PseudoUseParam
Definition: NVPTXISelLowering.h:48

llvm::NVPTXISD::MUL_WIDE_UNSIGNED
@ MUL_WIDE_UNSIGNED
Definition: NVPTXISelLowering.h:57

llvm::NVPTXISD::LoadV4
@ LoadV4
Definition: NVPTXISelLowering.h:74

llvm::NVPTXISD::LoadParam
@ LoadParam
Definition: NVPTXISelLowering.h:79

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::CodeGenOptLevel
CodeGenOptLevel
Code generation optimization level.
Definition: CodeGen.h:54

N
#define N

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::EVT
Extended Value Type.
Definition: ValueTypes.h:35

llvm::EVT::getVectorVT
static EVT getVectorVT(LLVMContext &Context, EVT VT, unsigned NumElements, bool IsScalable=false)
Returns the EVT that represents a vector NumElements in length, where each element is of type VT.
Definition: ValueTypes.h:74

llvm::EVT::isVector
bool isVector() const
Return true if this is a vector value type.
Definition: ValueTypes.h:168

llvm::EVT::getVectorNumElements
unsigned getVectorNumElements() const
Given a vector type, return the number of elements it contains.
Definition: ValueTypes.h:331

llvm::MaybeAlign
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Definition: Alignment.h:117

llvm::TargetLoweringBase::AddrMode
This represents an addressing mode of: BaseGV + BaseOffs + BaseReg + Scale*ScaleReg + ScalableOffset*...
Definition: TargetLowering.h:2816

llvm::TargetLoweringBase::IntrinsicInfo
Definition: TargetLowering.h:1202