LLVM 20.0.0git
NVPTXISelDAGToDAG.h
Go to the documentation of this file.
1//===-- NVPTXISelDAGToDAG.h - A dag to dag inst selector for NVPTX --------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines an instruction selector for the NVPTX target.
10//
11//===----------------------------------------------------------------------===//
12
13#ifndef LLVM_LIB_TARGET_NVPTX_NVPTXISELDAGTODAG_H
14#define LLVM_LIB_TARGET_NVPTX_NVPTXISELDAGTODAG_H
15
17#include "NVPTX.h"
18#include "NVPTXISelLowering.h"
19#include "NVPTXRegisterInfo.h"
20#include "NVPTXTargetMachine.h"
21#include "llvm/ADT/MapVector.h"
23#include "llvm/IR/InlineAsm.h"
24#include "llvm/IR/Intrinsics.h"
25#include "llvm/IR/LLVMContext.h"
27
28namespace llvm {
29
31 NVPTXScopes() = default;
34 bool empty() const;
35
36private:
38};
39
41 const NVPTXTargetMachine &TM;
42
43 // If true, generate mul.wide from sext and mul
44 bool doMulWide;
45
46 int getDivF32Level() const;
47 bool usePrecSqrtF32() const;
48 bool useF32FTZ() const;
49 bool allowFMA() const;
50 bool allowUnsafeFPMath() const;
51 bool doRsqrtOpt() const;
52
53 NVPTXScopes Scopes{};
54
55public:
57
59
60 bool runOnMachineFunction(MachineFunction &MF) override;
61 const NVPTXSubtarget *Subtarget = nullptr;
62
63 bool SelectInlineAsmMemoryOperand(const SDValue &Op,
64 InlineAsm::ConstraintCode ConstraintID,
65 std::vector<SDValue> &OutOps) override;
66
67private:
68// Include the pieces autogenerated from the target description.
69#include "NVPTXGenDAGISel.inc"
70
71 void Select(SDNode *N) override;
72 bool tryIntrinsicNoChain(SDNode *N);
73 bool tryIntrinsicChain(SDNode *N);
74 bool tryIntrinsicVoid(SDNode *N);
75 void SelectTexSurfHandle(SDNode *N);
76 bool tryLoad(SDNode *N);
77 bool tryLoadVector(SDNode *N);
78 bool tryLDGLDU(SDNode *N);
79 bool tryStore(SDNode *N);
80 bool tryStoreVector(SDNode *N);
81 bool tryLoadParam(SDNode *N);
82 bool tryStoreRetval(SDNode *N);
83 bool tryStoreParam(SDNode *N);
84 bool tryFence(SDNode *N);
85 void SelectAddrSpaceCast(SDNode *N);
86 bool tryBFE(SDNode *N);
87 bool tryConstantFP(SDNode *N);
88 bool SelectSETP_F16X2(SDNode *N);
89 bool SelectSETP_BF16X2(SDNode *N);
90 bool tryEXTRACT_VECTOR_ELEMENT(SDNode *N);
91 void SelectV2I64toI128(SDNode *N);
92 void SelectI128toV2I64(SDNode *N);
93 void SelectCpAsyncBulkG2S(SDNode *N);
94 void SelectCpAsyncBulkS2G(SDNode *N);
95 void SelectCpAsyncBulkTensorG2SCommon(SDNode *N, bool IsIm2Col = false);
96 void SelectCpAsyncBulkTensorS2GCommon(SDNode *N, bool IsIm2Col = false);
97 void SelectCpAsyncBulkTensorPrefetchCommon(SDNode *N, bool IsIm2Col = false);
98 void SelectCpAsyncBulkTensorReduceCommon(SDNode *N, unsigned RedOp,
99 bool IsIm2Col = false);
100
101 inline SDValue getI32Imm(unsigned Imm, const SDLoc &DL) {
102 return CurDAG->getTargetConstant(Imm, DL, MVT::i32);
103 }
104
105 // Match direct address complex pattern.
106 bool SelectDirectAddr(SDValue N, SDValue &Address);
107
108 bool SelectADDRri_imp(SDNode *OpNode, SDValue Addr, SDValue &Base,
109 SDValue &Offset, MVT VT);
110 bool SelectADDRri(SDNode *OpNode, SDValue Addr, SDValue &Base,
111 SDValue &Offset);
112 bool SelectADDRri64(SDNode *OpNode, SDValue Addr, SDValue &Base,
113 SDValue &Offset);
114 bool SelectADDRsi_imp(SDNode *OpNode, SDValue Addr, SDValue &Base,
115 SDValue &Offset, MVT VT);
116 bool SelectADDRsi(SDNode *OpNode, SDValue Addr, SDValue &Base,
117 SDValue &Offset);
118 bool SelectADDRsi64(SDNode *OpNode, SDValue Addr, SDValue &Base,
119 SDValue &Offset);
120
121 bool ChkMemSDNodeAddressSpace(SDNode *N, unsigned int spN) const;
122
123 static unsigned GetConvertOpcode(MVT DestTy, MVT SrcTy, LoadSDNode *N);
124
125 // Returns the Memory Order and Scope that the PTX memory instruction should
126 // use, and inserts appropriate fence instruction before the memory
127 // instruction, if needed to implement the instructions memory order. Required
128 // fences after the instruction need to be handled elsewhere.
129 std::pair<NVPTX::Ordering, NVPTX::Scope>
130 insertMemoryInstructionFence(SDLoc DL, SDValue &Chain, MemSDNode *N);
131 NVPTX::Scope getOperationScope(MemSDNode *N, NVPTX::Ordering O) const;
132};
133
135public:
136 static char ID;
138 CodeGenOptLevel OptLevel);
139};
140} // end namespace llvm
141
142#endif
AMDGPU Register Bank Select
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
#define LLVM_LIBRARY_VISIBILITY
Definition: Compiler.h:133
uint64_t Addr
uint64_t Offset
Definition: ELF_riscv.cpp:478
This file implements a map that provides insertion order iteration.
This class represents an Operation in the Expression.
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67
This class is used to represent ISD::LOAD nodes.
Machine Value Type.
This is an abstract virtual class for memory operations.
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Represents one node in the SelectionDAG.
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
SelectionDAGISel - This is the common base class used for SelectionDAG-based pattern-matching instruc...
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
CodeGenOptLevel
Code generation optimization level.
Definition: CodeGen.h:54
#define N
NVPTXScopes()=default
NVPTX::Scope operator[](SyncScope::ID ID) const
A MapVector that performs no allocations if smaller than a certain size.
Definition: MapVector.h:254