LLVM 19.0.0git
AMDGPUAsmUtils.cpp
Go to the documentation of this file.
1//===-- AMDGPUAsmUtils.cpp - AsmParser/InstPrinter common -----------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8#include "AMDGPUAsmUtils.h"
9#include "AMDGPUBaseInfo.h"
10#include "SIDefines.h"
11
12namespace llvm {
13namespace AMDGPU {
14
15namespace DepCtr {
16
17// NOLINTBEGIN
19 // Name max dflt offset width constraint
20 {{"depctr_hold_cnt"}, 1, 1, 7, 1, isGFX10_BEncoding},
21 {{"depctr_sa_sdst"}, 1, 1, 0, 1},
22 {{"depctr_va_vdst"}, 15, 15, 12, 4},
23 {{"depctr_va_sdst"}, 7, 7, 9, 3},
24 {{"depctr_va_ssrc"}, 1, 1, 8, 1},
25 {{"depctr_va_vcc"}, 1, 1, 1, 1},
26 {{"depctr_vm_vsrc"}, 7, 7, 2, 3},
27};
28// NOLINTEND
29
30const int DEP_CTR_SIZE =
31 static_cast<int>(sizeof(DepCtrInfo) / sizeof(CustomOperandVal));
32
33} // namespace DepCtr
34
35namespace SendMsg {
36
37// Disable lint checking for this block since it makes the table unreadable.
38// NOLINTBEGIN
39// clang-format off
41 {{""}},
42 {{"MSG_INTERRUPT"}, ID_INTERRUPT},
43 {{"MSG_GS"}, ID_GS_PreGFX11, isNotGFX11Plus},
44 {{"MSG_GS_DONE"}, ID_GS_DONE_PreGFX11, isNotGFX11Plus},
45 {{"MSG_SAVEWAVE"}, ID_SAVEWAVE, isGFX8_GFX9_GFX10},
46 {{"MSG_STALL_WAVE_GEN"}, ID_STALL_WAVE_GEN, isGFX9_GFX10_GFX11},
47 {{"MSG_HALT_WAVES"}, ID_HALT_WAVES, isGFX9_GFX10_GFX11},
48 {{"MSG_ORDERED_PS_DONE"}, ID_ORDERED_PS_DONE, isGFX9_GFX10},
49 {{"MSG_EARLY_PRIM_DEALLOC"}, ID_EARLY_PRIM_DEALLOC, isGFX9_GFX10},
50 {{"MSG_GS_ALLOC_REQ"}, ID_GS_ALLOC_REQ, isGFX9Plus},
51 {{"MSG_GET_DOORBELL"}, ID_GET_DOORBELL, isGFX9_GFX10},
52 {{"MSG_GET_DDID"}, ID_GET_DDID, isGFX10},
53 {{"MSG_HS_TESSFACTOR"}, ID_HS_TESSFACTOR_GFX11Plus, isGFX11Plus},
54 {{"MSG_DEALLOC_VGPRS"}, ID_DEALLOC_VGPRS_GFX11Plus, isGFX11Plus},
55 {{""}},
56 {{"MSG_SYSMSG"}, ID_SYSMSG},
57 {{"MSG_RTN_GET_DOORBELL"}, ID_RTN_GET_DOORBELL, isGFX11Plus},
58 {{"MSG_RTN_GET_DDID"}, ID_RTN_GET_DDID, isGFX11Plus},
59 {{"MSG_RTN_GET_TMA"}, ID_RTN_GET_TMA, isGFX11Plus},
60 {{"MSG_RTN_GET_REALTIME"}, ID_RTN_GET_REALTIME, isGFX11Plus},
61 {{"MSG_RTN_SAVE_WAVE"}, ID_RTN_SAVE_WAVE, isGFX11Plus},
62 {{"MSG_RTN_GET_TBA"}, ID_RTN_GET_TBA, isGFX11Plus},
63 {{"MSG_RTN_GET_TBA_TO_PC"}, ID_RTN_GET_TBA_TO_PC, isGFX11Plus},
64 {{"MSG_RTN_GET_SE_AID_ID"}, ID_RTN_GET_SE_AID_ID, isGFX12Plus},
65};
66// clang-format on
67// NOLINTEND
68
69const int MSG_SIZE = static_cast<int>(
71
72// These two must be in sync with llvm::AMDGPU::SendMsg::Op enum members, see SIDefines.h.
73const char *const OpSysSymbolic[OP_SYS_LAST_] = {
74 nullptr,
75 "SYSMSG_OP_ECC_ERR_INTERRUPT",
76 "SYSMSG_OP_REG_RD",
77 "SYSMSG_OP_HOST_TRAP_ACK",
78 "SYSMSG_OP_TTRACE_PC"
79};
80
81const char *const OpGsSymbolic[OP_GS_LAST_] = {
82 "GS_OP_NOP",
83 "GS_OP_CUT",
84 "GS_OP_EMIT",
85 "GS_OP_EMIT_CUT"
86};
87
88} // namespace SendMsg
89
90namespace Hwreg {
91
92// Disable lint checking for this block since it makes the table unreadable.
93// NOLINTBEGIN
94// clang-format off
96 {{""}},
97 {{"HW_REG_MODE"}, ID_MODE},
98 {{"HW_REG_STATUS"}, ID_STATUS},
99 {{"HW_REG_TRAPSTS"}, ID_TRAPSTS, isNotGFX12Plus},
100 {{"HW_REG_HW_ID"}, ID_HW_ID, isNotGFX10Plus},
101 {{"HW_REG_GPR_ALLOC"}, ID_GPR_ALLOC},
102 {{"HW_REG_LDS_ALLOC"}, ID_LDS_ALLOC},
103 {{"HW_REG_IB_STS"}, ID_IB_STS},
104 {{""}},
105 {{""}},
106 {{"HW_REG_PERF_SNAPSHOT_DATA"}, ID_PERF_SNAPSHOT_DATA_gfx12, isGFX12Plus},
107 {{"HW_REG_PERF_SNAPSHOT_PC_LO"}, ID_PERF_SNAPSHOT_PC_LO_gfx12, isGFX12Plus},
108 {{"HW_REG_PERF_SNAPSHOT_PC_HI"}, ID_PERF_SNAPSHOT_PC_HI_gfx12, isGFX12Plus},
109 {{""}},
110 {{""}},
111 {{"HW_REG_SH_MEM_BASES"}, ID_MEM_BASES, isGFX9_GFX10_GFX11},
112 {{"HW_REG_TBA_LO"}, ID_TBA_LO, isGFX9_GFX10},
113 {{"HW_REG_TBA_HI"}, ID_TBA_HI, isGFX9_GFX10},
114 {{"HW_REG_TMA_LO"}, ID_TMA_LO, isGFX9_GFX10},
115 {{"HW_REG_TMA_HI"}, ID_TMA_HI, isGFX9_GFX10},
116 {{"HW_REG_FLAT_SCR_LO"}, ID_FLAT_SCR_LO, isGFX10_GFX11},
117 {{"HW_REG_FLAT_SCR_HI"}, ID_FLAT_SCR_HI, isGFX10_GFX11},
118 {{"HW_REG_XNACK_MASK"}, ID_XNACK_MASK, isGFX10Before1030},
119 {{"HW_REG_HW_ID1"}, ID_HW_ID1, isGFX10Plus},
120 {{"HW_REG_HW_ID2"}, ID_HW_ID2, isGFX10Plus},
121 {{"HW_REG_POPS_PACKER"}, ID_POPS_PACKER, isGFX10},
122 {{""}},
123 {{"HW_REG_PERF_SNAPSHOT_DATA"}, ID_PERF_SNAPSHOT_DATA_gfx11, isGFX11},
124 {{""}},
125 {{"HW_REG_SHADER_CYCLES"}, ID_SHADER_CYCLES, isGFX10_3_GFX11},
126 {{"HW_REG_SHADER_CYCLES_HI"}, ID_SHADER_CYCLES_HI, isGFX12Plus},
127 {{"HW_REG_DVGPR_ALLOC_LO"}, ID_DVGPR_ALLOC_LO, isGFX12Plus},
128 {{"HW_REG_DVGPR_ALLOC_HI"}, ID_DVGPR_ALLOC_HI, isGFX12Plus},
129
130 // Register numbers reused in GFX11
131 {{"HW_REG_PERF_SNAPSHOT_PC_LO"}, ID_PERF_SNAPSHOT_PC_LO_gfx11, isGFX11},
132 {{"HW_REG_PERF_SNAPSHOT_PC_HI"}, ID_PERF_SNAPSHOT_PC_HI_gfx11, isGFX11},
133
134 // Register numbers reused in GFX12+
135 {{"HW_REG_STATE_PRIV"}, ID_STATE_PRIV, isGFX12Plus},
136 {{"HW_REG_PERF_SNAPSHOT_DATA1"}, ID_PERF_SNAPSHOT_DATA1, isGFX12Plus},
137 {{"HW_REG_PERF_SNAPSHOT_DATA2"}, ID_PERF_SNAPSHOT_DATA2, isGFX12Plus},
138 {{"HW_REG_EXCP_FLAG_PRIV"}, ID_EXCP_FLAG_PRIV, isGFX12Plus},
139 {{"HW_REG_EXCP_FLAG_USER"}, ID_EXCP_FLAG_USER, isGFX12Plus},
140 {{"HW_REG_TRAP_CTRL"}, ID_TRAP_CTRL, isGFX12Plus},
141 {{"HW_REG_SCRATCH_BASE_LO"}, ID_FLAT_SCR_LO, isGFX12Plus},
142 {{"HW_REG_SCRATCH_BASE_HI"}, ID_FLAT_SCR_HI, isGFX12Plus},
143 {{"HW_REG_SHADER_CYCLES_LO"}, ID_SHADER_CYCLES, isGFX12Plus},
144
145 // GFX940 specific registers
146 {{"HW_REG_XCC_ID"}, ID_XCC_ID, isGFX940},
147 {{"HW_REG_SQ_PERF_SNAPSHOT_DATA"}, ID_SQ_PERF_SNAPSHOT_DATA, isGFX940},
148 {{"HW_REG_SQ_PERF_SNAPSHOT_DATA1"}, ID_SQ_PERF_SNAPSHOT_DATA1, isGFX940},
149 {{"HW_REG_SQ_PERF_SNAPSHOT_PC_LO"}, ID_SQ_PERF_SNAPSHOT_PC_LO, isGFX940},
150 {{"HW_REG_SQ_PERF_SNAPSHOT_PC_HI"}, ID_SQ_PERF_SNAPSHOT_PC_HI, isGFX940},
151
152 // Aliases
153 {{"HW_REG_HW_ID"}, ID_HW_ID1, isGFX10},
154};
155// clang-format on
156// NOLINTEND
157
158const int OPR_SIZE = static_cast<int>(
160
161} // namespace Hwreg
162
163namespace MTBUFFormat {
164
166 "BUF_DATA_FORMAT_INVALID",
167 "BUF_DATA_FORMAT_8",
168 "BUF_DATA_FORMAT_16",
169 "BUF_DATA_FORMAT_8_8",
170 "BUF_DATA_FORMAT_32",
171 "BUF_DATA_FORMAT_16_16",
172 "BUF_DATA_FORMAT_10_11_11",
173 "BUF_DATA_FORMAT_11_11_10",
174 "BUF_DATA_FORMAT_10_10_10_2",
175 "BUF_DATA_FORMAT_2_10_10_10",
176 "BUF_DATA_FORMAT_8_8_8_8",
177 "BUF_DATA_FORMAT_32_32",
178 "BUF_DATA_FORMAT_16_16_16_16",
179 "BUF_DATA_FORMAT_32_32_32",
180 "BUF_DATA_FORMAT_32_32_32_32",
181 "BUF_DATA_FORMAT_RESERVED_15"
182};
183
185 "BUF_NUM_FORMAT_UNORM",
186 "BUF_NUM_FORMAT_SNORM",
187 "BUF_NUM_FORMAT_USCALED",
188 "BUF_NUM_FORMAT_SSCALED",
189 "BUF_NUM_FORMAT_UINT",
190 "BUF_NUM_FORMAT_SINT",
191 "",
192 "BUF_NUM_FORMAT_FLOAT"
193};
194
196 "BUF_NUM_FORMAT_UNORM",
197 "BUF_NUM_FORMAT_SNORM",
198 "BUF_NUM_FORMAT_USCALED",
199 "BUF_NUM_FORMAT_SSCALED",
200 "BUF_NUM_FORMAT_UINT",
201 "BUF_NUM_FORMAT_SINT",
202 "BUF_NUM_FORMAT_SNORM_OGL",
203 "BUF_NUM_FORMAT_FLOAT"
204};
205
206StringLiteral const NfmtSymbolicVI[] = { // VI and GFX9
207 "BUF_NUM_FORMAT_UNORM",
208 "BUF_NUM_FORMAT_SNORM",
209 "BUF_NUM_FORMAT_USCALED",
210 "BUF_NUM_FORMAT_SSCALED",
211 "BUF_NUM_FORMAT_UINT",
212 "BUF_NUM_FORMAT_SINT",
213 "BUF_NUM_FORMAT_RESERVED_6",
214 "BUF_NUM_FORMAT_FLOAT"
215};
216
218 "BUF_FMT_INVALID",
219
220 "BUF_FMT_8_UNORM",
221 "BUF_FMT_8_SNORM",
222 "BUF_FMT_8_USCALED",
223 "BUF_FMT_8_SSCALED",
224 "BUF_FMT_8_UINT",
225 "BUF_FMT_8_SINT",
226
227 "BUF_FMT_16_UNORM",
228 "BUF_FMT_16_SNORM",
229 "BUF_FMT_16_USCALED",
230 "BUF_FMT_16_SSCALED",
231 "BUF_FMT_16_UINT",
232 "BUF_FMT_16_SINT",
233 "BUF_FMT_16_FLOAT",
234
235 "BUF_FMT_8_8_UNORM",
236 "BUF_FMT_8_8_SNORM",
237 "BUF_FMT_8_8_USCALED",
238 "BUF_FMT_8_8_SSCALED",
239 "BUF_FMT_8_8_UINT",
240 "BUF_FMT_8_8_SINT",
241
242 "BUF_FMT_32_UINT",
243 "BUF_FMT_32_SINT",
244 "BUF_FMT_32_FLOAT",
245
246 "BUF_FMT_16_16_UNORM",
247 "BUF_FMT_16_16_SNORM",
248 "BUF_FMT_16_16_USCALED",
249 "BUF_FMT_16_16_SSCALED",
250 "BUF_FMT_16_16_UINT",
251 "BUF_FMT_16_16_SINT",
252 "BUF_FMT_16_16_FLOAT",
253
254 "BUF_FMT_10_11_11_UNORM",
255 "BUF_FMT_10_11_11_SNORM",
256 "BUF_FMT_10_11_11_USCALED",
257 "BUF_FMT_10_11_11_SSCALED",
258 "BUF_FMT_10_11_11_UINT",
259 "BUF_FMT_10_11_11_SINT",
260 "BUF_FMT_10_11_11_FLOAT",
261
262 "BUF_FMT_11_11_10_UNORM",
263 "BUF_FMT_11_11_10_SNORM",
264 "BUF_FMT_11_11_10_USCALED",
265 "BUF_FMT_11_11_10_SSCALED",
266 "BUF_FMT_11_11_10_UINT",
267 "BUF_FMT_11_11_10_SINT",
268 "BUF_FMT_11_11_10_FLOAT",
269
270 "BUF_FMT_10_10_10_2_UNORM",
271 "BUF_FMT_10_10_10_2_SNORM",
272 "BUF_FMT_10_10_10_2_USCALED",
273 "BUF_FMT_10_10_10_2_SSCALED",
274 "BUF_FMT_10_10_10_2_UINT",
275 "BUF_FMT_10_10_10_2_SINT",
276
277 "BUF_FMT_2_10_10_10_UNORM",
278 "BUF_FMT_2_10_10_10_SNORM",
279 "BUF_FMT_2_10_10_10_USCALED",
280 "BUF_FMT_2_10_10_10_SSCALED",
281 "BUF_FMT_2_10_10_10_UINT",
282 "BUF_FMT_2_10_10_10_SINT",
283
284 "BUF_FMT_8_8_8_8_UNORM",
285 "BUF_FMT_8_8_8_8_SNORM",
286 "BUF_FMT_8_8_8_8_USCALED",
287 "BUF_FMT_8_8_8_8_SSCALED",
288 "BUF_FMT_8_8_8_8_UINT",
289 "BUF_FMT_8_8_8_8_SINT",
290
291 "BUF_FMT_32_32_UINT",
292 "BUF_FMT_32_32_SINT",
293 "BUF_FMT_32_32_FLOAT",
294
295 "BUF_FMT_16_16_16_16_UNORM",
296 "BUF_FMT_16_16_16_16_SNORM",
297 "BUF_FMT_16_16_16_16_USCALED",
298 "BUF_FMT_16_16_16_16_SSCALED",
299 "BUF_FMT_16_16_16_16_UINT",
300 "BUF_FMT_16_16_16_16_SINT",
301 "BUF_FMT_16_16_16_16_FLOAT",
302
303 "BUF_FMT_32_32_32_UINT",
304 "BUF_FMT_32_32_32_SINT",
305 "BUF_FMT_32_32_32_FLOAT",
306 "BUF_FMT_32_32_32_32_UINT",
307 "BUF_FMT_32_32_32_32_SINT",
308 "BUF_FMT_32_32_32_32_FLOAT"
309};
310
311unsigned const DfmtNfmt2UFmtGFX10[] = {
313
320
328
335
339
347
355
363
370
377
384
388
396
403};
404
406 "BUF_FMT_INVALID",
407
408 "BUF_FMT_8_UNORM",
409 "BUF_FMT_8_SNORM",
410 "BUF_FMT_8_USCALED",
411 "BUF_FMT_8_SSCALED",
412 "BUF_FMT_8_UINT",
413 "BUF_FMT_8_SINT",
414
415 "BUF_FMT_16_UNORM",
416 "BUF_FMT_16_SNORM",
417 "BUF_FMT_16_USCALED",
418 "BUF_FMT_16_SSCALED",
419 "BUF_FMT_16_UINT",
420 "BUF_FMT_16_SINT",
421 "BUF_FMT_16_FLOAT",
422
423 "BUF_FMT_8_8_UNORM",
424 "BUF_FMT_8_8_SNORM",
425 "BUF_FMT_8_8_USCALED",
426 "BUF_FMT_8_8_SSCALED",
427 "BUF_FMT_8_8_UINT",
428 "BUF_FMT_8_8_SINT",
429
430 "BUF_FMT_32_UINT",
431 "BUF_FMT_32_SINT",
432 "BUF_FMT_32_FLOAT",
433
434 "BUF_FMT_16_16_UNORM",
435 "BUF_FMT_16_16_SNORM",
436 "BUF_FMT_16_16_USCALED",
437 "BUF_FMT_16_16_SSCALED",
438 "BUF_FMT_16_16_UINT",
439 "BUF_FMT_16_16_SINT",
440 "BUF_FMT_16_16_FLOAT",
441
442 "BUF_FMT_10_11_11_FLOAT",
443
444 "BUF_FMT_11_11_10_FLOAT",
445
446 "BUF_FMT_10_10_10_2_UNORM",
447 "BUF_FMT_10_10_10_2_SNORM",
448 "BUF_FMT_10_10_10_2_UINT",
449 "BUF_FMT_10_10_10_2_SINT",
450
451 "BUF_FMT_2_10_10_10_UNORM",
452 "BUF_FMT_2_10_10_10_SNORM",
453 "BUF_FMT_2_10_10_10_USCALED",
454 "BUF_FMT_2_10_10_10_SSCALED",
455 "BUF_FMT_2_10_10_10_UINT",
456 "BUF_FMT_2_10_10_10_SINT",
457
458 "BUF_FMT_8_8_8_8_UNORM",
459 "BUF_FMT_8_8_8_8_SNORM",
460 "BUF_FMT_8_8_8_8_USCALED",
461 "BUF_FMT_8_8_8_8_SSCALED",
462 "BUF_FMT_8_8_8_8_UINT",
463 "BUF_FMT_8_8_8_8_SINT",
464
465 "BUF_FMT_32_32_UINT",
466 "BUF_FMT_32_32_SINT",
467 "BUF_FMT_32_32_FLOAT",
468
469 "BUF_FMT_16_16_16_16_UNORM",
470 "BUF_FMT_16_16_16_16_SNORM",
471 "BUF_FMT_16_16_16_16_USCALED",
472 "BUF_FMT_16_16_16_16_SSCALED",
473 "BUF_FMT_16_16_16_16_UINT",
474 "BUF_FMT_16_16_16_16_SINT",
475 "BUF_FMT_16_16_16_16_FLOAT",
476
477 "BUF_FMT_32_32_32_UINT",
478 "BUF_FMT_32_32_32_SINT",
479 "BUF_FMT_32_32_32_FLOAT",
480 "BUF_FMT_32_32_32_32_UINT",
481 "BUF_FMT_32_32_32_32_SINT",
482 "BUF_FMT_32_32_32_32_FLOAT"
483};
484
485unsigned const DfmtNfmt2UFmtGFX11[] = {
487
494
502
509
513
521
523
525
530
537
544
548
556
563};
564
565} // namespace MTBUFFormat
566
567namespace Swizzle {
568
// This must be in sync with llvm::AMDGPU::Swizzle::Id enum members, see SIDefines.h.

/// Symbolic names of the swizzle modes, five entries in total.
/// NOTE(review): the position in the array is presumably the value of the
/// matching Swizzle::Id enumerator - confirm against SIDefines.h.
const char *const IdSymbolic[] = {
  "QUAD_PERM",
  "BITMASK_PERM",
  "SWAP",
  "REVERSE",
  "BROADCAST",
};
577
578} // namespace Swizzle
579
580namespace VGPRIndexMode {
581
// This must be in sync with llvm::AMDGPU::VGPRIndexMode::Id enum members, see SIDefines.h.

/// Symbolic names of the VGPR index-mode operands, four entries in total.
/// NOTE(review): the position in the array is presumably the value of the
/// matching VGPRIndexMode::Id enumerator - confirm against SIDefines.h.
const char *const IdSymbolic[] = {
  "SRC0",
  "SRC1",
  "SRC2",
  "DST",
};
589
590} // namespace VGPRIndexMode
591
592} // namespace AMDGPU
593} // namespace llvm
static std::vector< std::pair< int, unsigned > > Swizzle(std::vector< std::pair< int, unsigned > > Src, R600InstrInfo::BankSwizzle Swz)
A wrapper around a string literal that serves as a proxy for constructing global tables of StringRefs...
Definition: StringRef.h:849
const CustomOperandVal DepCtrInfo[]
const CustomOperand< const MCSubtargetInfo & > Opr[]
StringLiteral const UfmtSymbolicGFX11[]
unsigned const DfmtNfmt2UFmtGFX10[]
StringLiteral const DfmtSymbolic[]
StringLiteral const NfmtSymbolicGFX10[]
unsigned const DfmtNfmt2UFmtGFX11[]
StringLiteral const NfmtSymbolicVI[]
StringLiteral const NfmtSymbolicSICI[]
StringLiteral const UfmtSymbolicGFX10[]
const char *const OpGsSymbolic[OP_GS_LAST_]
const char *const OpSysSymbolic[OP_SYS_LAST_]
const CustomOperand< const MCSubtargetInfo & > Msg[]
const char *const IdSymbolic[]
const char *const IdSymbolic[]
bool isGFX10_BEncoding(const MCSubtargetInfo &STI)
bool isGFX10_GFX11(const MCSubtargetInfo &STI)
bool isGFX10Before1030(const MCSubtargetInfo &STI)
bool isGFX10(const MCSubtargetInfo &STI)
bool isGFX12Plus(const MCSubtargetInfo &STI)
bool isGFX940(const MCSubtargetInfo &STI)
bool isGFX11(const MCSubtargetInfo &STI)
bool isGFX10_3_GFX11(const MCSubtargetInfo &STI)
bool isGFX8_GFX9_GFX10(const MCSubtargetInfo &STI)
bool isNotGFX10Plus(const MCSubtargetInfo &STI)
bool isNotGFX11Plus(const MCSubtargetInfo &STI)
bool isGFX11Plus(const MCSubtargetInfo &STI)
bool isGFX10Plus(const MCSubtargetInfo &STI)
bool isGFX9Plus(const MCSubtargetInfo &STI)
bool isNotGFX12Plus(const MCSubtargetInfo &STI)
bool isGFX9_GFX10_GFX11(const MCSubtargetInfo &STI)
bool isGFX9_GFX10(const MCSubtargetInfo &STI)
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18