26 "Generic AMDGCN arch not classified correctly!");
36#define AMDGCN_GPU(NAME, ENUM, ISAVERSION, FEATURES) \
39#include "llvm/TargetParser/AMDGPUTargetParser.def"
47#define R600_GPU(NAME, ENUM, FEATURES) \
50#include "llvm/TargetParser/AMDGPUTargetParser.def"
58#define AMDGCN_GPU(NAME, ENUM, ISAVERSION, FEATURES) .Case(NAME, ENUM)
59#define AMDGCN_GPU_ALIAS(NAME, ENUM) .Case(NAME, ENUM)
60#include "llvm/TargetParser/AMDGPUTargetParser.def"
66#define R600_GPU(NAME, ENUM, FEATURES) .Case(NAME, ENUM)
67#define R600_GPU_ALIAS(NAME, ENUM) .Case(NAME, ENUM)
68#include "llvm/TargetParser/AMDGPUTargetParser.def"
74#define AMDGCN_GPU(NAME, ENUM, ISAVERSION, FEATURES) \
77#include "llvm/TargetParser/AMDGPUTargetParser.def"
85#define R600_GPU(NAME, ENUM, FEATURES) \
88#include "llvm/TargetParser/AMDGPUTargetParser.def"
97#define AMDGCN_GPU(NAME, ENUM, ISAVERSION, FEATURES) NAME,
98#define AMDGCN_GPU_ALIAS(NAME, ENUM) NAME,
99#include "llvm/TargetParser/AMDGPUTargetParser.def"
105#define R600_GPU(NAME, ENUM, FEATURES) NAME,
106#define R600_GPU_ALIAS(NAME, ENUM) NAME,
107#include "llvm/TargetParser/AMDGPUTargetParser.def"
114 if (GPU ==
"generic-hsa")
116 if (GPU ==
"generic")
122#define MAKE_ISAVERSION(A, B, C) {A, B, C}
123#define AMDGCN_GPU(NAME, ENUM, ISAVERSION, FEATURES) \
125 return MAKE_ISAVERSION ISAVERSION;
126#include "llvm/TargetParser/AMDGPUTargetParser.def"
127#undef MAKE_ISAVERSION
142static std::pair<FeatureError, StringRef>
146 const bool IsNullGPU = GPU.
empty();
147 const bool TargetHasWave32 = DefaultFeatures.
count(
"wavefrontsize32");
148 const bool TargetHasWave64 = DefaultFeatures.
count(
"wavefrontsize64");
150 auto Wave32Itr = Features.
find(
"wavefrontsize32");
151 auto Wave64Itr = Features.
find(
"wavefrontsize64");
152 const bool EnableWave32 =
153 Wave32Itr != Features.
end() && Wave32Itr->getValue();
154 const bool EnableWave64 =
155 Wave64Itr != Features.
end() && Wave64Itr->getValue();
156 const bool DisableWave32 =
157 Wave32Itr != Features.
end() && !Wave32Itr->getValue();
158 const bool DisableWave64 =
159 Wave64Itr != Features.
end() && !Wave64Itr->getValue();
161 if (EnableWave32 && EnableWave64)
163 "'+wavefrontsize32' and '+wavefrontsize64' are mutually exclusive"};
164 if (DisableWave32 && DisableWave64)
166 "'-wavefrontsize32' and '-wavefrontsize64' are mutually exclusive"};
169 if (TargetHasWave64) {
176 if (TargetHasWave32) {
186 if (!IsNullGPU && !EnableWave32 && !EnableWave64 && !TargetHasWave32 &&
188 Features.
insert(std::make_pair(
"wavefrontsize32",
true));
190 for (
const auto &Entry : DefaultFeatures) {
191 if (!Features.
count(Entry.getKey()))
192 Features[Entry.getKey()] = Entry.getValue();
207 Features[
"swmmac-gfx1200-insts"] =
true;
208 Features[
"swmmac-gfx1250-insts"] =
true;
211 Features[
"cube-insts"] =
true;
212 Features[
"cvt-pknorm-vop2-insts"] =
true;
213 Features[
"lerp-inst"] =
true;
214 Features[
"qsad-insts"] =
true;
215 Features[
"sad-insts"] =
true;
216 Features[
"msad-insts"] =
true;
217 Features[
"mqsad-pk-insts"] =
true;
218 Features[
"mqsad-insts"] =
true;
220 case GK_GFX12_5_GENERIC:
221 Features[
"ci-insts"] =
true;
222 Features[
"dot7-insts"] =
true;
223 Features[
"dot8-insts"] =
true;
224 Features[
"dl-insts"] =
true;
225 Features[
"16-bit-insts"] =
true;
226 Features[
"dpp"] =
true;
227 Features[
"gfx8-insts"] =
true;
228 Features[
"gfx9-insts"] =
true;
229 Features[
"gfx10-insts"] =
true;
230 Features[
"gfx10-3-insts"] =
true;
231 Features[
"gfx11-insts"] =
true;
232 Features[
"gfx12-insts"] =
true;
233 Features[
"gfx1250-insts"] =
true;
234 Features[
"bitop3-insts"] =
true;
235 Features[
"prng-inst"] =
true;
236 Features[
"tanh-insts"] =
true;
237 Features[
"tensor-cvt-lut-insts"] =
true;
238 Features[
"transpose-load-f4f6-insts"] =
true;
239 Features[
"bf16-trans-insts"] =
true;
240 Features[
"bf16-cvt-insts"] =
true;
241 Features[
"bf16-pk-insts"] =
true;
242 Features[
"fp8-conversion-insts"] =
true;
243 Features[
"fp8e5m3-insts"] =
true;
244 Features[
"permlane16-swap"] =
true;
245 Features[
"ashr-pk-insts"] =
true;
246 Features[
"add-min-max-insts"] =
true;
247 Features[
"pk-add-min-max-insts"] =
true;
248 Features[
"atomic-buffer-pk-add-bf16-inst"] =
true;
249 Features[
"vmem-pref-insts"] =
true;
250 Features[
"atomic-fadd-rtn-insts"] =
true;
251 Features[
"atomic-buffer-global-pk-add-f16-insts"] =
true;
252 Features[
"atomic-flat-pk-add-16-insts"] =
true;
253 Features[
"atomic-global-pk-add-bf16-inst"] =
true;
254 Features[
"atomic-ds-pk-add-16-insts"] =
true;
255 Features[
"setprio-inc-wg-inst"] =
true;
256 Features[
"s-wakeup-barrier-inst"] =
true;
257 Features[
"atomic-fmin-fmax-global-f32"] =
true;
258 Features[
"atomic-fmin-fmax-global-f64"] =
true;
259 Features[
"wavefrontsize32"] =
true;
260 Features[
"clusters"] =
true;
261 Features[
"mcast-load-insts"] =
true;
265 case GK_GFX12_GENERIC:
266 Features[
"ci-insts"] =
true;
267 Features[
"dot7-insts"] =
true;
268 Features[
"dot8-insts"] =
true;
269 Features[
"dot9-insts"] =
true;
270 Features[
"dot10-insts"] =
true;
271 Features[
"dot11-insts"] =
true;
272 Features[
"dot12-insts"] =
true;
273 Features[
"dl-insts"] =
true;
274 Features[
"atomic-ds-pk-add-16-insts"] =
true;
275 Features[
"atomic-flat-pk-add-16-insts"] =
true;
276 Features[
"atomic-buffer-global-pk-add-f16-insts"] =
true;
277 Features[
"atomic-buffer-pk-add-bf16-inst"] =
true;
278 Features[
"atomic-global-pk-add-bf16-inst"] =
true;
279 Features[
"16-bit-insts"] =
true;
280 Features[
"dpp"] =
true;
281 Features[
"gfx8-insts"] =
true;
282 Features[
"gfx9-insts"] =
true;
283 Features[
"gfx10-insts"] =
true;
284 Features[
"gfx10-3-insts"] =
true;
285 Features[
"gfx11-insts"] =
true;
286 Features[
"gfx12-insts"] =
true;
287 Features[
"atomic-fadd-rtn-insts"] =
true;
288 Features[
"image-insts"] =
true;
289 Features[
"cube-insts"] =
true;
290 Features[
"lerp-inst"] =
true;
291 Features[
"sad-insts"] =
true;
292 Features[
"qsad-insts"] =
true;
293 Features[
"msad-insts"] =
true;
294 Features[
"mqsad-pk-insts"] =
true;
295 Features[
"mqsad-insts"] =
true;
296 Features[
"cvt-pknorm-vop2-insts"] =
true;
297 Features[
"fp8-conversion-insts"] =
true;
298 Features[
"wmma-128b-insts"] =
true;
299 Features[
"swmmac-gfx1200-insts"] =
true;
300 Features[
"atomic-fmin-fmax-global-f32"] =
true;
305 Features[
"ci-insts"] =
true;
306 Features[
"dot7-insts"] =
true;
307 Features[
"dot8-insts"] =
true;
308 Features[
"dot9-insts"] =
true;
309 Features[
"dot10-insts"] =
true;
310 Features[
"dot12-insts"] =
true;
311 Features[
"dl-insts"] =
true;
312 Features[
"16-bit-insts"] =
true;
313 Features[
"dpp"] =
true;
314 Features[
"gfx8-insts"] =
true;
315 Features[
"gfx9-insts"] =
true;
316 Features[
"gfx10-insts"] =
true;
317 Features[
"gfx10-3-insts"] =
true;
318 Features[
"gfx11-insts"] =
true;
319 Features[
"atomic-fadd-rtn-insts"] =
true;
320 Features[
"image-insts"] =
true;
321 Features[
"cube-insts"] =
true;
322 Features[
"lerp-inst"] =
true;
323 Features[
"sad-insts"] =
true;
324 Features[
"qsad-insts"] =
true;
325 Features[
"msad-insts"] =
true;
326 Features[
"mqsad-pk-insts"] =
true;
327 Features[
"mqsad-insts"] =
true;
328 Features[
"cvt-pknorm-vop2-insts"] =
true;
329 Features[
"gws"] =
true;
330 Features[
"dot11-insts"] =
true;
331 Features[
"fp8-conversion-insts"] =
true;
332 Features[
"wmma-128b-insts"] =
true;
333 Features[
"swmmac-gfx1200-insts"] =
true;
334 Features[
"atomic-fmin-fmax-global-f32"] =
true;
344 case GK_GFX11_GENERIC:
345 Features[
"ci-insts"] =
true;
346 Features[
"dot5-insts"] =
true;
347 Features[
"dot7-insts"] =
true;
348 Features[
"dot8-insts"] =
true;
349 Features[
"dot9-insts"] =
true;
350 Features[
"dot10-insts"] =
true;
351 Features[
"dot12-insts"] =
true;
352 Features[
"dl-insts"] =
true;
353 Features[
"16-bit-insts"] =
true;
354 Features[
"dpp"] =
true;
355 Features[
"gfx8-insts"] =
true;
356 Features[
"gfx9-insts"] =
true;
357 Features[
"gfx10-insts"] =
true;
358 Features[
"gfx10-3-insts"] =
true;
359 Features[
"gfx11-insts"] =
true;
360 Features[
"atomic-fadd-rtn-insts"] =
true;
361 Features[
"image-insts"] =
true;
362 Features[
"cube-insts"] =
true;
363 Features[
"lerp-inst"] =
true;
364 Features[
"sad-insts"] =
true;
365 Features[
"qsad-insts"] =
true;
366 Features[
"msad-insts"] =
true;
367 Features[
"mqsad-pk-insts"] =
true;
368 Features[
"mqsad-insts"] =
true;
369 Features[
"cvt-pknorm-vop2-insts"] =
true;
370 Features[
"gws"] =
true;
371 Features[
"wmma-256b-insts"] =
true;
372 Features[
"atomic-fmin-fmax-global-f32"] =
true;
381 case GK_GFX10_3_GENERIC:
382 Features[
"ci-insts"] =
true;
383 Features[
"dot1-insts"] =
true;
384 Features[
"dot2-insts"] =
true;
385 Features[
"dot5-insts"] =
true;
386 Features[
"dot6-insts"] =
true;
387 Features[
"dot7-insts"] =
true;
388 Features[
"dot10-insts"] =
true;
389 Features[
"dl-insts"] =
true;
390 Features[
"16-bit-insts"] =
true;
391 Features[
"dpp"] =
true;
392 Features[
"gfx8-insts"] =
true;
393 Features[
"gfx9-insts"] =
true;
394 Features[
"gfx10-insts"] =
true;
395 Features[
"gfx10-3-insts"] =
true;
396 Features[
"image-insts"] =
true;
397 Features[
"s-memrealtime"] =
true;
398 Features[
"s-memtime-inst"] =
true;
399 Features[
"gws"] =
true;
400 Features[
"vmem-to-lds-load-insts"] =
true;
401 Features[
"atomic-fmin-fmax-global-f32"] =
true;
402 Features[
"atomic-fmin-fmax-global-f64"] =
true;
403 Features[
"cube-insts"] =
true;
404 Features[
"lerp-inst"] =
true;
405 Features[
"sad-insts"] =
true;
406 Features[
"qsad-insts"] =
true;
407 Features[
"msad-insts"] =
true;
408 Features[
"mqsad-pk-insts"] =
true;
409 Features[
"mqsad-insts"] =
true;
410 Features[
"cvt-pknorm-vop2-insts"] =
true;
414 Features[
"dot1-insts"] =
true;
415 Features[
"dot2-insts"] =
true;
416 Features[
"dot5-insts"] =
true;
417 Features[
"dot6-insts"] =
true;
418 Features[
"dot7-insts"] =
true;
419 Features[
"dot10-insts"] =
true;
423 case GK_GFX10_1_GENERIC:
424 Features[
"dl-insts"] =
true;
425 Features[
"ci-insts"] =
true;
426 Features[
"16-bit-insts"] =
true;
427 Features[
"dpp"] =
true;
428 Features[
"gfx8-insts"] =
true;
429 Features[
"gfx9-insts"] =
true;
430 Features[
"gfx10-insts"] =
true;
431 Features[
"image-insts"] =
true;
432 Features[
"s-memrealtime"] =
true;
433 Features[
"s-memtime-inst"] =
true;
434 Features[
"gws"] =
true;
435 Features[
"vmem-to-lds-load-insts"] =
true;
436 Features[
"atomic-fmin-fmax-global-f32"] =
true;
437 Features[
"atomic-fmin-fmax-global-f64"] =
true;
438 Features[
"cube-insts"] =
true;
439 Features[
"lerp-inst"] =
true;
440 Features[
"sad-insts"] =
true;
441 Features[
"qsad-insts"] =
true;
442 Features[
"msad-insts"] =
true;
443 Features[
"mqsad-pk-insts"] =
true;
444 Features[
"mqsad-insts"] =
true;
445 Features[
"cvt-pknorm-vop2-insts"] =
true;
448 Features[
"bitop3-insts"] =
true;
449 Features[
"fp6bf6-cvt-scale-insts"] =
true;
450 Features[
"fp4-cvt-scale-insts"] =
true;
451 Features[
"bf8-cvt-scale-insts"] =
true;
452 Features[
"fp8-cvt-scale-insts"] =
true;
453 Features[
"f16bf16-to-fp6bf6-cvt-scale-insts"] =
true;
454 Features[
"f32-to-f16bf16-cvt-sr-insts"] =
true;
455 Features[
"prng-inst"] =
true;
456 Features[
"permlane16-swap"] =
true;
457 Features[
"permlane32-swap"] =
true;
458 Features[
"ashr-pk-insts"] =
true;
459 Features[
"dot12-insts"] =
true;
460 Features[
"dot13-insts"] =
true;
461 Features[
"atomic-buffer-pk-add-bf16-inst"] =
true;
462 Features[
"gfx950-insts"] =
true;
465 Features[
"fp8-insts"] =
true;
466 Features[
"fp8-conversion-insts"] =
true;
467 if (Kind != GK_GFX950)
468 Features[
"xf32-insts"] =
true;
470 case GK_GFX9_4_GENERIC:
471 Features[
"gfx940-insts"] =
true;
472 Features[
"atomic-ds-pk-add-16-insts"] =
true;
473 Features[
"atomic-flat-pk-add-16-insts"] =
true;
474 Features[
"atomic-global-pk-add-bf16-inst"] =
true;
475 Features[
"gfx90a-insts"] =
true;
476 Features[
"atomic-buffer-global-pk-add-f16-insts"] =
true;
477 Features[
"atomic-fadd-rtn-insts"] =
true;
478 Features[
"dot3-insts"] =
true;
479 Features[
"dot4-insts"] =
true;
480 Features[
"dot5-insts"] =
true;
481 Features[
"dot6-insts"] =
true;
482 Features[
"mai-insts"] =
true;
483 Features[
"dl-insts"] =
true;
484 Features[
"dot1-insts"] =
true;
485 Features[
"dot2-insts"] =
true;
486 Features[
"dot7-insts"] =
true;
487 Features[
"dot10-insts"] =
true;
488 Features[
"gfx9-insts"] =
true;
489 Features[
"gfx8-insts"] =
true;
490 Features[
"16-bit-insts"] =
true;
491 Features[
"dpp"] =
true;
492 Features[
"s-memrealtime"] =
true;
493 Features[
"ci-insts"] =
true;
494 Features[
"s-memtime-inst"] =
true;
495 Features[
"gws"] =
true;
496 Features[
"vmem-to-lds-load-insts"] =
true;
497 Features[
"atomic-fmin-fmax-global-f64"] =
true;
498 Features[
"wavefrontsize64"] =
true;
499 Features[
"cube-insts"] =
true;
500 Features[
"lerp-inst"] =
true;
501 Features[
"sad-insts"] =
true;
502 Features[
"qsad-insts"] =
true;
503 Features[
"msad-insts"] =
true;
504 Features[
"mqsad-pk-insts"] =
true;
505 Features[
"mqsad-insts"] =
true;
506 Features[
"cvt-pknorm-vop2-insts"] =
true;
509 Features[
"gfx90a-insts"] =
true;
510 Features[
"atomic-buffer-global-pk-add-f16-insts"] =
true;
511 Features[
"atomic-fadd-rtn-insts"] =
true;
512 Features[
"atomic-fmin-fmax-global-f64"] =
true;
515 Features[
"dot3-insts"] =
true;
516 Features[
"dot4-insts"] =
true;
517 Features[
"dot5-insts"] =
true;
518 Features[
"dot6-insts"] =
true;
519 Features[
"mai-insts"] =
true;
522 Features[
"dl-insts"] =
true;
523 Features[
"dot1-insts"] =
true;
524 Features[
"dot2-insts"] =
true;
525 Features[
"dot7-insts"] =
true;
526 Features[
"dot10-insts"] =
true;
533 case GK_GFX9_GENERIC:
534 Features[
"gfx9-insts"] =
true;
535 Features[
"vmem-to-lds-load-insts"] =
true;
542 Features[
"gfx8-insts"] =
true;
543 Features[
"16-bit-insts"] =
true;
544 Features[
"dpp"] =
true;
545 Features[
"s-memrealtime"] =
true;
546 Features[
"ci-insts"] =
true;
547 Features[
"image-insts"] =
true;
548 Features[
"s-memtime-inst"] =
true;
549 Features[
"gws"] =
true;
550 Features[
"wavefrontsize64"] =
true;
551 Features[
"cube-insts"] =
true;
552 Features[
"lerp-inst"] =
true;
553 Features[
"sad-insts"] =
true;
554 Features[
"qsad-insts"] =
true;
555 Features[
"msad-insts"] =
true;
556 Features[
"mqsad-pk-insts"] =
true;
557 Features[
"mqsad-insts"] =
true;
558 Features[
"cvt-pknorm-vop2-insts"] =
true;
566 Features[
"ci-insts"] =
true;
567 Features[
"cube-insts"] =
true;
568 Features[
"lerp-inst"] =
true;
569 Features[
"sad-insts"] =
true;
570 Features[
"qsad-insts"] =
true;
571 Features[
"msad-insts"] =
true;
572 Features[
"mqsad-pk-insts"] =
true;
573 Features[
"mqsad-insts"] =
true;
574 Features[
"cvt-pknorm-vop2-insts"] =
true;
575 Features[
"image-insts"] =
true;
576 Features[
"s-memtime-inst"] =
true;
577 Features[
"gws"] =
true;
578 Features[
"atomic-fmin-fmax-global-f32"] =
true;
579 Features[
"atomic-fmin-fmax-global-f64"] =
true;
580 Features[
"wavefrontsize64"] =
true;
585 Features[
"image-insts"] =
true;
586 Features[
"s-memtime-inst"] =
true;
587 Features[
"gws"] =
true;
588 Features[
"atomic-fmin-fmax-global-f32"] =
true;
589 Features[
"atomic-fmin-fmax-global-f64"] =
true;
590 Features[
"wavefrontsize64"] =
true;
591 Features[
"cube-insts"] =
true;
592 Features[
"lerp-inst"] =
true;
593 Features[
"sad-insts"] =
true;
594 Features[
"msad-insts"] =
true;
595 Features[
"mqsad-pk-insts"] =
true;
596 Features[
"cvt-pknorm-vop2-insts"] =
true;
608std::pair<FeatureError, StringRef>
617 static const Triple AMDGCN(
"amdgcn-amd-amdhsa");
619 for (
auto &&GPU : GPUs) {
621 for (
auto &&[
F,
B] : Tmp)
624 Features[
"wavefrontsize32"] =
true;
625 Features[
"wavefrontsize64"] =
true;
626 }
else if (
T.isAMDGCN()) {
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static void fillAMDGCNFeatureMap(StringRef GPU, const Triple &T, StringMap< bool > &Features)
Fills Features map with default values for given target GPU.
static std::pair< FeatureError, StringRef > insertWaveSizeFeature(StringRef GPU, const Triple &T, const StringMap< bool > &DefaultFeatures, StringMap< bool > &Features)
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
This file defines the SmallVector class.
This file implements the StringSwitch template, which mimics a switch() statement whose cases are str...
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringMap - This is an unconventional map that is specialized for handling keys that are "strings",...
iterator find(StringRef Key)
size_type count(StringRef Key) const
count - Return 1 if the element is in the map, 0 otherwise.
bool insert(MapEntryTy *KeyValue)
insert - Insert the specified key/value pair into the map.
Represent a constant reference to a string, i.e.
constexpr bool empty() const
Check if the string is empty.
StringRef take_front(size_t N=1) const
Return a StringRef equal to 'this' but with only the first N elements remaining.
size_t find(char C, size_t From=0) const
Search for the first character C in the string.
bool ends_with(StringRef Suffix) const
Check if this string ends with the given Suffix.
StringRef drop_back(size_t N=1) const
Return a StringRef equal to 'this' but with the last N elements dropped.
A switch()-like statement whose cases are string literals.
Triple - Helper class for working with autoconf configuration names.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
LLVM_ABI StringRef getArchNameR600(GPUKind AK)
GPUKind
GPU kinds supported by the AMDGPU target.
@ GK_AMDGCN_GENERIC_FIRST
LLVM_ABI StringRef getCanonicalArchName(const Triple &T, StringRef Arch)
LLVM_ABI void fillValidArchListR600(SmallVectorImpl< StringRef > &Values)
LLVM_ABI StringRef getArchFamilyNameAMDGCN(GPUKind AK)
LLVM_ABI IsaVersion getIsaVersion(StringRef GPU)
LLVM_ABI void fillValidArchListAMDGCN(SmallVectorImpl< StringRef > &Values)
LLVM_ABI GPUKind parseArchAMDGCN(StringRef CPU)
@ UNSUPPORTED_TARGET_FEATURE
@ INVALID_FEATURE_COMBINATION
LLVM_ABI std::pair< FeatureError, StringRef > fillAMDGPUFeatureMap(StringRef GPU, const Triple &T, StringMap< bool > &Features)
Fills Features map with default values for given target GPU.
LLVM_ABI StringRef getArchNameAMDGCN(GPUKind AK)
LLVM_ABI unsigned getArchAttrAMDGCN(GPUKind AK)
LLVM_ABI unsigned getArchAttrR600(GPUKind AK)
LLVM_ABI GPUKind parseArchR600(StringRef CPU)
This is an optimization pass for GlobalISel generic memory operations.
Instruction set architecture version.