LLVM 23.0.0git
SPIRVLegalizerInfo.cpp
Go to the documentation of this file.
1//===- SPIRVLegalizerInfo.cpp --- SPIR-V Legalization Rules ------*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the targeting of the Machinelegalizer class for SPIR-V.
10//
11//===----------------------------------------------------------------------===//
12
13#include "SPIRVLegalizerInfo.h"
14#include "SPIRV.h"
15#include "SPIRVGlobalRegistry.h"
16#include "SPIRVSubtarget.h"
17#include "SPIRVUtils.h"
24#include "llvm/IR/IntrinsicsSPIRV.h"
25#include "llvm/Support/Debug.h"
27
28using namespace llvm;
29using namespace llvm::LegalizeActions;
30using namespace llvm::LegalityPredicates;
31
32#define DEBUG_TYPE "spirv-legalizer"
33
34LegalityPredicate typeOfExtendedScalars(unsigned TypeIdx, bool IsExtendedInts) {
35 return [IsExtendedInts, TypeIdx](const LegalityQuery &Query) {
36 const LLT Ty = Query.Types[TypeIdx];
37 return IsExtendedInts && Ty.isValid() && Ty.isScalar();
38 };
39}
40
42 using namespace TargetOpcode;
43
44 this->ST = &ST;
45 GR = ST.getSPIRVGlobalRegistry();
46
47 const LLT s1 = LLT::scalar(1);
48 const LLT s8 = LLT::scalar(8);
49 const LLT s16 = LLT::scalar(16);
50 const LLT s32 = LLT::scalar(32);
51 const LLT s64 = LLT::scalar(64);
52 const LLT s128 = LLT::scalar(128);
53
54 const LLT v16s64 = LLT::fixed_vector(16, 64);
55 const LLT v16s32 = LLT::fixed_vector(16, 32);
56 const LLT v16s16 = LLT::fixed_vector(16, 16);
57 const LLT v16s8 = LLT::fixed_vector(16, 8);
58 const LLT v16s1 = LLT::fixed_vector(16, 1);
59
60 const LLT v8s64 = LLT::fixed_vector(8, 64);
61 const LLT v8s32 = LLT::fixed_vector(8, 32);
62 const LLT v8s16 = LLT::fixed_vector(8, 16);
63 const LLT v8s8 = LLT::fixed_vector(8, 8);
64 const LLT v8s1 = LLT::fixed_vector(8, 1);
65
66 const LLT v4s64 = LLT::fixed_vector(4, 64);
67 const LLT v4s32 = LLT::fixed_vector(4, 32);
68 const LLT v4s16 = LLT::fixed_vector(4, 16);
69 const LLT v4s8 = LLT::fixed_vector(4, 8);
70 const LLT v4s1 = LLT::fixed_vector(4, 1);
71
72 const LLT v3s64 = LLT::fixed_vector(3, 64);
73 const LLT v3s32 = LLT::fixed_vector(3, 32);
74 const LLT v3s16 = LLT::fixed_vector(3, 16);
75 const LLT v3s8 = LLT::fixed_vector(3, 8);
76 const LLT v3s1 = LLT::fixed_vector(3, 1);
77
78 const LLT v2s64 = LLT::fixed_vector(2, 64);
79 const LLT v2s32 = LLT::fixed_vector(2, 32);
80 const LLT v2s16 = LLT::fixed_vector(2, 16);
81 const LLT v2s8 = LLT::fixed_vector(2, 8);
82 const LLT v2s1 = LLT::fixed_vector(2, 1);
83
84 const unsigned PSize = ST.getPointerSize();
85 const LLT p0 = LLT::pointer(0, PSize); // Function
86 const LLT p1 = LLT::pointer(1, PSize); // CrossWorkgroup
87 const LLT p2 = LLT::pointer(2, PSize); // UniformConstant
88 const LLT p3 = LLT::pointer(3, PSize); // Workgroup
89 const LLT p4 = LLT::pointer(4, PSize); // Generic
90 const LLT p5 =
91 LLT::pointer(5, PSize); // Input, SPV_INTEL_usm_storage_classes (Device)
92 const LLT p6 = LLT::pointer(6, PSize); // SPV_INTEL_usm_storage_classes (Host)
93 const LLT p7 = LLT::pointer(7, PSize); // Input
94 const LLT p8 = LLT::pointer(8, PSize); // Output
95 const LLT p9 =
96 LLT::pointer(9, PSize); // CodeSectionINTEL, SPV_INTEL_function_pointers
97 const LLT p10 = LLT::pointer(10, PSize); // Private
98 const LLT p11 = LLT::pointer(11, PSize); // StorageBuffer
99 const LLT p12 = LLT::pointer(12, PSize); // Uniform
100 const LLT p13 = LLT::pointer(13, PSize); // PushConstant
101
102 // TODO: remove copy-pasting here by using concatenation in some way.
103 auto allPtrsScalarsAndVectors = {
104 p0, p1, p2, p3, p4, p5, p6, p7, p8,
105 p9, p10, p11, p12, p13, s1, s8, s16, s32,
106 s64, s128, v2s1, v2s8, v2s16, v2s32, v2s64, v3s1, v3s8,
107 v3s16, v3s32, v3s64, v4s1, v4s8, v4s16, v4s32, v4s64, v8s1,
108 v8s8, v8s16, v8s32, v8s64, v16s1, v16s8, v16s16, v16s32, v16s64};
109
110 auto allVectors = {v2s1, v2s8, v2s16, v2s32, v2s64, v3s1, v3s8,
111 v3s16, v3s32, v3s64, v4s1, v4s8, v4s16, v4s32,
112 v4s64, v8s1, v8s8, v8s16, v8s32, v8s64, v16s1,
113 v16s8, v16s16, v16s32, v16s64};
114
115 auto allShaderVectors = {v2s1, v2s8, v2s16, v2s32, v2s64,
116 v3s1, v3s8, v3s16, v3s32, v3s64,
117 v4s1, v4s8, v4s16, v4s32, v4s64};
118
119 auto allScalars = {s1, s8, s16, s32, s64};
120
121 auto allScalarsAndVectors = {
122 s1, s8, s16, s32, s64, s128, v2s1, v2s8,
123 v2s16, v2s32, v2s64, v3s1, v3s8, v3s16, v3s32, v3s64,
124 v4s1, v4s8, v4s16, v4s32, v4s64, v8s1, v8s8, v8s16,
125 v8s32, v8s64, v16s1, v16s8, v16s16, v16s32, v16s64};
126
127 auto allIntScalarsAndVectors = {
128 s8, s16, s32, s64, s128, v2s8, v2s16, v2s32, v2s64,
129 v3s8, v3s16, v3s32, v3s64, v4s8, v4s16, v4s32, v4s64, v8s8,
130 v8s16, v8s32, v8s64, v16s8, v16s16, v16s32, v16s64};
131
132 auto allBoolScalarsAndVectors = {s1, v2s1, v3s1, v4s1, v8s1, v16s1};
133
134 auto allIntScalars = {s8, s16, s32, s64, s128};
135
136 auto allFloatScalarsAndF16Vector2AndVector4s = {s16, s32, s64, v2s16, v4s16};
137
138 auto allFloatScalars = {s16, s32, s64};
139
140 auto allFloatScalarsAndVectors = {
141 s16, s32, s64, v2s16, v2s32, v2s64, v3s16, v3s32, v3s64,
142 v4s16, v4s32, v4s64, v8s16, v8s32, v8s64, v16s16, v16s32, v16s64};
143
144 auto allShaderFloatVectors = {v2s16, v2s32, v2s64, v3s16, v3s32,
145 v3s64, v4s16, v4s32, v4s64};
146
147 auto allFloatVectors = {v2s16, v2s32, v2s64, v3s16, v3s32,
148 v3s64, v4s16, v4s32, v4s64, v8s16,
149 v8s32, v8s64, v16s16, v16s32, v16s64};
150
151 auto &allowedFloatVectorTypes =
152 ST.isShader() ? allShaderFloatVectors : allFloatVectors;
153
154 auto allFloatAndIntScalarsAndPtrs = {s8, s16, s32, s64, p0, p1,
155 p2, p3, p4, p5, p6, p7,
156 p8, p9, p10, p11, p12, p13};
157
158 auto allPtrs = {p0, p1, p2, p3, p4, p5, p6, p7, p8, p9, p10, p11, p12, p13};
159
160 auto &allowedVectorTypes = ST.isShader() ? allShaderVectors : allVectors;
161
162 bool IsExtendedInts =
163 ST.canUseExtension(
164 SPIRV::Extension::SPV_ALTERA_arbitrary_precision_integers) ||
165 ST.canUseExtension(SPIRV::Extension::SPV_KHR_bit_instructions) ||
166 ST.canUseExtension(SPIRV::Extension::SPV_INTEL_int4);
167 auto extendedScalarsAndVectors =
168 [IsExtendedInts](const LegalityQuery &Query) {
169 const LLT Ty = Query.Types[0];
170 return IsExtendedInts && Ty.isValid() && !Ty.isPointerOrPointerVector();
171 };
172 auto extendedScalarsAndVectorsProduct = [IsExtendedInts](
173 const LegalityQuery &Query) {
174 const LLT Ty1 = Query.Types[0], Ty2 = Query.Types[1];
175 return IsExtendedInts && Ty1.isValid() && Ty2.isValid() &&
176 !Ty1.isPointerOrPointerVector() && !Ty2.isPointerOrPointerVector();
177 };
178 auto extendedPtrsScalarsAndVectors =
179 [IsExtendedInts](const LegalityQuery &Query) {
180 const LLT Ty = Query.Types[0];
181 return IsExtendedInts && Ty.isValid();
182 };
183
184 // The universal validation rules in the SPIR-V specification state that
185 // vector sizes are typically limited to 2, 3, or 4. However, larger vector
186 // sizes (8 and 16) are enabled when the Kernel capability is present. For
187 // shader execution models, vector sizes are strictly limited to 4. In
188 // non-shader contexts, vector sizes of 8 and 16 are also permitted, but
189 // arbitrary sizes (e.g., 6 or 11) are not.
190 uint32_t MaxVectorSize = ST.isShader() ? 4 : 16;
191 LLVM_DEBUG(dbgs() << "MaxVectorSize: " << MaxVectorSize << "\n");
192
193 for (auto Opc : getTypeFoldingSupportedOpcodes()) {
194 switch (Opc) {
195 case G_EXTRACT_VECTOR_ELT:
196 case G_UREM:
197 case G_SREM:
198 case G_UDIV:
199 case G_SDIV:
200 case G_FREM:
201 break;
202 default:
204 .customFor(allScalars)
205 .customFor(allowedVectorTypes)
209 0, ElementCount::getFixed(MaxVectorSize)))
210 .custom();
211 break;
212 }
213 }
214
215 getActionDefinitionsBuilder({G_UREM, G_SREM, G_SDIV, G_UDIV, G_FREM})
216 .customFor(allScalars)
217 .customFor(allowedVectorTypes)
221 0, ElementCount::getFixed(MaxVectorSize)))
222 .custom();
223
224 getActionDefinitionsBuilder({G_FMA, G_STRICT_FMA})
225 .legalFor(allScalars)
226 .legalFor(allowedVectorTypes)
230 0, ElementCount::getFixed(MaxVectorSize)))
231 .alwaysLegal();
232
233 getActionDefinitionsBuilder(G_INTRINSIC_W_SIDE_EFFECTS).custom();
234
235 getActionDefinitionsBuilder(G_SHUFFLE_VECTOR)
236 .legalForCartesianProduct(allowedVectorTypes, allowedVectorTypes)
238 .lowerIf(vectorElementCountIsGreaterThan(0, MaxVectorSize))
240 .lowerIf(vectorElementCountIsGreaterThan(1, MaxVectorSize));
241
242 getActionDefinitionsBuilder(G_EXTRACT_VECTOR_ELT)
246 1, ElementCount::getFixed(MaxVectorSize)))
247 .custom();
248
249 getActionDefinitionsBuilder(G_INSERT_VECTOR_ELT)
253 0, ElementCount::getFixed(MaxVectorSize)))
254 .custom();
255
256 // Illegal G_UNMERGE_VALUES instructions should be handled
257 // during the combine phase.
258 getActionDefinitionsBuilder(G_BUILD_VECTOR)
260
261 // When entering the legalizer, there should be no G_BITCAST instructions.
262 // They should all be calls to the `spv_bitcast` intrinsic. The call to
263 // the intrinsic will be converted to a G_BITCAST during legalization if
264 // the vectors are not legal. After using the rules to legalize a G_BITCAST,
265 // we turn it back into a call to the intrinsic with a custom rule to avoid
266 // potential machine verifier failures.
272 0, ElementCount::getFixed(MaxVectorSize)))
273 .lowerIf(vectorElementCountIsGreaterThan(1, MaxVectorSize))
274 .custom();
275
276 // If the result is still illegal, the combiner should be able to remove it.
277 getActionDefinitionsBuilder(G_CONCAT_VECTORS)
278 .legalForCartesianProduct(allowedVectorTypes, allowedVectorTypes);
279
280 getActionDefinitionsBuilder(G_SPLAT_VECTOR)
281 .legalFor(allowedVectorTypes)
285 .alwaysLegal();
286
287 // Vector Reduction Operations
289 {G_VECREDUCE_SMIN, G_VECREDUCE_SMAX, G_VECREDUCE_UMIN, G_VECREDUCE_UMAX,
290 G_VECREDUCE_ADD, G_VECREDUCE_MUL, G_VECREDUCE_FMUL, G_VECREDUCE_FMIN,
291 G_VECREDUCE_FMAX, G_VECREDUCE_FMINIMUM, G_VECREDUCE_FMAXIMUM,
292 G_VECREDUCE_OR, G_VECREDUCE_AND, G_VECREDUCE_XOR})
293 .legalFor(allowedVectorTypes)
294 .scalarize(1)
295 .lower();
296
297 getActionDefinitionsBuilder({G_VECREDUCE_SEQ_FADD, G_VECREDUCE_SEQ_FMUL})
298 .scalarize(2)
299 .lower();
300
301 // Illegal G_UNMERGE_VALUES instructions should be handled
302 // during the combine phase.
303 getActionDefinitionsBuilder(G_UNMERGE_VALUES)
305
306 getActionDefinitionsBuilder({G_MEMCPY, G_MEMCPY_INLINE, G_MEMMOVE})
307 .unsupportedIf(LegalityPredicates::any(typeIs(0, p9), typeIs(1, p9)))
308 .legalIf(all(typeInSet(0, allPtrs), typeInSet(1, allPtrs)));
309
311 .unsupportedIf(typeIs(0, p9))
312 .legalIf(all(typeInSet(0, allPtrs), typeInSet(1, allIntScalars)));
313
314 getActionDefinitionsBuilder(G_ADDRSPACE_CAST)
315 .legalForCartesianProduct(allPtrs, allPtrs);
316
317 // Should we be legalizing bad scalar sizes like s5 here instead
318 // of handling them in the instruction selector?
319 getActionDefinitionsBuilder({G_LOAD, G_STORE})
320 .unsupportedIf(typeIs(1, p9))
321 .legalForCartesianProduct(allowedVectorTypes, allPtrs)
322 .legalForCartesianProduct(allPtrs, allPtrs)
323 .legalIf(isScalar(0))
324 .custom();
325
326 getActionDefinitionsBuilder({G_SMIN, G_SMAX, G_UMIN, G_UMAX, G_ABS,
327 G_BITREVERSE, G_SADDSAT, G_UADDSAT, G_SSUBSAT,
328 G_USUBSAT, G_SCMP, G_UCMP})
329 .legalFor(allIntScalarsAndVectors)
330 .legalIf(extendedScalarsAndVectors);
331
332 getActionDefinitionsBuilder(G_STRICT_FLDEXP)
333 .legalForCartesianProduct(allFloatScalarsAndVectors, allIntScalars);
334
335 getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
336 .legalForCartesianProduct(allIntScalarsAndVectors,
337 allFloatScalarsAndVectors);
338
339 getActionDefinitionsBuilder({G_FPTOSI_SAT, G_FPTOUI_SAT})
340 .legalForCartesianProduct(allIntScalarsAndVectors,
341 allFloatScalarsAndVectors);
342
343 getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
344 .legalForCartesianProduct(allFloatScalarsAndVectors,
345 allScalarsAndVectors);
346
348 .legalForCartesianProduct(allIntScalarsAndVectors)
349 .legalIf(extendedScalarsAndVectorsProduct);
350
351 // Extensions.
352 getActionDefinitionsBuilder({G_TRUNC, G_ZEXT, G_SEXT, G_ANYEXT})
353 .legalForCartesianProduct(allScalarsAndVectors)
354 .legalIf(extendedScalarsAndVectorsProduct);
355
357 .legalFor(allPtrsScalarsAndVectors)
358 .legalIf(extendedPtrsScalarsAndVectors);
359
361 all(typeInSet(0, allPtrsScalarsAndVectors),
362 typeInSet(1, allPtrsScalarsAndVectors)));
363
364 getActionDefinitionsBuilder({G_IMPLICIT_DEF, G_FREEZE})
365 .legalFor({s1, s128})
366 .legalFor(allFloatAndIntScalarsAndPtrs)
367 .legalFor(allowedVectorTypes)
368 .legalIf([](const LegalityQuery &Query) {
369 return Query.Types[0].isPointerVector();
370 })
371 .moreElementsToNextPow2(0)
372 .fewerElementsIf(vectorElementCountIsGreaterThan(0, MaxVectorSize),
374 0, ElementCount::getFixed(MaxVectorSize)));
375
376 getActionDefinitionsBuilder({G_STACKSAVE, G_STACKRESTORE}).alwaysLegal();
377
379 .legalForCartesianProduct(allPtrs, allIntScalars)
380 .legalIf(
381 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)))
382 .legalIf([](const LegalityQuery &Query) {
383 const LLT DstTy = Query.Types[0];
384 const LLT SrcTy = Query.Types[1];
385 return DstTy.isPointerVector() && SrcTy.isVector() &&
386 !SrcTy.isPointer() &&
387 DstTy.getNumElements() == SrcTy.getNumElements();
388 });
390 .legalForCartesianProduct(allIntScalars, allPtrs)
391 .legalIf(
392 all(typeOfExtendedScalars(0, IsExtendedInts), typeInSet(1, allPtrs)))
393 .legalIf([](const LegalityQuery &Query) {
394 const LLT DstTy = Query.Types[0];
395 const LLT SrcTy = Query.Types[1];
396 return SrcTy.isPointerVector() && DstTy.isVector() &&
397 !DstTy.isPointer() &&
398 DstTy.getNumElements() == SrcTy.getNumElements();
399 });
401 .legalForCartesianProduct(allPtrs, allIntScalars)
402 .legalIf(
403 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)));
404
406 .legalForCartesianProduct(allPtrs, allIntScalars)
407 .legalIf(
408 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)))
409 .legalIf([](const LegalityQuery &Query) {
410 const LLT PtrTy = Query.Types[0];
411 const LLT MaskTy = Query.Types[1];
412 return PtrTy.isPointerVector() && MaskTy.isVector() &&
413 !MaskTy.isPointer() &&
414 PtrTy.getNumElements() == MaskTy.getNumElements();
415 });
416
417 // ST.canDirectlyComparePointers() for pointer args is supported in
418 // legalizeCustom().
421 all(typeIs(0, p9), typeInSet(1, allPtrs), typeIsNot(1, p9)),
422 all(typeInSet(0, allPtrs), typeIsNot(0, p9), typeIs(1, p9))))
423 .legalIf([IsExtendedInts](const LegalityQuery &Query) {
424 const LLT Ty = Query.Types[1];
425 return IsExtendedInts && Ty.isValid() && !Ty.isPointerOrPointerVector();
426 })
427 .customIf(all(typeInSet(0, allBoolScalarsAndVectors),
428 typeInSet(1, allPtrsScalarsAndVectors)));
429
431 all(typeInSet(0, allBoolScalarsAndVectors),
432 typeInSet(1, allFloatScalarsAndVectors)));
433
434 getActionDefinitionsBuilder({G_ATOMICRMW_OR, G_ATOMICRMW_ADD, G_ATOMICRMW_AND,
435 G_ATOMICRMW_MAX, G_ATOMICRMW_MIN,
436 G_ATOMICRMW_SUB, G_ATOMICRMW_XOR,
437 G_ATOMICRMW_UMAX, G_ATOMICRMW_UMIN})
438 .legalForCartesianProduct(allIntScalars, allPtrs);
439
441 {G_ATOMICRMW_FADD, G_ATOMICRMW_FSUB, G_ATOMICRMW_FMIN, G_ATOMICRMW_FMAX})
442 .legalForCartesianProduct(allFloatScalarsAndF16Vector2AndVector4s,
443 allPtrs);
444
445 getActionDefinitionsBuilder(G_ATOMICRMW_XCHG)
446 .legalForCartesianProduct(allFloatAndIntScalarsAndPtrs, allPtrs);
447
448 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG_WITH_SUCCESS).lower();
449 // TODO: add proper legalization rules.
450 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG).alwaysLegal();
451
452 getActionDefinitionsBuilder({G_UADDO, G_USUBO, G_UMULO, G_SMULO})
453 .alwaysLegal();
454
455 getActionDefinitionsBuilder({G_SADDO, G_SSUBO}).lower();
456
457 getActionDefinitionsBuilder({G_LROUND, G_LLROUND})
458 .legalForCartesianProduct(allFloatScalarsAndVectors,
459 allIntScalarsAndVectors);
460
461 // FP conversions.
462 getActionDefinitionsBuilder({G_FPTRUNC, G_FPEXT})
463 .legalForCartesianProduct(allFloatScalarsAndVectors);
464
465 // Pointer-handling.
466 getActionDefinitionsBuilder(G_FRAME_INDEX).legalFor({p0});
467
468 getActionDefinitionsBuilder(G_GLOBAL_VALUE).legalFor(allPtrs);
469
470 // Control-flow. In some cases (e.g. constants) s1 may be promoted to s32.
472 getActionDefinitionsBuilder(G_BRCOND).legalFor({s1, s32});
473
475 allFloatScalarsAndVectors, {s32, v2s32, v3s32, v4s32, v8s32, v16s32});
476
477 // TODO: Review the target OpenCL and GLSL Extended Instruction Set specs to
478 // tighten these requirements. Many of these math functions are only legal on
479 // specific bitwidths, so they are not selectable for
480 // allFloatScalarsAndVectors.
481 // clang-format off
482 getActionDefinitionsBuilder({G_STRICT_FSQRT,
483 G_FPOW,
484 G_FEXP,
485 G_FMODF,
486 G_FSINCOS,
487 G_FEXP2,
488 G_FEXP10,
489 G_FLOG,
490 G_FLOG2,
491 G_FLOG10,
492 G_FABS,
493 G_FMINNUM,
494 G_FMAXNUM,
495 G_FCEIL,
496 G_FCOS,
497 G_FSIN,
498 G_FTAN,
499 G_FACOS,
500 G_FASIN,
501 G_FATAN,
502 G_FATAN2,
503 G_FCOSH,
504 G_FSINH,
505 G_FTANH,
506 G_FSQRT,
507 G_FFLOOR,
508 G_FRINT,
509 G_FNEARBYINT,
510 G_INTRINSIC_ROUND,
511 G_INTRINSIC_TRUNC,
512 G_FMINIMUM,
513 G_FMAXIMUM,
514 G_INTRINSIC_ROUNDEVEN})
515 .legalFor(allFloatScalars)
516 .legalFor(allowedFloatVectorTypes)
520 0, ElementCount::getFixed(MaxVectorSize)));
521 // clang-format on
522
523 getActionDefinitionsBuilder(G_FCOPYSIGN)
524 .legalForCartesianProduct(allFloatScalarsAndVectors,
525 allFloatScalarsAndVectors);
526
528 allFloatScalarsAndVectors, allIntScalarsAndVectors);
529
530 if (ST.canUseExtInstSet(SPIRV::InstructionSet::OpenCL_std)) {
532 {G_CTTZ, G_CTTZ_ZERO_POISON, G_CTLZ, G_CTLZ_ZERO_POISON})
533 .legalForCartesianProduct(allIntScalarsAndVectors,
534 allIntScalarsAndVectors);
535
536 // Struct return types become a single scalar, so cannot easily legalize.
537 getActionDefinitionsBuilder({G_SMULH, G_UMULH}).alwaysLegal();
538 }
539
540 getActionDefinitionsBuilder(G_IS_FPCLASS).custom();
541
542 getActionDefinitionsBuilder({G_INTRINSIC, G_INTRINSIC_CONVERGENT,
543 G_INTRINSIC_CONVERGENT_W_SIDE_EFFECTS})
544 .alwaysLegal();
546 getActionDefinitionsBuilder({G_TRAP, G_DEBUGTRAP, G_UBSANTRAP}).alwaysLegal();
547
549 verify(*ST.getInstrInfo());
550}
551
554 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
555 Register DstReg = MI.getOperand(0).getReg();
556 Register SrcReg = MI.getOperand(1).getReg();
557 Register IdxReg = MI.getOperand(2).getReg();
558
559 MIRBuilder
560 .buildIntrinsic(Intrinsic::spv_extractelt, ArrayRef<Register>{DstReg})
561 .addUse(SrcReg)
562 .addUse(IdxReg);
563 MI.eraseFromParent();
564 return true;
565}
566
569 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
570 Register DstReg = MI.getOperand(0).getReg();
571 Register SrcReg = MI.getOperand(1).getReg();
572 Register ValReg = MI.getOperand(2).getReg();
573 Register IdxReg = MI.getOperand(3).getReg();
574
575 MIRBuilder
576 .buildIntrinsic(Intrinsic::spv_insertelt, ArrayRef<Register>{DstReg})
577 .addUse(SrcReg)
578 .addUse(ValReg)
579 .addUse(IdxReg);
580 MI.eraseFromParent();
581 return true;
582}
583
585 LegalizerHelper &Helper,
588 Register ConvReg = MRI.createGenericVirtualRegister(ConvTy);
589 MRI.setRegClass(ConvReg, GR->getRegClass(SpvType));
590 GR->assignSPIRVTypeToVReg(SpvType, ConvReg, Helper.MIRBuilder.getMF());
591 Helper.MIRBuilder.buildInstr(TargetOpcode::G_PTRTOINT)
592 .addDef(ConvReg)
593 .addUse(Reg);
594 return ConvReg;
595}
596
597static bool needsVectorLegalization(const LLT &Ty, const SPIRVSubtarget &ST) {
598 if (!Ty.isVector())
599 return false;
600 unsigned NumElements = Ty.getNumElements();
601 unsigned MaxVectorSize = ST.isShader() ? 4 : 16;
602 return (NumElements > 4 && !isPowerOf2_32(NumElements)) ||
603 NumElements > MaxVectorSize;
604}
605
608 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
609 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
610 Register DstReg = MI.getOperand(0).getReg();
611 Register PtrReg = MI.getOperand(1).getReg();
612 LLT DstTy = MRI.getType(DstReg);
613
614 if (!DstTy.isVector())
615 return true;
616
617 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
618 if (!needsVectorLegalization(DstTy, ST))
619 return true;
620
621 SmallVector<Register, 8> SplitRegs;
622 LLT EltTy = DstTy.getElementType();
623 unsigned NumElts = DstTy.getNumElements();
624
625 LLT PtrTy = MRI.getType(PtrReg);
626 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
627
628 for (unsigned i = 0; i < NumElts; ++i) {
629 auto Idx = MIRBuilder.buildConstant(LLT::scalar(32), i);
630 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
631
632 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
633 .addImm(1) // InBounds
634 .addUse(PtrReg)
635 .addUse(Zero.getReg(0))
636 .addUse(Idx.getReg(0));
637
638 MachinePointerInfo EltPtrInfo;
639 Align EltAlign = Align(1);
640 if (!MI.memoperands_empty()) {
641 MachineMemOperand *MMO = *MI.memoperands_begin();
642 EltPtrInfo =
643 MMO->getPointerInfo().getWithOffset(i * EltTy.getSizeInBytes());
644 EltAlign = commonAlignment(MMO->getAlign(), i * EltTy.getSizeInBytes());
645 }
646
647 Register EltReg = MRI.createGenericVirtualRegister(EltTy);
648 MIRBuilder.buildLoad(EltReg, EltPtr, EltPtrInfo, EltAlign);
649 SplitRegs.push_back(EltReg);
650 }
651
652 MIRBuilder.buildBuildVector(DstReg, SplitRegs);
653 MI.eraseFromParent();
654 return true;
655}
656
659 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
660 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
661 Register ValReg = MI.getOperand(0).getReg();
662 Register PtrReg = MI.getOperand(1).getReg();
663 LLT ValTy = MRI.getType(ValReg);
664
665 assert(ValTy.isVector() && "Expected vector store");
666
667 SmallVector<Register, 8> SplitRegs;
668 LLT EltTy = ValTy.getElementType();
669 unsigned NumElts = ValTy.getNumElements();
670
671 for (unsigned i = 0; i < NumElts; ++i)
672 SplitRegs.push_back(MRI.createGenericVirtualRegister(EltTy));
673
674 MIRBuilder.buildUnmerge(SplitRegs, ValReg);
675
676 LLT PtrTy = MRI.getType(PtrReg);
677 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
678
679 for (unsigned i = 0; i < NumElts; ++i) {
680 auto Idx = MIRBuilder.buildConstant(LLT::scalar(32), i);
681 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
682
683 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
684 .addImm(1) // InBounds
685 .addUse(PtrReg)
686 .addUse(Zero.getReg(0))
687 .addUse(Idx.getReg(0));
688
689 MachinePointerInfo EltPtrInfo;
690 Align EltAlign = Align(1);
691 if (!MI.memoperands_empty()) {
692 MachineMemOperand *MMO = *MI.memoperands_begin();
693 EltPtrInfo =
694 MMO->getPointerInfo().getWithOffset(i * EltTy.getSizeInBytes());
695 EltAlign = commonAlignment(MMO->getAlign(), i * EltTy.getSizeInBytes());
696 }
697
698 MIRBuilder.buildStore(SplitRegs[i], EltPtr, EltPtrInfo, EltAlign);
699 }
700
701 MI.eraseFromParent();
702 return true;
703}
704
707 LostDebugLocObserver &LocObserver) const {
708 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
709 switch (MI.getOpcode()) {
710 default:
711 // TODO: implement legalization for other opcodes.
712 return true;
713 case TargetOpcode::G_BITCAST:
714 return legalizeBitcast(Helper, MI);
715 case TargetOpcode::G_EXTRACT_VECTOR_ELT:
716 return legalizeExtractVectorElt(Helper, MI, GR);
717 case TargetOpcode::G_INSERT_VECTOR_ELT:
718 return legalizeInsertVectorElt(Helper, MI, GR);
719 case TargetOpcode::G_INTRINSIC:
720 case TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS:
721 return legalizeIntrinsic(Helper, MI);
722 case TargetOpcode::G_IS_FPCLASS:
723 return legalizeIsFPClass(Helper, MI, LocObserver);
724 case TargetOpcode::G_ICMP: {
725 auto &Op0 = MI.getOperand(2);
726 auto &Op1 = MI.getOperand(3);
727 Register Reg0 = Op0.getReg();
728 Register Reg1 = Op1.getReg();
730 static_cast<CmpInst::Predicate>(MI.getOperand(1).getPredicate());
731 if ((!ST->canDirectlyComparePointers() ||
733 MRI.getType(Reg0).isPointer() && MRI.getType(Reg1).isPointer()) {
734 LLT ConvT = LLT::scalar(ST->getPointerSize());
735 Type *LLVMTy = IntegerType::get(MI.getMF()->getFunction().getContext(),
736 ST->getPointerSize());
737 SPIRVTypeInst SpirvTy = GR->getOrCreateSPIRVType(
738 LLVMTy, Helper.MIRBuilder, SPIRV::AccessQualifier::ReadWrite, true);
739 Op0.setReg(convertPtrToInt(Reg0, ConvT, SpirvTy, Helper, MRI, GR));
740 Op1.setReg(convertPtrToInt(Reg1, ConvT, SpirvTy, Helper, MRI, GR));
741 }
742 return true;
743 }
744 case TargetOpcode::G_LOAD:
745 return legalizeLoad(Helper, MI, GR);
746 case TargetOpcode::G_STORE:
747 return legalizeStore(Helper, MI, GR);
748 }
749}
750
753 Register SrcReg, LLT SrcTy,
754 MachinePointerInfo &PtrInfo, Align &VecAlign) {
755 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
756 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
757
758 VecAlign = Helper.getStackTemporaryAlignment(SrcTy);
759 auto StackTemp = Helper.createStackTemporary(
760 TypeSize::getFixed(SrcTy.getSizeInBytes()), VecAlign, PtrInfo);
761
762 // Set the type of StackTemp to a pointer to an array of the element type.
763 SPIRVTypeInst SpvSrcTy = GR->getSPIRVTypeForVReg(SrcReg);
764 SPIRVTypeInst EltSpvTy = GR->getScalarOrVectorComponentType(SpvSrcTy);
765 const Type *LLVMEltTy = GR->getTypeForSPIRVType(EltSpvTy);
766 const Type *LLVMArrTy =
767 ArrayType::get(const_cast<Type *>(LLVMEltTy), SrcTy.getNumElements());
768 SPIRVTypeInst ArrSpvTy = GR->getOrCreateSPIRVType(
769 LLVMArrTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite, true);
770 SPIRVTypeInst PtrToArrSpvTy = GR->getOrCreateSPIRVPointerType(
771 ArrSpvTy, MIRBuilder, SPIRV::StorageClass::Function);
772
773 Register StackReg = StackTemp.getReg(0);
774 MRI.setRegClass(StackReg, GR->getRegClass(PtrToArrSpvTy));
775 GR->assignSPIRVTypeToVReg(PtrToArrSpvTy, StackReg, MIRBuilder.getMF());
776
777 return StackTemp;
778}
779
782 LLVM_DEBUG(dbgs() << "Found a bitcast instruction\n");
783 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
784 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
785 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
786
787 Register DstReg = MI.getOperand(0).getReg();
788 Register SrcReg = MI.getOperand(2).getReg();
789 LLT DstTy = MRI.getType(DstReg);
790 LLT SrcTy = MRI.getType(SrcReg);
791
792 // If an spv_bitcast needs to be legalized, we convert it to G_BITCAST to
793 // allow using the generic legalization rules.
794 if (needsVectorLegalization(DstTy, ST) ||
795 needsVectorLegalization(SrcTy, ST)) {
796 LLVM_DEBUG(dbgs() << "Replacing with a G_BITCAST\n");
797 MIRBuilder.buildBitcast(DstReg, SrcReg);
798 MI.eraseFromParent();
799 }
800 return true;
801}
802
805 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
806 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
807 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
808
809 Register DstReg = MI.getOperand(0).getReg();
810 LLT DstTy = MRI.getType(DstReg);
811
812 if (needsVectorLegalization(DstTy, ST)) {
813 Register SrcReg = MI.getOperand(2).getReg();
814 Register ValReg = MI.getOperand(3).getReg();
815 LLT SrcTy = MRI.getType(SrcReg);
816 MachineOperand &IdxOperand = MI.getOperand(4);
817
818 if (getImm(IdxOperand, &MRI)) {
819 uint64_t IdxVal = foldImm(IdxOperand, &MRI);
820 if (IdxVal < SrcTy.getNumElements()) {
822 SPIRVTypeInst ElementType =
824 LLT ElementLLTTy = GR->getRegType(ElementType);
825 for (unsigned I = 0, E = SrcTy.getNumElements(); I < E; ++I) {
826 Register Reg = MRI.createGenericVirtualRegister(ElementLLTTy);
827 MRI.setRegClass(Reg, GR->getRegClass(ElementType));
828 GR->assignSPIRVTypeToVReg(ElementType, Reg, *MI.getMF());
829 Regs.push_back(Reg);
830 }
831 MIRBuilder.buildUnmerge(Regs, SrcReg);
832 Regs[IdxVal] = ValReg;
833 MIRBuilder.buildBuildVector(DstReg, Regs);
834 MI.eraseFromParent();
835 return true;
836 }
837 }
838
839 LLT EltTy = SrcTy.getElementType();
840 Align VecAlign;
841 MachinePointerInfo PtrInfo;
842 auto StackTemp = createStackTemporaryForVector(Helper, GR, SrcReg, SrcTy,
843 PtrInfo, VecAlign);
844
845 MIRBuilder.buildStore(SrcReg, StackTemp, PtrInfo, VecAlign);
846
847 Register IdxReg = IdxOperand.getReg();
848 LLT PtrTy = MRI.getType(StackTemp.getReg(0));
849 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
850 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
851
852 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
853 .addImm(1) // InBounds
854 .addUse(StackTemp.getReg(0))
855 .addUse(Zero.getReg(0))
856 .addUse(IdxReg);
857
859 Align EltAlign = Helper.getStackTemporaryAlignment(EltTy);
860 MIRBuilder.buildStore(ValReg, EltPtr, EltPtrInfo, EltAlign);
861
862 MIRBuilder.buildLoad(DstReg, StackTemp, PtrInfo, VecAlign);
863 MI.eraseFromParent();
864 return true;
865 }
866 return true;
867}
868
871 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
872 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
873 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
874
875 Register SrcReg = MI.getOperand(2).getReg();
876 LLT SrcTy = MRI.getType(SrcReg);
877
878 if (needsVectorLegalization(SrcTy, ST)) {
879 Register DstReg = MI.getOperand(0).getReg();
880 MachineOperand &IdxOperand = MI.getOperand(3);
881
882 if (getImm(IdxOperand, &MRI)) {
883 uint64_t IdxVal = foldImm(IdxOperand, &MRI);
884 if (IdxVal < SrcTy.getNumElements()) {
885 LLT DstTy = MRI.getType(DstReg);
887 SPIRVTypeInst DstSpvTy = GR->getSPIRVTypeForVReg(DstReg);
888 for (unsigned I = 0, E = SrcTy.getNumElements(); I < E; ++I) {
889 if (I == IdxVal) {
890 Regs.push_back(DstReg);
891 } else {
893 MRI.setRegClass(Reg, GR->getRegClass(DstSpvTy));
894 GR->assignSPIRVTypeToVReg(DstSpvTy, Reg, *MI.getMF());
895 Regs.push_back(Reg);
896 }
897 }
898 MIRBuilder.buildUnmerge(Regs, SrcReg);
899 MI.eraseFromParent();
900 return true;
901 }
902 }
903
904 LLT EltTy = SrcTy.getElementType();
905 Align VecAlign;
906 MachinePointerInfo PtrInfo;
907 auto StackTemp = createStackTemporaryForVector(Helper, GR, SrcReg, SrcTy,
908 PtrInfo, VecAlign);
909
910 MIRBuilder.buildStore(SrcReg, StackTemp, PtrInfo, VecAlign);
911
912 Register IdxReg = IdxOperand.getReg();
913 LLT PtrTy = MRI.getType(StackTemp.getReg(0));
914 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
915 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
916
917 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
918 .addImm(1) // InBounds
919 .addUse(StackTemp.getReg(0))
920 .addUse(Zero.getReg(0))
921 .addUse(IdxReg);
922
924 Align EltAlign = Helper.getStackTemporaryAlignment(EltTy);
925 MIRBuilder.buildLoad(DstReg, EltPtr, EltPtrInfo, EltAlign);
926
927 MI.eraseFromParent();
928 return true;
929 }
930 return true;
931}
932
935 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
936 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
937 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
938
939 Register DstReg = MI.getOperand(0).getReg();
940 LLT DstTy = MRI.getType(DstReg);
941
942 if (!needsVectorLegalization(DstTy, ST))
943 return true;
944
946 if (MI.getNumOperands() == 2) {
947 // The "null" case: no values are attached.
948 LLT EltTy = DstTy.getElementType();
949 auto Zero = MIRBuilder.buildConstant(EltTy, 0);
950 SPIRVTypeInst SpvDstTy = GR->getSPIRVTypeForVReg(DstReg);
951 SPIRVTypeInst SpvEltTy = GR->getScalarOrVectorComponentType(SpvDstTy);
952 GR->assignSPIRVTypeToVReg(SpvEltTy, Zero.getReg(0), MIRBuilder.getMF());
953 for (unsigned i = 0; i < DstTy.getNumElements(); ++i)
954 SrcRegs.push_back(Zero.getReg(0));
955 } else {
956 for (unsigned i = 2; i < MI.getNumOperands(); ++i) {
957 SrcRegs.push_back(MI.getOperand(i).getReg());
958 }
959 }
960 MIRBuilder.buildBuildVector(DstReg, SrcRegs);
961 MI.eraseFromParent();
962 return true;
963}
964
966 MachineInstr &MI) const {
967 LLVM_DEBUG(dbgs() << "legalizeIntrinsic: " << MI);
968 auto IntrinsicID = cast<GIntrinsic>(MI).getIntrinsicID();
969 switch (IntrinsicID) {
970 case Intrinsic::spv_bitcast:
971 return legalizeSpvBitcast(Helper, MI, GR);
972 case Intrinsic::spv_insertelt:
973 return legalizeSpvInsertElt(Helper, MI, GR);
974 case Intrinsic::spv_extractelt:
975 return legalizeSpvExtractElt(Helper, MI, GR);
976 case Intrinsic::spv_const_composite:
977 return legalizeSpvConstComposite(Helper, MI, GR);
978 }
979 return true;
980}
981
982bool SPIRVLegalizerInfo::legalizeBitcast(LegalizerHelper &Helper,
983 MachineInstr &MI) const {
984 // Once the G_BITCAST is using vectors that are allowed, we turn it back into
985 // an spv_bitcast to avoid verifier problems when the register types are the
986 // same for the source and the result. Note that the SPIR-V types associated
987 // with the bitcast can be different even if the register types are the same.
988 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
989 Register DstReg = MI.getOperand(0).getReg();
990 Register SrcReg = MI.getOperand(1).getReg();
991 SmallVector<Register, 1> DstRegs = {DstReg};
992 MIRBuilder.buildIntrinsic(Intrinsic::spv_bitcast, DstRegs).addUse(SrcReg);
993 MI.eraseFromParent();
994 return true;
995}
996
997// Note this code was copied from LegalizerHelper::lowerISFPCLASS and adjusted
998// to ensure that all instructions created during the lowering have SPIR-V types
999// assigned to them.
1000bool SPIRVLegalizerInfo::legalizeIsFPClass(
1002 LostDebugLocObserver &LocObserver) const {
1003 auto [DstReg, DstTy, SrcReg, SrcTy] = MI.getFirst2RegLLTs();
1004 FPClassTest Mask = static_cast<FPClassTest>(MI.getOperand(2).getImm());
1005
1006 auto &MIRBuilder = Helper.MIRBuilder;
1007 auto &MF = MIRBuilder.getMF();
1008 MachineRegisterInfo &MRI = MF.getRegInfo();
1009
1010 Type *LLVMDstTy =
1011 IntegerType::get(MIRBuilder.getContext(), DstTy.getScalarSizeInBits());
1012 if (DstTy.isVector())
1013 LLVMDstTy = VectorType::get(LLVMDstTy, DstTy.getElementCount());
1014 SPIRVTypeInst SPIRVDstTy = GR->getOrCreateSPIRVType(
1015 LLVMDstTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite,
1016 /*EmitIR*/ true);
1017
1018 unsigned BitSize = SrcTy.getScalarSizeInBits();
1019 const fltSemantics &Semantics = getFltSemanticForLLT(SrcTy.getScalarType());
1020
1021 LLT IntTy = LLT::scalar(BitSize);
1022 Type *LLVMIntTy = IntegerType::get(MIRBuilder.getContext(), BitSize);
1023 if (SrcTy.isVector()) {
1024 IntTy = LLT::vector(SrcTy.getElementCount(), IntTy);
1025 LLVMIntTy = VectorType::get(LLVMIntTy, SrcTy.getElementCount());
1026 }
1027 SPIRVTypeInst SPIRVIntTy = GR->getOrCreateSPIRVType(
1028 LLVMIntTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite,
1029 /*EmitIR*/ true);
1030
1031 // Clang doesn't support capture of structured bindings:
1032 LLT DstTyCopy = DstTy;
1033 const auto assignSPIRVTy = [&](MachineInstrBuilder &&MI) {
1034 // Assign this MI's (assumed only) destination to one of the two types we
1035 // expect: either the G_IS_FPCLASS's destination type, or the integer type
1036 // bitcast from the source type.
1037 LLT MITy = MRI.getType(MI.getReg(0));
1038 assert((MITy == IntTy || MITy == DstTyCopy) &&
1039 "Unexpected LLT type while lowering G_IS_FPCLASS");
1040 SPIRVTypeInst SPVTy = MITy == IntTy ? SPIRVIntTy : SPIRVDstTy;
1041 GR->assignSPIRVTypeToVReg(SPVTy, MI.getReg(0), MF);
1042 return MI;
1043 };
1044
1045 // Helper to build and assign a constant in one go
1046 const auto buildSPIRVConstant = [&](LLT Ty, auto &&C) -> MachineInstrBuilder {
1047 if (!Ty.isFixedVector())
1048 return assignSPIRVTy(MIRBuilder.buildConstant(Ty, C));
1049 auto ScalarC = MIRBuilder.buildConstant(Ty.getScalarType(), C);
1050 assert((Ty == IntTy || Ty == DstTyCopy) &&
1051 "Unexpected LLT type while lowering constant for G_IS_FPCLASS");
1052 SPIRVTypeInst VecEltTy = GR->getOrCreateSPIRVType(
1053 (Ty == IntTy ? LLVMIntTy : LLVMDstTy)->getScalarType(), MIRBuilder,
1054 SPIRV::AccessQualifier::ReadWrite,
1055 /*EmitIR*/ true);
1056 GR->assignSPIRVTypeToVReg(VecEltTy, ScalarC.getReg(0), MF);
1057 return assignSPIRVTy(MIRBuilder.buildSplatBuildVector(Ty, ScalarC));
1058 };
1059
1060 if (Mask == fcNone) {
1061 MIRBuilder.buildCopy(DstReg, buildSPIRVConstant(DstTy, 0));
1062 MI.eraseFromParent();
1063 return true;
1064 }
1065 if (Mask == fcAllFlags) {
1066 MIRBuilder.buildCopy(DstReg, buildSPIRVConstant(DstTy, 1));
1067 MI.eraseFromParent();
1068 return true;
1069 }
1070
1071 // Note that rather than creating a COPY here (between a floating-point and
1072 // integer type of the same size) we create a SPIR-V bitcast immediately. We
1073 // can't create a G_BITCAST because the LLTs are the same, and we can't seem
1074 // to correctly lower COPYs to SPIR-V bitcasts at this moment.
1075 Register ResVReg = MRI.createGenericVirtualRegister(IntTy);
1076 MRI.setRegClass(ResVReg, GR->getRegClass(SPIRVIntTy));
1077 GR->assignSPIRVTypeToVReg(SPIRVIntTy, ResVReg, Helper.MIRBuilder.getMF());
1078 auto AsInt = MIRBuilder.buildInstr(SPIRV::OpBitcast)
1079 .addDef(ResVReg)
1080 .addUse(GR->getSPIRVTypeID(SPIRVIntTy))
1081 .addUse(SrcReg);
1082 AsInt = assignSPIRVTy(std::move(AsInt));
1083
1084 // Various masks.
1085 APInt SignBit = APInt::getSignMask(BitSize);
1086 APInt ValueMask = APInt::getSignedMaxValue(BitSize); // All bits but sign.
1087 APInt Inf = APFloat::getInf(Semantics).bitcastToAPInt(); // Exp and int bit.
1088 APInt ExpMask = Inf;
1089 APInt AllOneMantissa = APFloat::getLargest(Semantics).bitcastToAPInt() & ~Inf;
1090 APInt QNaNBitMask =
1091 APInt::getOneBitSet(BitSize, AllOneMantissa.getActiveBits() - 1);
1092 APInt InversionMask = APInt::getAllOnes(DstTy.getScalarSizeInBits());
1093
1094 auto SignBitC = buildSPIRVConstant(IntTy, SignBit);
1095 auto ValueMaskC = buildSPIRVConstant(IntTy, ValueMask);
1096 auto InfC = buildSPIRVConstant(IntTy, Inf);
1097 auto ExpMaskC = buildSPIRVConstant(IntTy, ExpMask);
1098 auto ZeroC = buildSPIRVConstant(IntTy, 0);
1099
1100 auto Abs = assignSPIRVTy(MIRBuilder.buildAnd(IntTy, AsInt, ValueMaskC));
1101 auto Sign = assignSPIRVTy(
1102 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_NE, DstTy, AsInt, Abs));
1103
1104 auto Res = buildSPIRVConstant(DstTy, 0);
1105
1106 const auto appendToRes = [&](MachineInstrBuilder &&ToAppend) {
1107 Res = assignSPIRVTy(
1108 MIRBuilder.buildOr(DstTyCopy, Res, assignSPIRVTy(std::move(ToAppend))));
1109 };
1110
1111 // Tests that involve more than one class should be processed first.
1112 if ((Mask & fcFinite) == fcFinite) {
1113 // finite(V) ==> abs(V) u< exp_mask
1114 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, Abs,
1115 ExpMaskC));
1116 Mask &= ~fcFinite;
1117 } else if ((Mask & fcFinite) == fcPosFinite) {
1118 // finite(V) && V > 0 ==> V u< exp_mask
1119 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, AsInt,
1120 ExpMaskC));
1121 Mask &= ~fcPosFinite;
1122 } else if ((Mask & fcFinite) == fcNegFinite) {
1123 // finite(V) && V < 0 ==> abs(V) u< exp_mask && signbit == 1
1124 auto Cmp = assignSPIRVTy(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT,
1125 DstTy, Abs, ExpMaskC));
1126 appendToRes(MIRBuilder.buildAnd(DstTy, Cmp, Sign));
1127 Mask &= ~fcNegFinite;
1128 }
1129
1130 if (FPClassTest PartialCheck = Mask & (fcZero | fcSubnormal)) {
1131 // fcZero | fcSubnormal => test all exponent bits are 0
1132 // TODO: Handle sign bit specific cases
1133 // TODO: Handle inverted case
1134 if (PartialCheck == (fcZero | fcSubnormal)) {
1135 auto ExpBits = assignSPIRVTy(MIRBuilder.buildAnd(IntTy, AsInt, ExpMaskC));
1136 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1137 ExpBits, ZeroC));
1138 Mask &= ~PartialCheck;
1139 }
1140 }
1141
1142 // Check for individual classes.
1143 if (FPClassTest PartialCheck = Mask & fcZero) {
1144 if (PartialCheck == fcPosZero)
1145 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1146 AsInt, ZeroC));
1147 else if (PartialCheck == fcZero)
1148 appendToRes(
1149 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy, Abs, ZeroC));
1150 else // fcNegZero
1151 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1152 AsInt, SignBitC));
1153 }
1154
1155 if (FPClassTest PartialCheck = Mask & fcSubnormal) {
1156 // issubnormal(V) ==> unsigned(abs(V) - 1) u< (all mantissa bits set)
1157 // issubnormal(V) && V>0 ==> unsigned(V - 1) u< (all mantissa bits set)
1158 auto V = (PartialCheck == fcPosSubnormal) ? AsInt : Abs;
1159 auto OneC = buildSPIRVConstant(IntTy, 1);
1160 auto VMinusOne = MIRBuilder.buildSub(IntTy, V, OneC);
1161 auto SubnormalRes = assignSPIRVTy(
1162 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, VMinusOne,
1163 buildSPIRVConstant(IntTy, AllOneMantissa)));
1164 if (PartialCheck == fcNegSubnormal)
1165 SubnormalRes = MIRBuilder.buildAnd(DstTy, SubnormalRes, Sign);
1166 appendToRes(std::move(SubnormalRes));
1167 }
1168
1169 if (FPClassTest PartialCheck = Mask & fcInf) {
1170 if (PartialCheck == fcPosInf)
1171 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1172 AsInt, InfC));
1173 else if (PartialCheck == fcInf)
1174 appendToRes(
1175 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy, Abs, InfC));
1176 else { // fcNegInf
1177 APInt NegInf = APFloat::getInf(Semantics, true).bitcastToAPInt();
1178 auto NegInfC = buildSPIRVConstant(IntTy, NegInf);
1179 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1180 AsInt, NegInfC));
1181 }
1182 }
1183
1184 if (FPClassTest PartialCheck = Mask & fcNan) {
1185 auto InfWithQnanBitC =
1186 buildSPIRVConstant(IntTy, std::move(Inf) | QNaNBitMask);
1187 if (PartialCheck == fcNan) {
1188 // isnan(V) ==> abs(V) u> int(inf)
1189 appendToRes(
1190 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGT, DstTy, Abs, InfC));
1191 } else if (PartialCheck == fcQNan) {
1192 // isquiet(V) ==> abs(V) u>= (unsigned(Inf) | quiet_bit)
1193 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGE, DstTy, Abs,
1194 InfWithQnanBitC));
1195 } else { // fcSNan
1196 // issignaling(V) ==> abs(V) u> unsigned(Inf) &&
1197 // abs(V) u< (unsigned(Inf) | quiet_bit)
1198 auto IsNan = assignSPIRVTy(
1199 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGT, DstTy, Abs, InfC));
1200 auto IsNotQnan = assignSPIRVTy(MIRBuilder.buildICmp(
1201 CmpInst::Predicate::ICMP_ULT, DstTy, Abs, InfWithQnanBitC));
1202 appendToRes(MIRBuilder.buildAnd(DstTy, IsNan, IsNotQnan));
1203 }
1204 }
1205
1206 if (FPClassTest PartialCheck = Mask & fcNormal) {
1207 // isnormal(V) ==> (0 u< exp u< max_exp) ==> (unsigned(exp-1) u<
1208 // (max_exp-1))
1209 APInt ExpLSB = ExpMask & ~(ExpMask.shl(1));
1210 auto ExpMinusOne = assignSPIRVTy(
1211 MIRBuilder.buildSub(IntTy, Abs, buildSPIRVConstant(IntTy, ExpLSB)));
1212 APInt MaxExpMinusOne = std::move(ExpMask) - ExpLSB;
1213 auto NormalRes = assignSPIRVTy(
1214 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, ExpMinusOne,
1215 buildSPIRVConstant(IntTy, MaxExpMinusOne)));
1216 if (PartialCheck == fcNegNormal)
1217 NormalRes = MIRBuilder.buildAnd(DstTy, NormalRes, Sign);
1218 else if (PartialCheck == fcPosNormal) {
1219 auto PosSign = assignSPIRVTy(MIRBuilder.buildXor(
1220 DstTy, Sign, buildSPIRVConstant(DstTy, InversionMask)));
1221 NormalRes = MIRBuilder.buildAnd(DstTy, NormalRes, PosSign);
1222 }
1223 appendToRes(std::move(NormalRes));
1224 }
1225
1226 MIRBuilder.buildCopy(DstReg, Res);
1227 MI.eraseFromParent();
1228 return true;
1229}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static void scalarize(Instruction *I, SmallVectorImpl< Instruction * > &Worklist)
Declares convenience wrapper classes for interpreting MachineInstr instances as specific generic oper...
IRTranslator LLVM IR MI
#define I(x, y, z)
Definition MD5.cpp:57
This file declares the MachineIRBuilder class.
Register Reg
Promote Memory to Register
Definition Mem2Reg.cpp:110
ppc ctr loops verify
const SmallVectorImpl< MachineOperand > & Cond
static bool legalizeSpvInsertElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool needsVectorLegalization(const LLT &Ty, const SPIRVSubtarget &ST)
static MachineInstrBuilder createStackTemporaryForVector(LegalizerHelper &Helper, SPIRVGlobalRegistry *GR, Register SrcReg, LLT SrcTy, MachinePointerInfo &PtrInfo, Align &VecAlign)
static Register convertPtrToInt(Register Reg, LLT ConvTy, SPIRVTypeInst SpvType, LegalizerHelper &Helper, MachineRegisterInfo &MRI, SPIRVGlobalRegistry *GR)
LegalityPredicate typeOfExtendedScalars(unsigned TypeIdx, bool IsExtendedInts)
static bool legalizeExtractVectorElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeStore(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvExtractElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvBitcast(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvConstComposite(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeLoad(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeInsertVectorElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
#define LLVM_DEBUG(...)
Definition Debug.h:119
APInt bitcastToAPInt() const
Definition APFloat.h:1430
static APFloat getLargest(const fltSemantics &Sem, bool Negative=false)
Returns the largest finite number in the given semantics.
Definition APFloat.h:1197
static APFloat getInf(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Infinity.
Definition APFloat.h:1157
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition APInt.h:235
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition APInt.h:230
unsigned getActiveBits() const
Compute the number of active bits in the value.
Definition APInt.h:1535
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition APInt.h:880
static APInt getOneBitSet(unsigned numBits, unsigned BitNo)
Return an APInt with exactly one bit set in the result.
Definition APInt.h:240
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
static LLVM_ABI ArrayType * get(Type *ElementType, uint64_t NumElements)
This static method is the primary way to construct an ArrayType.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:740
@ ICMP_UGE
unsigned greater or equal
Definition InstrTypes.h:764
@ ICMP_UGT
unsigned greater than
Definition InstrTypes.h:763
@ ICMP_ULT
unsigned less than
Definition InstrTypes.h:765
@ ICMP_NE
not equal
Definition InstrTypes.h:762
static constexpr ElementCount getFixed(ScalarTy MinVal)
Definition TypeSize.h:309
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:350
static constexpr LLT vector(ElementCount EC, unsigned ScalarSizeInBits)
Get a low-level vector of some number of elements and element width.
LLT getScalarType() const
constexpr bool isPointerVector() const
static constexpr LLT scalar(unsigned SizeInBits)
Get a low-level scalar or aggregate "bag of bits".
constexpr bool isValid() const
constexpr uint16_t getNumElements() const
Returns the number of elements in a vector LLT.
constexpr bool isVector() const
static constexpr LLT pointer(unsigned AddressSpace, unsigned SizeInBits)
Get a low-level pointer in the given address space.
constexpr bool isPointer() const
constexpr unsigned getAddressSpace() const
static constexpr LLT fixed_vector(unsigned NumElements, unsigned ScalarSizeInBits)
Get a low-level fixed-width vector of some number of elements and element width.
constexpr bool isPointerOrPointerVector() const
constexpr bool isFixedVector() const
Returns true if the LLT is a fixed vector.
constexpr TypeSize getSizeInBytes() const
Returns the total size of the type in bytes, i.e.
LLT getElementType() const
Returns the vector's element type. Only valid for vector types.
LLVM_ABI void computeTables()
Compute any ancillary tables needed to quickly decide how an operation should be handled.
LegalizeRuleSet & legalFor(std::initializer_list< LLT > Types)
The instruction is legal when type index 0 is any type in the given list.
LegalizeRuleSet & fewerElementsIf(LegalityPredicate Predicate, LegalizeMutation Mutation)
Remove elements to reach the type selected by the mutation if the predicate is true.
LegalizeRuleSet & moreElementsToNextPow2(unsigned TypeIdx)
Add more elements to the vector to reach the next power of two.
LegalizeRuleSet & lower()
The instruction is lowered.
LegalizeRuleSet & scalarizeIf(LegalityPredicate Predicate, unsigned TypeIdx)
LegalizeRuleSet & lowerIf(LegalityPredicate Predicate)
The instruction is lowered if predicate is true.
LegalizeRuleSet & custom()
Unconditionally custom lower.
LegalizeRuleSet & unsupportedIf(LegalityPredicate Predicate)
LegalizeRuleSet & alwaysLegal()
LegalizeRuleSet & scalarize(unsigned TypeIdx)
LegalizeRuleSet & legalForCartesianProduct(std::initializer_list< LLT > Types)
The instruction is legal when type indexes 0 and 1 are both in the given list.
LegalizeRuleSet & legalIf(LegalityPredicate Predicate)
The instruction is legal if predicate is true.
LegalizeRuleSet & customFor(std::initializer_list< LLT > Types)
LLVM_ABI MachineInstrBuilder createStackTemporary(TypeSize Bytes, Align Alignment, MachinePointerInfo &PtrInfo)
Create a stack temporary based on the size in bytes and the alignment.
MachineIRBuilder & MIRBuilder
Expose MIRBuilder so clients can set their own RecordInsertInstruction functions.
LLVM_ABI Align getStackTemporaryAlignment(LLT Type, Align MinAlign=Align()) const
Return the alignment to use for a stack temporary object with the given type.
LegalizeRuleSet & getActionDefinitionsBuilder(unsigned Opcode)
Get the action definition builder for the given opcode.
const LegacyLegalizerInfo & getLegacyLegalizerInfo() const
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Helper class to build MachineInstr.
LLVMContext & getContext() const
MachineInstrBuilder buildUnmerge(ArrayRef< LLT > Res, const SrcOp &Op)
Build and insert Res0, ... = G_UNMERGE_VALUES Op.
MachineInstrBuilder buildAnd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_AND Op0, Op1.
MachineInstrBuilder buildICmp(CmpInst::Predicate Pred, const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_ICMP Pred, Op0, Op1.
MachineInstrBuilder buildSub(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_SUB Op0, Op1.
MachineInstrBuilder buildIntrinsic(Intrinsic::ID ID, ArrayRef< Register > Res, bool HasSideEffects, bool isConvergent)
Build and insert a G_INTRINSIC instruction.
MachineInstrBuilder buildSplatBuildVector(const DstOp &Res, const SrcOp &Src)
Build and insert Res = G_BUILD_VECTOR with Src replicated to fill the number of elements.
MachineInstrBuilder buildBuildVector(const DstOp &Res, ArrayRef< Register > Ops)
Build and insert Res = G_BUILD_VECTOR Op0, ...
MachineInstrBuilder buildLoad(const DstOp &Res, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert Res = G_LOAD Addr, MMO.
MachineInstrBuilder buildStore(const SrcOp &Val, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert G_STORE Val, Addr, MMO.
MachineInstrBuilder buildInstr(unsigned Opcode)
Build and insert <empty> = Opcode <empty>.
MachineFunction & getMF()
Getter for the function we currently build.
MachineInstrBuilder buildBitcast(const DstOp &Dst, const SrcOp &Src)
Build and insert Dst = G_BITCAST Src.
MachineRegisterInfo * getMRI()
Getter for MRI.
MachineInstrBuilder buildOr(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_OR Op0, Op1.
MachineInstrBuilder buildCopy(const DstOp &Res, const SrcOp &Op)
Build and insert Res = COPY Op.
MachineInstrBuilder buildXor(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_XOR Op0, Op1.
virtual MachineInstrBuilder buildConstant(const DstOp &Res, const ConstantInt &Val)
Build and insert Res = G_CONSTANT Val.
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
Representation of each machine instruction.
A description of a memory reference used in the backend.
const MachinePointerInfo & getPointerInfo() const
LLVM_ABI Align getAlign() const
Return the minimum known alignment in bytes of the actual memory reference.
MachineOperand class - Representation of each machine instruction operand.
Register getReg() const
getReg - Returns the register number.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLT getType(Register Reg) const
Get the low-level type of Reg or LLT{} if Reg is not a generic (target independent) virtual register.
LLVM_ABI void setRegClass(Register Reg, const TargetRegisterClass *RC)
setRegClass - Set the register class of the specified virtual register.
LLVM_ABI Register createGenericVirtualRegister(LLT Ty, StringRef Name="")
Create and return a new generic virtual register with low-level type Ty.
Wrapper class representing virtual and physical registers.
Definition Register.h:20
void assignSPIRVTypeToVReg(SPIRVTypeInst Type, Register VReg, const MachineFunction &MF)
const TargetRegisterClass * getRegClass(SPIRVTypeInst SpvType) const
const Type * getTypeForSPIRVType(SPIRVTypeInst Ty) const
LLT getRegType(SPIRVTypeInst SpvType) const
SPIRVTypeInst getOrCreateSPIRVPointerType(const Type *BaseType, MachineIRBuilder &MIRBuilder, SPIRV::StorageClass::StorageClass SC)
SPIRVTypeInst getScalarOrVectorComponentType(SPIRVTypeInst Type) const
SPIRVTypeInst getOrCreateSPIRVType(const Type *Type, MachineInstr &I, SPIRV::AccessQualifier::AccessQualifier AQ, bool EmitIR)
SPIRVTypeInst getSPIRVTypeForVReg(Register VReg, const MachineFunction *MF=nullptr) const
SPIRVLegalizerInfo(const SPIRVSubtarget &ST)
bool legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI, LostDebugLocObserver &LocObserver) const override
Called for instructions with the Custom LegalizationAction.
bool legalizeIntrinsic(LegalizerHelper &Helper, MachineInstr &MI) const override
SPIRVGlobalRegistry * getSPIRVGlobalRegistry() const
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:343
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
static LLVM_ABI VectorType * get(Type *ElementType, ElementCount EC)
This static method is the primary way to construct an VectorType.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
LLVM_ABI LegalityPredicate isScalar(unsigned TypeIdx)
True iff the specified type index is a scalar.
LLVM_ABI LegalityPredicate numElementsNotPow2(unsigned TypeIdx)
True iff the specified type index is a vector whose element count is not a power of 2.
LLVM_ABI LegalityPredicate vectorElementCountIsLessThanOrEqualTo(unsigned TypeIdx, unsigned Size)
True iff the specified type index is a vector with a number of elements that's less than or equal to ...
LLVM_ABI LegalityPredicate typeInSet(unsigned TypeIdx, std::initializer_list< LLT > TypesInit)
True iff the given type index is one of the specified types.
LLVM_ABI LegalityPredicate vectorElementCountIsGreaterThan(unsigned TypeIdx, unsigned Size)
True iff the specified type index is a vector with a number of elements that's greater than the given...
Predicate any(Predicate P0, Predicate P1)
True iff P0 or P1 are true.
LegalityPredicate typeIsNot(unsigned TypeIdx, LLT Type)
True iff the given type index is not the specified type.
Predicate all(Predicate P0, Predicate P1)
True iff P0 and P1 are true.
LLVM_ABI LegalityPredicate typeIs(unsigned TypeIdx, LLT TypesInit)
True iff the given type index is the specified type.
LLVM_ABI LegalizeMutation changeElementCountTo(unsigned TypeIdx, unsigned FromTypeIdx)
Keep the same scalar or element type as TypeIdx, but take the number of elements from FromTypeIdx.
LLVM_ABI LegalizeMutation changeElementSizeTo(unsigned TypeIdx, unsigned FromTypeIdx)
Change the scalar size or element size to have the same scalar size as type index FromIndex.
Invariant opcodes: All instruction sets have these as their low opcodes.
This is an optimization pass for GlobalISel generic memory operations.
LLVM_ABI const llvm::fltSemantics & getFltSemanticForLLT(LLT Ty)
Get the appropriate floating point arithmetic semantic based on the bit size of the given scalar LLT.
std::function< bool(const LegalityQuery &)> LegalityPredicate
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition MathExtras.h:279
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209
const std::set< unsigned > & getTypeFoldingSupportedOpcodes()
int64_t foldImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:201
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
The LegalityQuery object bundles together all the information that's needed to decide whether a given...
ArrayRef< LLT > Types
This class contains a discriminated union of information about pointers in memory operands,...
MachinePointerInfo getWithOffset(int64_t O) const