LLVM 23.0.0git
SPIRVLegalizerInfo.cpp
Go to the documentation of this file.
1//===- SPIRVLegalizerInfo.cpp --- SPIR-V Legalization Rules ------*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the targeting of the Machinelegalizer class for SPIR-V.
10//
11//===----------------------------------------------------------------------===//
12
13#include "SPIRVLegalizerInfo.h"
14#include "SPIRV.h"
15#include "SPIRVGlobalRegistry.h"
16#include "SPIRVSubtarget.h"
17#include "SPIRVUtils.h"
24#include "llvm/IR/IntrinsicsSPIRV.h"
25#include "llvm/Support/Debug.h"
27
28using namespace llvm;
29using namespace llvm::LegalizeActions;
30using namespace llvm::LegalityPredicates;
31
32#define DEBUG_TYPE "spirv-legalizer"
33
34LegalityPredicate typeOfExtendedScalars(unsigned TypeIdx, bool IsExtendedInts) {
35 return [IsExtendedInts, TypeIdx](const LegalityQuery &Query) {
36 const LLT Ty = Query.Types[TypeIdx];
37 return IsExtendedInts && Ty.isValid() && Ty.isScalar();
38 };
39}
40
42 using namespace TargetOpcode;
43
44 this->ST = &ST;
45 GR = ST.getSPIRVGlobalRegistry();
46
47 const LLT s1 = LLT::scalar(1);
48 const LLT s8 = LLT::scalar(8);
49 const LLT s16 = LLT::scalar(16);
50 const LLT s32 = LLT::scalar(32);
51 const LLT s64 = LLT::scalar(64);
52 const LLT s128 = LLT::scalar(128);
53
54 const LLT v16s64 = LLT::fixed_vector(16, 64);
55 const LLT v16s32 = LLT::fixed_vector(16, 32);
56 const LLT v16s16 = LLT::fixed_vector(16, 16);
57 const LLT v16s8 = LLT::fixed_vector(16, 8);
58 const LLT v16s1 = LLT::fixed_vector(16, 1);
59
60 const LLT v8s64 = LLT::fixed_vector(8, 64);
61 const LLT v8s32 = LLT::fixed_vector(8, 32);
62 const LLT v8s16 = LLT::fixed_vector(8, 16);
63 const LLT v8s8 = LLT::fixed_vector(8, 8);
64 const LLT v8s1 = LLT::fixed_vector(8, 1);
65
66 const LLT v4s64 = LLT::fixed_vector(4, 64);
67 const LLT v4s32 = LLT::fixed_vector(4, 32);
68 const LLT v4s16 = LLT::fixed_vector(4, 16);
69 const LLT v4s8 = LLT::fixed_vector(4, 8);
70 const LLT v4s1 = LLT::fixed_vector(4, 1);
71
72 const LLT v3s64 = LLT::fixed_vector(3, 64);
73 const LLT v3s32 = LLT::fixed_vector(3, 32);
74 const LLT v3s16 = LLT::fixed_vector(3, 16);
75 const LLT v3s8 = LLT::fixed_vector(3, 8);
76 const LLT v3s1 = LLT::fixed_vector(3, 1);
77
78 const LLT v2s64 = LLT::fixed_vector(2, 64);
79 const LLT v2s32 = LLT::fixed_vector(2, 32);
80 const LLT v2s16 = LLT::fixed_vector(2, 16);
81 const LLT v2s8 = LLT::fixed_vector(2, 8);
82 const LLT v2s1 = LLT::fixed_vector(2, 1);
83
84 const unsigned PSize = ST.getPointerSize();
85 const LLT p0 = LLT::pointer(0, PSize); // Function
86 const LLT p1 = LLT::pointer(1, PSize); // CrossWorkgroup
87 const LLT p2 = LLT::pointer(2, PSize); // UniformConstant
88 const LLT p3 = LLT::pointer(3, PSize); // Workgroup
89 const LLT p4 = LLT::pointer(4, PSize); // Generic
90 const LLT p5 =
91 LLT::pointer(5, PSize); // Input, SPV_INTEL_usm_storage_classes (Device)
92 const LLT p6 = LLT::pointer(6, PSize); // SPV_INTEL_usm_storage_classes (Host)
93 const LLT p7 = LLT::pointer(7, PSize); // Input
94 const LLT p8 = LLT::pointer(8, PSize); // Output
95 const LLT p9 =
96 LLT::pointer(9, PSize); // CodeSectionINTEL, SPV_INTEL_function_pointers
97 const LLT p10 = LLT::pointer(10, PSize); // Private
98 const LLT p11 = LLT::pointer(11, PSize); // StorageBuffer
99 const LLT p12 = LLT::pointer(12, PSize); // Uniform
100 const LLT p13 = LLT::pointer(13, PSize); // PushConstant
101
102 // TODO: remove copy-pasting here by using concatenation in some way.
103 auto allPtrsScalarsAndVectors = {
104 p0, p1, p2, p3, p4, p5, p6, p7, p8,
105 p9, p10, p11, p12, p13, s1, s8, s16, s32,
106 s64, v2s1, v2s8, v2s16, v2s32, v2s64, v3s1, v3s8, v3s16,
107 v3s32, v3s64, v4s1, v4s8, v4s16, v4s32, v4s64, v8s1, v8s8,
108 v8s16, v8s32, v8s64, v16s1, v16s8, v16s16, v16s32, v16s64};
109
110 auto allVectors = {v2s1, v2s8, v2s16, v2s32, v2s64, v3s1, v3s8,
111 v3s16, v3s32, v3s64, v4s1, v4s8, v4s16, v4s32,
112 v4s64, v8s1, v8s8, v8s16, v8s32, v8s64, v16s1,
113 v16s8, v16s16, v16s32, v16s64};
114
115 auto allShaderVectors = {v2s1, v2s8, v2s16, v2s32, v2s64,
116 v3s1, v3s8, v3s16, v3s32, v3s64,
117 v4s1, v4s8, v4s16, v4s32, v4s64};
118
119 auto allScalars = {s1, s8, s16, s32, s64};
120
121 auto allScalarsAndVectors = {
122 s1, s8, s16, s32, s64, s128, v2s1, v2s8,
123 v2s16, v2s32, v2s64, v3s1, v3s8, v3s16, v3s32, v3s64,
124 v4s1, v4s8, v4s16, v4s32, v4s64, v8s1, v8s8, v8s16,
125 v8s32, v8s64, v16s1, v16s8, v16s16, v16s32, v16s64};
126
127 auto allIntScalarsAndVectors = {
128 s8, s16, s32, s64, s128, v2s8, v2s16, v2s32, v2s64,
129 v3s8, v3s16, v3s32, v3s64, v4s8, v4s16, v4s32, v4s64, v8s8,
130 v8s16, v8s32, v8s64, v16s8, v16s16, v16s32, v16s64};
131
132 auto allBoolScalarsAndVectors = {s1, v2s1, v3s1, v4s1, v8s1, v16s1};
133
134 auto allIntScalars = {s8, s16, s32, s64, s128};
135
136 auto allFloatScalarsAndF16Vector2AndVector4s = {s16, s32, s64, v2s16, v4s16};
137
138 auto allFloatScalars = {s16, s32, s64};
139
140 auto allFloatScalarsAndVectors = {
141 s16, s32, s64, v2s16, v2s32, v2s64, v3s16, v3s32, v3s64,
142 v4s16, v4s32, v4s64, v8s16, v8s32, v8s64, v16s16, v16s32, v16s64};
143
144 auto allShaderFloatVectors = {v2s16, v2s32, v2s64, v3s16, v3s32,
145 v3s64, v4s16, v4s32, v4s64};
146
147 auto allFloatVectors = {v2s16, v2s32, v2s64, v3s16, v3s32,
148 v3s64, v4s16, v4s32, v4s64, v8s16,
149 v8s32, v8s64, v16s16, v16s32, v16s64};
150
151 auto &allowedFloatVectorTypes =
152 ST.isShader() ? allShaderFloatVectors : allFloatVectors;
153
154 auto allFloatAndIntScalarsAndPtrs = {s8, s16, s32, s64, p0, p1,
155 p2, p3, p4, p5, p6, p7,
156 p8, p9, p10, p11, p12, p13};
157
158 auto allPtrs = {p0, p1, p2, p3, p4, p5, p6, p7, p8, p9, p10, p11, p12, p13};
159
160 auto &allowedVectorTypes = ST.isShader() ? allShaderVectors : allVectors;
161
162 bool IsExtendedInts =
163 ST.canUseExtension(
164 SPIRV::Extension::SPV_ALTERA_arbitrary_precision_integers) ||
165 ST.canUseExtension(SPIRV::Extension::SPV_KHR_bit_instructions) ||
166 ST.canUseExtension(SPIRV::Extension::SPV_INTEL_int4);
167 auto extendedScalarsAndVectors =
168 [IsExtendedInts](const LegalityQuery &Query) {
169 const LLT Ty = Query.Types[0];
170 return IsExtendedInts && Ty.isValid() && !Ty.isPointerOrPointerVector();
171 };
172 auto extendedScalarsAndVectorsProduct = [IsExtendedInts](
173 const LegalityQuery &Query) {
174 const LLT Ty1 = Query.Types[0], Ty2 = Query.Types[1];
175 return IsExtendedInts && Ty1.isValid() && Ty2.isValid() &&
176 !Ty1.isPointerOrPointerVector() && !Ty2.isPointerOrPointerVector();
177 };
178 auto extendedPtrsScalarsAndVectors =
179 [IsExtendedInts](const LegalityQuery &Query) {
180 const LLT Ty = Query.Types[0];
181 return IsExtendedInts && Ty.isValid();
182 };
183
184 // The universal validation rules in the SPIR-V specification state that
185 // vector sizes are typically limited to 2, 3, or 4. However, larger vector
186 // sizes (8 and 16) are enabled when the Kernel capability is present. For
187 // shader execution models, vector sizes are strictly limited to 4. In
188 // non-shader contexts, vector sizes of 8 and 16 are also permitted, but
189 // arbitrary sizes (e.g., 6 or 11) are not.
190 uint32_t MaxVectorSize = ST.isShader() ? 4 : 16;
191 LLVM_DEBUG(dbgs() << "MaxVectorSize: " << MaxVectorSize << "\n");
192
193 for (auto Opc : getTypeFoldingSupportedOpcodes()) {
194 switch (Opc) {
195 case G_EXTRACT_VECTOR_ELT:
196 case G_UREM:
197 case G_SREM:
198 case G_UDIV:
199 case G_SDIV:
200 case G_FREM:
201 break;
202 default:
204 .customFor(allScalars)
205 .customFor(allowedVectorTypes)
209 0, ElementCount::getFixed(MaxVectorSize)))
210 .custom();
211 break;
212 }
213 }
214
215 getActionDefinitionsBuilder({G_UREM, G_SREM, G_SDIV, G_UDIV, G_FREM})
216 .customFor(allScalars)
217 .customFor(allowedVectorTypes)
221 0, ElementCount::getFixed(MaxVectorSize)))
222 .custom();
223
224 getActionDefinitionsBuilder({G_FMA, G_STRICT_FMA})
225 .legalFor(allScalars)
226 .legalFor(allowedVectorTypes)
230 0, ElementCount::getFixed(MaxVectorSize)))
231 .alwaysLegal();
232
233 getActionDefinitionsBuilder(G_INTRINSIC_W_SIDE_EFFECTS).custom();
234
235 getActionDefinitionsBuilder(G_SHUFFLE_VECTOR)
236 .legalForCartesianProduct(allowedVectorTypes, allowedVectorTypes)
238 .lowerIf(vectorElementCountIsGreaterThan(0, MaxVectorSize))
240 .lowerIf(vectorElementCountIsGreaterThan(1, MaxVectorSize));
241
242 getActionDefinitionsBuilder(G_EXTRACT_VECTOR_ELT)
246 1, ElementCount::getFixed(MaxVectorSize)))
247 .custom();
248
249 getActionDefinitionsBuilder(G_INSERT_VECTOR_ELT)
253 0, ElementCount::getFixed(MaxVectorSize)))
254 .custom();
255
256 // Illegal G_UNMERGE_VALUES instructions should be handled
257 // during the combine phase.
258 getActionDefinitionsBuilder(G_BUILD_VECTOR)
260
261 // When entering the legalizer, there should be no G_BITCAST instructions.
262 // They should all be calls to the `spv_bitcast` intrinsic. The call to
263 // the intrinsic will be converted to a G_BITCAST during legalization if
264 // the vectors are not legal. After using the rules to legalize a G_BITCAST,
265 // we turn it back into a call to the intrinsic with a custom rule to avoid
266 // potential machine verifier failures.
272 0, ElementCount::getFixed(MaxVectorSize)))
273 .lowerIf(vectorElementCountIsGreaterThan(1, MaxVectorSize))
274 .custom();
275
276 // If the result is still illegal, the combiner should be able to remove it.
277 getActionDefinitionsBuilder(G_CONCAT_VECTORS)
278 .legalForCartesianProduct(allowedVectorTypes, allowedVectorTypes);
279
280 getActionDefinitionsBuilder(G_SPLAT_VECTOR)
281 .legalFor(allowedVectorTypes)
285 .alwaysLegal();
286
287 // Vector Reduction Operations
289 {G_VECREDUCE_SMIN, G_VECREDUCE_SMAX, G_VECREDUCE_UMIN, G_VECREDUCE_UMAX,
290 G_VECREDUCE_ADD, G_VECREDUCE_MUL, G_VECREDUCE_FMUL, G_VECREDUCE_FMIN,
291 G_VECREDUCE_FMAX, G_VECREDUCE_FMINIMUM, G_VECREDUCE_FMAXIMUM,
292 G_VECREDUCE_OR, G_VECREDUCE_AND, G_VECREDUCE_XOR})
293 .legalFor(allowedVectorTypes)
294 .scalarize(1)
295 .lower();
296
297 getActionDefinitionsBuilder({G_VECREDUCE_SEQ_FADD, G_VECREDUCE_SEQ_FMUL})
298 .scalarize(2)
299 .lower();
300
301 // Illegal G_UNMERGE_VALUES instructions should be handled
302 // during the combine phase.
303 getActionDefinitionsBuilder(G_UNMERGE_VALUES)
305
306 getActionDefinitionsBuilder({G_MEMCPY, G_MEMMOVE})
307 .unsupportedIf(LegalityPredicates::any(typeIs(0, p9), typeIs(1, p9)))
308 .legalIf(all(typeInSet(0, allPtrs), typeInSet(1, allPtrs)));
309
311 .unsupportedIf(typeIs(0, p9))
312 .legalIf(all(typeInSet(0, allPtrs), typeInSet(1, allIntScalars)));
313
314 getActionDefinitionsBuilder(G_ADDRSPACE_CAST)
315 .legalForCartesianProduct(allPtrs, allPtrs);
316
317 // Should we be legalizing bad scalar sizes like s5 here instead
318 // of handling them in the instruction selector?
319 getActionDefinitionsBuilder({G_LOAD, G_STORE})
320 .unsupportedIf(typeIs(1, p9))
321 .legalForCartesianProduct(allowedVectorTypes, allPtrs)
322 .legalForCartesianProduct(allPtrs, allPtrs)
323 .legalIf(isScalar(0))
324 .custom();
325
326 getActionDefinitionsBuilder({G_SMIN, G_SMAX, G_UMIN, G_UMAX, G_ABS,
327 G_BITREVERSE, G_SADDSAT, G_UADDSAT, G_SSUBSAT,
328 G_USUBSAT, G_SCMP, G_UCMP})
329 .legalFor(allIntScalarsAndVectors)
330 .legalIf(extendedScalarsAndVectors);
331
332 getActionDefinitionsBuilder(G_STRICT_FLDEXP)
333 .legalForCartesianProduct(allFloatScalarsAndVectors, allIntScalars);
334
335 getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
336 .legalForCartesianProduct(allIntScalarsAndVectors,
337 allFloatScalarsAndVectors);
338
339 getActionDefinitionsBuilder({G_FPTOSI_SAT, G_FPTOUI_SAT})
340 .legalForCartesianProduct(allIntScalarsAndVectors,
341 allFloatScalarsAndVectors);
342
343 getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
344 .legalForCartesianProduct(allFloatScalarsAndVectors,
345 allScalarsAndVectors);
346
348 .legalForCartesianProduct(allIntScalarsAndVectors)
349 .legalIf(extendedScalarsAndVectorsProduct);
350
351 // Extensions.
352 getActionDefinitionsBuilder({G_TRUNC, G_ZEXT, G_SEXT, G_ANYEXT})
353 .legalForCartesianProduct(allScalarsAndVectors)
354 .legalIf(extendedScalarsAndVectorsProduct);
355
357 .legalFor(allPtrsScalarsAndVectors)
358 .legalIf(extendedPtrsScalarsAndVectors);
359
361 all(typeInSet(0, allPtrsScalarsAndVectors),
362 typeInSet(1, allPtrsScalarsAndVectors)));
363
364 getActionDefinitionsBuilder({G_IMPLICIT_DEF, G_FREEZE})
365 .legalFor({s1, s128})
366 .legalFor(allFloatAndIntScalarsAndPtrs)
367 .legalFor(allowedVectorTypes)
368 .legalIf([](const LegalityQuery &Query) {
369 return Query.Types[0].isPointerVector();
370 })
371 .moreElementsToNextPow2(0)
372 .fewerElementsIf(vectorElementCountIsGreaterThan(0, MaxVectorSize),
374 0, ElementCount::getFixed(MaxVectorSize)));
375
376 getActionDefinitionsBuilder({G_STACKSAVE, G_STACKRESTORE}).alwaysLegal();
377
379 .legalForCartesianProduct(allPtrs, allIntScalars)
380 .legalIf(
381 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)))
382 .legalIf([](const LegalityQuery &Query) {
383 const LLT DstTy = Query.Types[0];
384 const LLT SrcTy = Query.Types[1];
385 return DstTy.isPointerVector() && SrcTy.isVector() &&
386 !SrcTy.isPointer() &&
387 DstTy.getNumElements() == SrcTy.getNumElements();
388 });
390 .legalForCartesianProduct(allIntScalars, allPtrs)
391 .legalIf(
392 all(typeOfExtendedScalars(0, IsExtendedInts), typeInSet(1, allPtrs)))
393 .legalIf([](const LegalityQuery &Query) {
394 const LLT DstTy = Query.Types[0];
395 const LLT SrcTy = Query.Types[1];
396 return SrcTy.isPointerVector() && DstTy.isVector() &&
397 !DstTy.isPointer() &&
398 DstTy.getNumElements() == SrcTy.getNumElements();
399 });
401 .legalForCartesianProduct(allPtrs, allIntScalars)
402 .legalIf(
403 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)));
404
405 // ST.canDirectlyComparePointers() for pointer args is supported in
406 // legalizeCustom().
409 all(typeIs(0, p9), typeInSet(1, allPtrs), typeIsNot(1, p9)),
410 all(typeInSet(0, allPtrs), typeIsNot(0, p9), typeIs(1, p9))))
411 .legalIf([IsExtendedInts](const LegalityQuery &Query) {
412 const LLT Ty = Query.Types[1];
413 return IsExtendedInts && Ty.isValid() && !Ty.isPointerOrPointerVector();
414 })
415 .customIf(all(typeInSet(0, allBoolScalarsAndVectors),
416 typeInSet(1, allPtrsScalarsAndVectors)));
417
419 all(typeInSet(0, allBoolScalarsAndVectors),
420 typeInSet(1, allFloatScalarsAndVectors)));
421
422 getActionDefinitionsBuilder({G_ATOMICRMW_OR, G_ATOMICRMW_ADD, G_ATOMICRMW_AND,
423 G_ATOMICRMW_MAX, G_ATOMICRMW_MIN,
424 G_ATOMICRMW_SUB, G_ATOMICRMW_XOR,
425 G_ATOMICRMW_UMAX, G_ATOMICRMW_UMIN})
426 .legalForCartesianProduct(allIntScalars, allPtrs);
427
429 {G_ATOMICRMW_FADD, G_ATOMICRMW_FSUB, G_ATOMICRMW_FMIN, G_ATOMICRMW_FMAX})
430 .legalForCartesianProduct(allFloatScalarsAndF16Vector2AndVector4s,
431 allPtrs);
432
433 getActionDefinitionsBuilder(G_ATOMICRMW_XCHG)
434 .legalForCartesianProduct(allFloatAndIntScalarsAndPtrs, allPtrs);
435
436 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG_WITH_SUCCESS).lower();
437 // TODO: add proper legalization rules.
438 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG).alwaysLegal();
439
440 getActionDefinitionsBuilder({G_UADDO, G_USUBO, G_UMULO, G_SMULO})
441 .alwaysLegal();
442
443 getActionDefinitionsBuilder({G_SADDO, G_SSUBO}).lower();
444
445 getActionDefinitionsBuilder({G_LROUND, G_LLROUND})
446 .legalForCartesianProduct(allFloatScalarsAndVectors,
447 allIntScalarsAndVectors);
448
449 // FP conversions.
450 getActionDefinitionsBuilder({G_FPTRUNC, G_FPEXT})
451 .legalForCartesianProduct(allFloatScalarsAndVectors);
452
453 // Pointer-handling.
454 getActionDefinitionsBuilder(G_FRAME_INDEX).legalFor({p0});
455
456 getActionDefinitionsBuilder(G_GLOBAL_VALUE).legalFor(allPtrs);
457
458 // Control-flow. In some cases (e.g. constants) s1 may be promoted to s32.
460 getActionDefinitionsBuilder(G_BRCOND).legalFor({s1, s32});
461
463 allFloatScalarsAndVectors, {s32, v2s32, v3s32, v4s32, v8s32, v16s32});
464
465 // TODO: Review the target OpenCL and GLSL Extended Instruction Set specs to
466 // tighten these requirements. Many of these math functions are only legal on
467 // specific bitwidths, so they are not selectable for
468 // allFloatScalarsAndVectors.
469 // clang-format off
470 getActionDefinitionsBuilder({G_STRICT_FSQRT,
471 G_FPOW,
472 G_FEXP,
473 G_FMODF,
474 G_FSINCOS,
475 G_FEXP2,
476 G_FEXP10,
477 G_FLOG,
478 G_FLOG2,
479 G_FLOG10,
480 G_FABS,
481 G_FMINNUM,
482 G_FMAXNUM,
483 G_FCEIL,
484 G_FCOS,
485 G_FSIN,
486 G_FTAN,
487 G_FACOS,
488 G_FASIN,
489 G_FATAN,
490 G_FATAN2,
491 G_FCOSH,
492 G_FSINH,
493 G_FTANH,
494 G_FSQRT,
495 G_FFLOOR,
496 G_FRINT,
497 G_FNEARBYINT,
498 G_INTRINSIC_ROUND,
499 G_INTRINSIC_TRUNC,
500 G_FMINIMUM,
501 G_FMAXIMUM,
502 G_INTRINSIC_ROUNDEVEN})
503 .legalFor(allFloatScalars)
504 .legalFor(allowedFloatVectorTypes)
508 0, ElementCount::getFixed(MaxVectorSize)));
509 // clang-format on
510
511 getActionDefinitionsBuilder(G_FCOPYSIGN)
512 .legalForCartesianProduct(allFloatScalarsAndVectors,
513 allFloatScalarsAndVectors);
514
516 allFloatScalarsAndVectors, allIntScalarsAndVectors);
517
518 if (ST.canUseExtInstSet(SPIRV::InstructionSet::OpenCL_std)) {
520 {G_CTTZ, G_CTTZ_ZERO_POISON, G_CTLZ, G_CTLZ_ZERO_POISON})
521 .legalForCartesianProduct(allIntScalarsAndVectors,
522 allIntScalarsAndVectors);
523
524 // Struct return types become a single scalar, so cannot easily legalize.
525 getActionDefinitionsBuilder({G_SMULH, G_UMULH}).alwaysLegal();
526 }
527
528 getActionDefinitionsBuilder(G_IS_FPCLASS).custom();
529
530 getActionDefinitionsBuilder({G_INTRINSIC, G_INTRINSIC_CONVERGENT,
531 G_INTRINSIC_CONVERGENT_W_SIDE_EFFECTS})
532 .alwaysLegal();
534 getActionDefinitionsBuilder({G_TRAP, G_DEBUGTRAP, G_UBSANTRAP}).alwaysLegal();
535
537 verify(*ST.getInstrInfo());
538}
539
542 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
543 Register DstReg = MI.getOperand(0).getReg();
544 Register SrcReg = MI.getOperand(1).getReg();
545 Register IdxReg = MI.getOperand(2).getReg();
546
547 MIRBuilder
548 .buildIntrinsic(Intrinsic::spv_extractelt, ArrayRef<Register>{DstReg})
549 .addUse(SrcReg)
550 .addUse(IdxReg);
551 MI.eraseFromParent();
552 return true;
553}
554
557 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
558 Register DstReg = MI.getOperand(0).getReg();
559 Register SrcReg = MI.getOperand(1).getReg();
560 Register ValReg = MI.getOperand(2).getReg();
561 Register IdxReg = MI.getOperand(3).getReg();
562
563 MIRBuilder
564 .buildIntrinsic(Intrinsic::spv_insertelt, ArrayRef<Register>{DstReg})
565 .addUse(SrcReg)
566 .addUse(ValReg)
567 .addUse(IdxReg);
568 MI.eraseFromParent();
569 return true;
570}
571
573 LegalizerHelper &Helper,
576 Register ConvReg = MRI.createGenericVirtualRegister(ConvTy);
577 MRI.setRegClass(ConvReg, GR->getRegClass(SpvType));
578 GR->assignSPIRVTypeToVReg(SpvType, ConvReg, Helper.MIRBuilder.getMF());
579 Helper.MIRBuilder.buildInstr(TargetOpcode::G_PTRTOINT)
580 .addDef(ConvReg)
581 .addUse(Reg);
582 return ConvReg;
583}
584
585static bool needsVectorLegalization(const LLT &Ty, const SPIRVSubtarget &ST) {
586 if (!Ty.isVector())
587 return false;
588 unsigned NumElements = Ty.getNumElements();
589 unsigned MaxVectorSize = ST.isShader() ? 4 : 16;
590 return (NumElements > 4 && !isPowerOf2_32(NumElements)) ||
591 NumElements > MaxVectorSize;
592}
593
596 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
597 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
598 Register DstReg = MI.getOperand(0).getReg();
599 Register PtrReg = MI.getOperand(1).getReg();
600 LLT DstTy = MRI.getType(DstReg);
601
602 if (!DstTy.isVector())
603 return true;
604
605 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
606 if (!needsVectorLegalization(DstTy, ST))
607 return true;
608
609 SmallVector<Register, 8> SplitRegs;
610 LLT EltTy = DstTy.getElementType();
611 unsigned NumElts = DstTy.getNumElements();
612
613 LLT PtrTy = MRI.getType(PtrReg);
614 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
615
616 for (unsigned i = 0; i < NumElts; ++i) {
617 auto Idx = MIRBuilder.buildConstant(LLT::scalar(32), i);
618 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
619
620 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
621 .addImm(1) // InBounds
622 .addUse(PtrReg)
623 .addUse(Zero.getReg(0))
624 .addUse(Idx.getReg(0));
625
626 MachinePointerInfo EltPtrInfo;
627 Align EltAlign = Align(1);
628 if (!MI.memoperands_empty()) {
629 MachineMemOperand *MMO = *MI.memoperands_begin();
630 EltPtrInfo =
631 MMO->getPointerInfo().getWithOffset(i * EltTy.getSizeInBytes());
632 EltAlign = commonAlignment(MMO->getAlign(), i * EltTy.getSizeInBytes());
633 }
634
635 Register EltReg = MRI.createGenericVirtualRegister(EltTy);
636 MIRBuilder.buildLoad(EltReg, EltPtr, EltPtrInfo, EltAlign);
637 SplitRegs.push_back(EltReg);
638 }
639
640 MIRBuilder.buildBuildVector(DstReg, SplitRegs);
641 MI.eraseFromParent();
642 return true;
643}
644
647 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
648 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
649 Register ValReg = MI.getOperand(0).getReg();
650 Register PtrReg = MI.getOperand(1).getReg();
651 LLT ValTy = MRI.getType(ValReg);
652
653 assert(ValTy.isVector() && "Expected vector store");
654
655 SmallVector<Register, 8> SplitRegs;
656 LLT EltTy = ValTy.getElementType();
657 unsigned NumElts = ValTy.getNumElements();
658
659 for (unsigned i = 0; i < NumElts; ++i)
660 SplitRegs.push_back(MRI.createGenericVirtualRegister(EltTy));
661
662 MIRBuilder.buildUnmerge(SplitRegs, ValReg);
663
664 LLT PtrTy = MRI.getType(PtrReg);
665 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
666
667 for (unsigned i = 0; i < NumElts; ++i) {
668 auto Idx = MIRBuilder.buildConstant(LLT::scalar(32), i);
669 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
670
671 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
672 .addImm(1) // InBounds
673 .addUse(PtrReg)
674 .addUse(Zero.getReg(0))
675 .addUse(Idx.getReg(0));
676
677 MachinePointerInfo EltPtrInfo;
678 Align EltAlign = Align(1);
679 if (!MI.memoperands_empty()) {
680 MachineMemOperand *MMO = *MI.memoperands_begin();
681 EltPtrInfo =
682 MMO->getPointerInfo().getWithOffset(i * EltTy.getSizeInBytes());
683 EltAlign = commonAlignment(MMO->getAlign(), i * EltTy.getSizeInBytes());
684 }
685
686 MIRBuilder.buildStore(SplitRegs[i], EltPtr, EltPtrInfo, EltAlign);
687 }
688
689 MI.eraseFromParent();
690 return true;
691}
692
695 LostDebugLocObserver &LocObserver) const {
696 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
697 switch (MI.getOpcode()) {
698 default:
699 // TODO: implement legalization for other opcodes.
700 return true;
701 case TargetOpcode::G_BITCAST:
702 return legalizeBitcast(Helper, MI);
703 case TargetOpcode::G_EXTRACT_VECTOR_ELT:
704 return legalizeExtractVectorElt(Helper, MI, GR);
705 case TargetOpcode::G_INSERT_VECTOR_ELT:
706 return legalizeInsertVectorElt(Helper, MI, GR);
707 case TargetOpcode::G_INTRINSIC:
708 case TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS:
709 return legalizeIntrinsic(Helper, MI);
710 case TargetOpcode::G_IS_FPCLASS:
711 return legalizeIsFPClass(Helper, MI, LocObserver);
712 case TargetOpcode::G_ICMP: {
713 auto &Op0 = MI.getOperand(2);
714 auto &Op1 = MI.getOperand(3);
715 Register Reg0 = Op0.getReg();
716 Register Reg1 = Op1.getReg();
718 static_cast<CmpInst::Predicate>(MI.getOperand(1).getPredicate());
719 if ((!ST->canDirectlyComparePointers() ||
721 MRI.getType(Reg0).isPointer() && MRI.getType(Reg1).isPointer()) {
722 LLT ConvT = LLT::scalar(ST->getPointerSize());
723 Type *LLVMTy = IntegerType::get(MI.getMF()->getFunction().getContext(),
724 ST->getPointerSize());
725 SPIRVTypeInst SpirvTy = GR->getOrCreateSPIRVType(
726 LLVMTy, Helper.MIRBuilder, SPIRV::AccessQualifier::ReadWrite, true);
727 Op0.setReg(convertPtrToInt(Reg0, ConvT, SpirvTy, Helper, MRI, GR));
728 Op1.setReg(convertPtrToInt(Reg1, ConvT, SpirvTy, Helper, MRI, GR));
729 }
730 return true;
731 }
732 case TargetOpcode::G_LOAD:
733 return legalizeLoad(Helper, MI, GR);
734 case TargetOpcode::G_STORE:
735 return legalizeStore(Helper, MI, GR);
736 }
737}
738
741 Register SrcReg, LLT SrcTy,
742 MachinePointerInfo &PtrInfo, Align &VecAlign) {
743 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
744 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
745
746 VecAlign = Helper.getStackTemporaryAlignment(SrcTy);
747 auto StackTemp = Helper.createStackTemporary(
748 TypeSize::getFixed(SrcTy.getSizeInBytes()), VecAlign, PtrInfo);
749
750 // Set the type of StackTemp to a pointer to an array of the element type.
751 SPIRVTypeInst SpvSrcTy = GR->getSPIRVTypeForVReg(SrcReg);
752 SPIRVTypeInst EltSpvTy = GR->getScalarOrVectorComponentType(SpvSrcTy);
753 const Type *LLVMEltTy = GR->getTypeForSPIRVType(EltSpvTy);
754 const Type *LLVMArrTy =
755 ArrayType::get(const_cast<Type *>(LLVMEltTy), SrcTy.getNumElements());
756 SPIRVTypeInst ArrSpvTy = GR->getOrCreateSPIRVType(
757 LLVMArrTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite, true);
758 SPIRVTypeInst PtrToArrSpvTy = GR->getOrCreateSPIRVPointerType(
759 ArrSpvTy, MIRBuilder, SPIRV::StorageClass::Function);
760
761 Register StackReg = StackTemp.getReg(0);
762 MRI.setRegClass(StackReg, GR->getRegClass(PtrToArrSpvTy));
763 GR->assignSPIRVTypeToVReg(PtrToArrSpvTy, StackReg, MIRBuilder.getMF());
764
765 return StackTemp;
766}
767
770 LLVM_DEBUG(dbgs() << "Found a bitcast instruction\n");
771 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
772 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
773 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
774
775 Register DstReg = MI.getOperand(0).getReg();
776 Register SrcReg = MI.getOperand(2).getReg();
777 LLT DstTy = MRI.getType(DstReg);
778 LLT SrcTy = MRI.getType(SrcReg);
779
780 // If an spv_bitcast needs to be legalized, we convert it to G_BITCAST to
781 // allow using the generic legalization rules.
782 if (needsVectorLegalization(DstTy, ST) ||
783 needsVectorLegalization(SrcTy, ST)) {
784 LLVM_DEBUG(dbgs() << "Replacing with a G_BITCAST\n");
785 MIRBuilder.buildBitcast(DstReg, SrcReg);
786 MI.eraseFromParent();
787 }
788 return true;
789}
790
793 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
794 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
795 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
796
797 Register DstReg = MI.getOperand(0).getReg();
798 LLT DstTy = MRI.getType(DstReg);
799
800 if (needsVectorLegalization(DstTy, ST)) {
801 Register SrcReg = MI.getOperand(2).getReg();
802 Register ValReg = MI.getOperand(3).getReg();
803 LLT SrcTy = MRI.getType(SrcReg);
804 MachineOperand &IdxOperand = MI.getOperand(4);
805
806 if (getImm(IdxOperand, &MRI)) {
807 uint64_t IdxVal = foldImm(IdxOperand, &MRI);
808 if (IdxVal < SrcTy.getNumElements()) {
810 SPIRVTypeInst ElementType =
812 LLT ElementLLTTy = GR->getRegType(ElementType);
813 for (unsigned I = 0, E = SrcTy.getNumElements(); I < E; ++I) {
814 Register Reg = MRI.createGenericVirtualRegister(ElementLLTTy);
815 MRI.setRegClass(Reg, GR->getRegClass(ElementType));
816 GR->assignSPIRVTypeToVReg(ElementType, Reg, *MI.getMF());
817 Regs.push_back(Reg);
818 }
819 MIRBuilder.buildUnmerge(Regs, SrcReg);
820 Regs[IdxVal] = ValReg;
821 MIRBuilder.buildBuildVector(DstReg, Regs);
822 MI.eraseFromParent();
823 return true;
824 }
825 }
826
827 LLT EltTy = SrcTy.getElementType();
828 Align VecAlign;
829 MachinePointerInfo PtrInfo;
830 auto StackTemp = createStackTemporaryForVector(Helper, GR, SrcReg, SrcTy,
831 PtrInfo, VecAlign);
832
833 MIRBuilder.buildStore(SrcReg, StackTemp, PtrInfo, VecAlign);
834
835 Register IdxReg = IdxOperand.getReg();
836 LLT PtrTy = MRI.getType(StackTemp.getReg(0));
837 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
838 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
839
840 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
841 .addImm(1) // InBounds
842 .addUse(StackTemp.getReg(0))
843 .addUse(Zero.getReg(0))
844 .addUse(IdxReg);
845
847 Align EltAlign = Helper.getStackTemporaryAlignment(EltTy);
848 MIRBuilder.buildStore(ValReg, EltPtr, EltPtrInfo, EltAlign);
849
850 MIRBuilder.buildLoad(DstReg, StackTemp, PtrInfo, VecAlign);
851 MI.eraseFromParent();
852 return true;
853 }
854 return true;
855}
856
859 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
860 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
861 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
862
863 Register SrcReg = MI.getOperand(2).getReg();
864 LLT SrcTy = MRI.getType(SrcReg);
865
866 if (needsVectorLegalization(SrcTy, ST)) {
867 Register DstReg = MI.getOperand(0).getReg();
868 MachineOperand &IdxOperand = MI.getOperand(3);
869
870 if (getImm(IdxOperand, &MRI)) {
871 uint64_t IdxVal = foldImm(IdxOperand, &MRI);
872 if (IdxVal < SrcTy.getNumElements()) {
873 LLT DstTy = MRI.getType(DstReg);
875 SPIRVTypeInst DstSpvTy = GR->getSPIRVTypeForVReg(DstReg);
876 for (unsigned I = 0, E = SrcTy.getNumElements(); I < E; ++I) {
877 if (I == IdxVal) {
878 Regs.push_back(DstReg);
879 } else {
881 MRI.setRegClass(Reg, GR->getRegClass(DstSpvTy));
882 GR->assignSPIRVTypeToVReg(DstSpvTy, Reg, *MI.getMF());
883 Regs.push_back(Reg);
884 }
885 }
886 MIRBuilder.buildUnmerge(Regs, SrcReg);
887 MI.eraseFromParent();
888 return true;
889 }
890 }
891
892 LLT EltTy = SrcTy.getElementType();
893 Align VecAlign;
894 MachinePointerInfo PtrInfo;
895 auto StackTemp = createStackTemporaryForVector(Helper, GR, SrcReg, SrcTy,
896 PtrInfo, VecAlign);
897
898 MIRBuilder.buildStore(SrcReg, StackTemp, PtrInfo, VecAlign);
899
900 Register IdxReg = IdxOperand.getReg();
901 LLT PtrTy = MRI.getType(StackTemp.getReg(0));
902 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
903 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
904
905 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
906 .addImm(1) // InBounds
907 .addUse(StackTemp.getReg(0))
908 .addUse(Zero.getReg(0))
909 .addUse(IdxReg);
910
912 Align EltAlign = Helper.getStackTemporaryAlignment(EltTy);
913 MIRBuilder.buildLoad(DstReg, EltPtr, EltPtrInfo, EltAlign);
914
915 MI.eraseFromParent();
916 return true;
917 }
918 return true;
919}
920
923 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
924 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
925 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
926
927 Register DstReg = MI.getOperand(0).getReg();
928 LLT DstTy = MRI.getType(DstReg);
929
930 if (!needsVectorLegalization(DstTy, ST))
931 return true;
932
934 if (MI.getNumOperands() == 2) {
935 // The "null" case: no values are attached.
936 LLT EltTy = DstTy.getElementType();
937 auto Zero = MIRBuilder.buildConstant(EltTy, 0);
938 SPIRVTypeInst SpvDstTy = GR->getSPIRVTypeForVReg(DstReg);
939 SPIRVTypeInst SpvEltTy = GR->getScalarOrVectorComponentType(SpvDstTy);
940 GR->assignSPIRVTypeToVReg(SpvEltTy, Zero.getReg(0), MIRBuilder.getMF());
941 for (unsigned i = 0; i < DstTy.getNumElements(); ++i)
942 SrcRegs.push_back(Zero.getReg(0));
943 } else {
944 for (unsigned i = 2; i < MI.getNumOperands(); ++i) {
945 SrcRegs.push_back(MI.getOperand(i).getReg());
946 }
947 }
948 MIRBuilder.buildBuildVector(DstReg, SrcRegs);
949 MI.eraseFromParent();
950 return true;
951}
952
954 MachineInstr &MI) const {
955 LLVM_DEBUG(dbgs() << "legalizeIntrinsic: " << MI);
956 auto IntrinsicID = cast<GIntrinsic>(MI).getIntrinsicID();
957 switch (IntrinsicID) {
958 case Intrinsic::spv_bitcast:
959 return legalizeSpvBitcast(Helper, MI, GR);
960 case Intrinsic::spv_insertelt:
961 return legalizeSpvInsertElt(Helper, MI, GR);
962 case Intrinsic::spv_extractelt:
963 return legalizeSpvExtractElt(Helper, MI, GR);
964 case Intrinsic::spv_const_composite:
965 return legalizeSpvConstComposite(Helper, MI, GR);
966 }
967 return true;
968}
969
970bool SPIRVLegalizerInfo::legalizeBitcast(LegalizerHelper &Helper,
971 MachineInstr &MI) const {
972 // Once the G_BITCAST is using vectors that are allowed, we turn it back into
973 // an spv_bitcast to avoid verifier problems when the register types are the
974 // same for the source and the result. Note that the SPIR-V types associated
975 // with the bitcast can be different even if the register types are the same.
976 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
977 Register DstReg = MI.getOperand(0).getReg();
978 Register SrcReg = MI.getOperand(1).getReg();
979 SmallVector<Register, 1> DstRegs = {DstReg};
980 MIRBuilder.buildIntrinsic(Intrinsic::spv_bitcast, DstRegs).addUse(SrcReg);
981 MI.eraseFromParent();
982 return true;
983}
984
985// Note this code was copied from LegalizerHelper::lowerISFPCLASS and adjusted
986// to ensure that all instructions created during the lowering have SPIR-V types
987// assigned to them.
988bool SPIRVLegalizerInfo::legalizeIsFPClass(
990 LostDebugLocObserver &LocObserver) const {
991 auto [DstReg, DstTy, SrcReg, SrcTy] = MI.getFirst2RegLLTs();
992 FPClassTest Mask = static_cast<FPClassTest>(MI.getOperand(2).getImm());
993
994 auto &MIRBuilder = Helper.MIRBuilder;
995 auto &MF = MIRBuilder.getMF();
996 MachineRegisterInfo &MRI = MF.getRegInfo();
997
998 Type *LLVMDstTy =
999 IntegerType::get(MIRBuilder.getContext(), DstTy.getScalarSizeInBits());
1000 if (DstTy.isVector())
1001 LLVMDstTy = VectorType::get(LLVMDstTy, DstTy.getElementCount());
1002 SPIRVTypeInst SPIRVDstTy = GR->getOrCreateSPIRVType(
1003 LLVMDstTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite,
1004 /*EmitIR*/ true);
1005
1006 unsigned BitSize = SrcTy.getScalarSizeInBits();
1007 const fltSemantics &Semantics = getFltSemanticForLLT(SrcTy.getScalarType());
1008
1009 LLT IntTy = LLT::scalar(BitSize);
1010 Type *LLVMIntTy = IntegerType::get(MIRBuilder.getContext(), BitSize);
1011 if (SrcTy.isVector()) {
1012 IntTy = LLT::vector(SrcTy.getElementCount(), IntTy);
1013 LLVMIntTy = VectorType::get(LLVMIntTy, SrcTy.getElementCount());
1014 }
1015 SPIRVTypeInst SPIRVIntTy = GR->getOrCreateSPIRVType(
1016 LLVMIntTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite,
1017 /*EmitIR*/ true);
1018
1019 // Clang doesn't support capture of structured bindings:
1020 LLT DstTyCopy = DstTy;
1021 const auto assignSPIRVTy = [&](MachineInstrBuilder &&MI) {
1022 // Assign this MI's (assumed only) destination to one of the two types we
1023 // expect: either the G_IS_FPCLASS's destination type, or the integer type
1024 // bitcast from the source type.
1025 LLT MITy = MRI.getType(MI.getReg(0));
1026 assert((MITy == IntTy || MITy == DstTyCopy) &&
1027 "Unexpected LLT type while lowering G_IS_FPCLASS");
1028 SPIRVTypeInst SPVTy = MITy == IntTy ? SPIRVIntTy : SPIRVDstTy;
1029 GR->assignSPIRVTypeToVReg(SPVTy, MI.getReg(0), MF);
1030 return MI;
1031 };
1032
1033 // Helper to build and assign a constant in one go
1034 const auto buildSPIRVConstant = [&](LLT Ty, auto &&C) -> MachineInstrBuilder {
1035 if (!Ty.isFixedVector())
1036 return assignSPIRVTy(MIRBuilder.buildConstant(Ty, C));
1037 auto ScalarC = MIRBuilder.buildConstant(Ty.getScalarType(), C);
1038 assert((Ty == IntTy || Ty == DstTyCopy) &&
1039 "Unexpected LLT type while lowering constant for G_IS_FPCLASS");
1040 SPIRVTypeInst VecEltTy = GR->getOrCreateSPIRVType(
1041 (Ty == IntTy ? LLVMIntTy : LLVMDstTy)->getScalarType(), MIRBuilder,
1042 SPIRV::AccessQualifier::ReadWrite,
1043 /*EmitIR*/ true);
1044 GR->assignSPIRVTypeToVReg(VecEltTy, ScalarC.getReg(0), MF);
1045 return assignSPIRVTy(MIRBuilder.buildSplatBuildVector(Ty, ScalarC));
1046 };
1047
1048 if (Mask == fcNone) {
1049 MIRBuilder.buildCopy(DstReg, buildSPIRVConstant(DstTy, 0));
1050 MI.eraseFromParent();
1051 return true;
1052 }
1053 if (Mask == fcAllFlags) {
1054 MIRBuilder.buildCopy(DstReg, buildSPIRVConstant(DstTy, 1));
1055 MI.eraseFromParent();
1056 return true;
1057 }
1058
1059 // Note that rather than creating a COPY here (between a floating-point and
1060 // integer type of the same size) we create a SPIR-V bitcast immediately. We
1061 // can't create a G_BITCAST because the LLTs are the same, and we can't seem
1062 // to correctly lower COPYs to SPIR-V bitcasts at this moment.
1063 Register ResVReg = MRI.createGenericVirtualRegister(IntTy);
1064 MRI.setRegClass(ResVReg, GR->getRegClass(SPIRVIntTy));
1065 GR->assignSPIRVTypeToVReg(SPIRVIntTy, ResVReg, Helper.MIRBuilder.getMF());
1066 auto AsInt = MIRBuilder.buildInstr(SPIRV::OpBitcast)
1067 .addDef(ResVReg)
1068 .addUse(GR->getSPIRVTypeID(SPIRVIntTy))
1069 .addUse(SrcReg);
1070 AsInt = assignSPIRVTy(std::move(AsInt));
1071
1072 // Various masks.
1073 APInt SignBit = APInt::getSignMask(BitSize);
1074 APInt ValueMask = APInt::getSignedMaxValue(BitSize); // All bits but sign.
1075 APInt Inf = APFloat::getInf(Semantics).bitcastToAPInt(); // Exp and int bit.
1076 APInt ExpMask = Inf;
1077 APInt AllOneMantissa = APFloat::getLargest(Semantics).bitcastToAPInt() & ~Inf;
1078 APInt QNaNBitMask =
1079 APInt::getOneBitSet(BitSize, AllOneMantissa.getActiveBits() - 1);
1080 APInt InversionMask = APInt::getAllOnes(DstTy.getScalarSizeInBits());
1081
1082 auto SignBitC = buildSPIRVConstant(IntTy, SignBit);
1083 auto ValueMaskC = buildSPIRVConstant(IntTy, ValueMask);
1084 auto InfC = buildSPIRVConstant(IntTy, Inf);
1085 auto ExpMaskC = buildSPIRVConstant(IntTy, ExpMask);
1086 auto ZeroC = buildSPIRVConstant(IntTy, 0);
1087
1088 auto Abs = assignSPIRVTy(MIRBuilder.buildAnd(IntTy, AsInt, ValueMaskC));
1089 auto Sign = assignSPIRVTy(
1090 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_NE, DstTy, AsInt, Abs));
1091
1092 auto Res = buildSPIRVConstant(DstTy, 0);
1093
1094 const auto appendToRes = [&](MachineInstrBuilder &&ToAppend) {
1095 Res = assignSPIRVTy(
1096 MIRBuilder.buildOr(DstTyCopy, Res, assignSPIRVTy(std::move(ToAppend))));
1097 };
1098
1099 // Tests that involve more than one class should be processed first.
1100 if ((Mask & fcFinite) == fcFinite) {
1101 // finite(V) ==> abs(V) u< exp_mask
1102 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, Abs,
1103 ExpMaskC));
1104 Mask &= ~fcFinite;
1105 } else if ((Mask & fcFinite) == fcPosFinite) {
1106 // finite(V) && V > 0 ==> V u< exp_mask
1107 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, AsInt,
1108 ExpMaskC));
1109 Mask &= ~fcPosFinite;
1110 } else if ((Mask & fcFinite) == fcNegFinite) {
1111 // finite(V) && V < 0 ==> abs(V) u< exp_mask && signbit == 1
1112 auto Cmp = assignSPIRVTy(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT,
1113 DstTy, Abs, ExpMaskC));
1114 appendToRes(MIRBuilder.buildAnd(DstTy, Cmp, Sign));
1115 Mask &= ~fcNegFinite;
1116 }
1117
1118 if (FPClassTest PartialCheck = Mask & (fcZero | fcSubnormal)) {
1119 // fcZero | fcSubnormal => test all exponent bits are 0
1120 // TODO: Handle sign bit specific cases
1121 // TODO: Handle inverted case
1122 if (PartialCheck == (fcZero | fcSubnormal)) {
1123 auto ExpBits = assignSPIRVTy(MIRBuilder.buildAnd(IntTy, AsInt, ExpMaskC));
1124 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1125 ExpBits, ZeroC));
1126 Mask &= ~PartialCheck;
1127 }
1128 }
1129
1130 // Check for individual classes.
1131 if (FPClassTest PartialCheck = Mask & fcZero) {
1132 if (PartialCheck == fcPosZero)
1133 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1134 AsInt, ZeroC));
1135 else if (PartialCheck == fcZero)
1136 appendToRes(
1137 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy, Abs, ZeroC));
1138 else // fcNegZero
1139 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1140 AsInt, SignBitC));
1141 }
1142
1143 if (FPClassTest PartialCheck = Mask & fcSubnormal) {
1144 // issubnormal(V) ==> unsigned(abs(V) - 1) u< (all mantissa bits set)
1145 // issubnormal(V) && V>0 ==> unsigned(V - 1) u< (all mantissa bits set)
1146 auto V = (PartialCheck == fcPosSubnormal) ? AsInt : Abs;
1147 auto OneC = buildSPIRVConstant(IntTy, 1);
1148 auto VMinusOne = MIRBuilder.buildSub(IntTy, V, OneC);
1149 auto SubnormalRes = assignSPIRVTy(
1150 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, VMinusOne,
1151 buildSPIRVConstant(IntTy, AllOneMantissa)));
1152 if (PartialCheck == fcNegSubnormal)
1153 SubnormalRes = MIRBuilder.buildAnd(DstTy, SubnormalRes, Sign);
1154 appendToRes(std::move(SubnormalRes));
1155 }
1156
1157 if (FPClassTest PartialCheck = Mask & fcInf) {
1158 if (PartialCheck == fcPosInf)
1159 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1160 AsInt, InfC));
1161 else if (PartialCheck == fcInf)
1162 appendToRes(
1163 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy, Abs, InfC));
1164 else { // fcNegInf
1165 APInt NegInf = APFloat::getInf(Semantics, true).bitcastToAPInt();
1166 auto NegInfC = buildSPIRVConstant(IntTy, NegInf);
1167 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1168 AsInt, NegInfC));
1169 }
1170 }
1171
1172 if (FPClassTest PartialCheck = Mask & fcNan) {
1173 auto InfWithQnanBitC =
1174 buildSPIRVConstant(IntTy, std::move(Inf) | QNaNBitMask);
1175 if (PartialCheck == fcNan) {
1176 // isnan(V) ==> abs(V) u> int(inf)
1177 appendToRes(
1178 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGT, DstTy, Abs, InfC));
1179 } else if (PartialCheck == fcQNan) {
1180 // isquiet(V) ==> abs(V) u>= (unsigned(Inf) | quiet_bit)
1181 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGE, DstTy, Abs,
1182 InfWithQnanBitC));
1183 } else { // fcSNan
1184 // issignaling(V) ==> abs(V) u> unsigned(Inf) &&
1185 // abs(V) u< (unsigned(Inf) | quiet_bit)
1186 auto IsNan = assignSPIRVTy(
1187 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGT, DstTy, Abs, InfC));
1188 auto IsNotQnan = assignSPIRVTy(MIRBuilder.buildICmp(
1189 CmpInst::Predicate::ICMP_ULT, DstTy, Abs, InfWithQnanBitC));
1190 appendToRes(MIRBuilder.buildAnd(DstTy, IsNan, IsNotQnan));
1191 }
1192 }
1193
1194 if (FPClassTest PartialCheck = Mask & fcNormal) {
1195 // isnormal(V) ==> (0 u< exp u< max_exp) ==> (unsigned(exp-1) u<
1196 // (max_exp-1))
1197 APInt ExpLSB = ExpMask & ~(ExpMask.shl(1));
1198 auto ExpMinusOne = assignSPIRVTy(
1199 MIRBuilder.buildSub(IntTy, Abs, buildSPIRVConstant(IntTy, ExpLSB)));
1200 APInt MaxExpMinusOne = std::move(ExpMask) - ExpLSB;
1201 auto NormalRes = assignSPIRVTy(
1202 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, ExpMinusOne,
1203 buildSPIRVConstant(IntTy, MaxExpMinusOne)));
1204 if (PartialCheck == fcNegNormal)
1205 NormalRes = MIRBuilder.buildAnd(DstTy, NormalRes, Sign);
1206 else if (PartialCheck == fcPosNormal) {
1207 auto PosSign = assignSPIRVTy(MIRBuilder.buildXor(
1208 DstTy, Sign, buildSPIRVConstant(DstTy, InversionMask)));
1209 NormalRes = MIRBuilder.buildAnd(DstTy, NormalRes, PosSign);
1210 }
1211 appendToRes(std::move(NormalRes));
1212 }
1213
1214 MIRBuilder.buildCopy(DstReg, Res);
1215 MI.eraseFromParent();
1216 return true;
1217}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static void scalarize(Instruction *I, SmallVectorImpl< Instruction * > &Worklist)
Declares convenience wrapper classes for interpreting MachineInstr instances as specific generic oper...
IRTranslator LLVM IR MI
#define I(x, y, z)
Definition MD5.cpp:57
This file declares the MachineIRBuilder class.
Register Reg
Promote Memory to Register
Definition Mem2Reg.cpp:110
ppc ctr loops verify
const SmallVectorImpl< MachineOperand > & Cond
static bool legalizeSpvInsertElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool needsVectorLegalization(const LLT &Ty, const SPIRVSubtarget &ST)
static MachineInstrBuilder createStackTemporaryForVector(LegalizerHelper &Helper, SPIRVGlobalRegistry *GR, Register SrcReg, LLT SrcTy, MachinePointerInfo &PtrInfo, Align &VecAlign)
static Register convertPtrToInt(Register Reg, LLT ConvTy, SPIRVTypeInst SpvType, LegalizerHelper &Helper, MachineRegisterInfo &MRI, SPIRVGlobalRegistry *GR)
LegalityPredicate typeOfExtendedScalars(unsigned TypeIdx, bool IsExtendedInts)
static bool legalizeExtractVectorElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeStore(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvExtractElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvBitcast(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvConstComposite(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeLoad(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeInsertVectorElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
#define LLVM_DEBUG(...)
Definition Debug.h:119
APInt bitcastToAPInt() const
Definition APFloat.h:1430
static APFloat getLargest(const fltSemantics &Sem, bool Negative=false)
Returns the largest finite number in the given semantics.
Definition APFloat.h:1197
static APFloat getInf(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Infinity.
Definition APFloat.h:1157
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition APInt.h:235
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition APInt.h:230
unsigned getActiveBits() const
Compute the number of active bits in the value.
Definition APInt.h:1535
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition APInt.h:880
static APInt getOneBitSet(unsigned numBits, unsigned BitNo)
Return an APInt with exactly one bit set in the result.
Definition APInt.h:240
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
static LLVM_ABI ArrayType * get(Type *ElementType, uint64_t NumElements)
This static method is the primary way to construct an ArrayType.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:740
@ ICMP_UGE
unsigned greater or equal
Definition InstrTypes.h:764
@ ICMP_UGT
unsigned greater than
Definition InstrTypes.h:763
@ ICMP_ULT
unsigned less than
Definition InstrTypes.h:765
@ ICMP_NE
not equal
Definition InstrTypes.h:762
static constexpr ElementCount getFixed(ScalarTy MinVal)
Definition TypeSize.h:309
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:354
static constexpr LLT vector(ElementCount EC, unsigned ScalarSizeInBits)
Get a low-level vector of some number of elements and element width.
LLT getScalarType() const
constexpr bool isPointerVector() const
static constexpr LLT scalar(unsigned SizeInBits)
Get a low-level scalar or aggregate "bag of bits".
constexpr bool isValid() const
constexpr uint16_t getNumElements() const
Returns the number of elements in a vector LLT.
constexpr bool isVector() const
static constexpr LLT pointer(unsigned AddressSpace, unsigned SizeInBits)
Get a low-level pointer in the given address space.
constexpr bool isPointer() const
constexpr unsigned getAddressSpace() const
static constexpr LLT fixed_vector(unsigned NumElements, unsigned ScalarSizeInBits)
Get a low-level fixed-width vector of some number of elements and element width.
constexpr bool isPointerOrPointerVector() const
constexpr bool isFixedVector() const
Returns true if the LLT is a fixed vector.
constexpr TypeSize getSizeInBytes() const
Returns the total size of the type in bytes, i.e.
LLT getElementType() const
Returns the vector's element type. Only valid for vector types.
LLVM_ABI void computeTables()
Compute any ancillary tables needed to quickly decide how an operation should be handled.
LegalizeRuleSet & legalFor(std::initializer_list< LLT > Types)
The instruction is legal when type index 0 is any type in the given list.
LegalizeRuleSet & fewerElementsIf(LegalityPredicate Predicate, LegalizeMutation Mutation)
Remove elements to reach the type selected by the mutation if the predicate is true.
LegalizeRuleSet & moreElementsToNextPow2(unsigned TypeIdx)
Add more elements to the vector to reach the next power of two.
LegalizeRuleSet & lower()
The instruction is lowered.
LegalizeRuleSet & scalarizeIf(LegalityPredicate Predicate, unsigned TypeIdx)
LegalizeRuleSet & lowerIf(LegalityPredicate Predicate)
The instruction is lowered if predicate is true.
LegalizeRuleSet & custom()
Unconditionally custom lower.
LegalizeRuleSet & unsupportedIf(LegalityPredicate Predicate)
LegalizeRuleSet & alwaysLegal()
LegalizeRuleSet & scalarize(unsigned TypeIdx)
LegalizeRuleSet & legalForCartesianProduct(std::initializer_list< LLT > Types)
The instruction is legal when type indexes 0 and 1 are both in the given list.
LegalizeRuleSet & legalIf(LegalityPredicate Predicate)
The instruction is legal if predicate is true.
LegalizeRuleSet & customFor(std::initializer_list< LLT > Types)
LLVM_ABI MachineInstrBuilder createStackTemporary(TypeSize Bytes, Align Alignment, MachinePointerInfo &PtrInfo)
Create a stack temporary based on the size in bytes and the alignment.
MachineIRBuilder & MIRBuilder
Expose MIRBuilder so clients can set their own RecordInsertInstruction functions.
LLVM_ABI Align getStackTemporaryAlignment(LLT Type, Align MinAlign=Align()) const
Return the alignment to use for a stack temporary object with the given type.
LegalizeRuleSet & getActionDefinitionsBuilder(unsigned Opcode)
Get the action definition builder for the given opcode.
const LegacyLegalizerInfo & getLegacyLegalizerInfo() const
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Helper class to build MachineInstr.
LLVMContext & getContext() const
MachineInstrBuilder buildUnmerge(ArrayRef< LLT > Res, const SrcOp &Op)
Build and insert Res0, ... = G_UNMERGE_VALUES Op.
MachineInstrBuilder buildAnd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_AND Op0, Op1.
MachineInstrBuilder buildICmp(CmpInst::Predicate Pred, const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_ICMP Pred, Op0, Op1.
MachineInstrBuilder buildSub(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_SUB Op0, Op1.
MachineInstrBuilder buildIntrinsic(Intrinsic::ID ID, ArrayRef< Register > Res, bool HasSideEffects, bool isConvergent)
Build and insert a G_INTRINSIC instruction.
MachineInstrBuilder buildSplatBuildVector(const DstOp &Res, const SrcOp &Src)
Build and insert Res = G_BUILD_VECTOR with Src replicated to fill the number of elements.
MachineInstrBuilder buildBuildVector(const DstOp &Res, ArrayRef< Register > Ops)
Build and insert Res = G_BUILD_VECTOR Op0, ...
MachineInstrBuilder buildLoad(const DstOp &Res, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert Res = G_LOAD Addr, MMO.
MachineInstrBuilder buildStore(const SrcOp &Val, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert G_STORE Val, Addr, MMO.
MachineInstrBuilder buildInstr(unsigned Opcode)
Build and insert <empty> = Opcode <empty>.
MachineFunction & getMF()
Getter for the function we currently build.
MachineInstrBuilder buildBitcast(const DstOp &Dst, const SrcOp &Src)
Build and insert Dst = G_BITCAST Src.
MachineRegisterInfo * getMRI()
Getter for MRI.
MachineInstrBuilder buildOr(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_OR Op0, Op1.
MachineInstrBuilder buildCopy(const DstOp &Res, const SrcOp &Op)
Build and insert Res = COPY Op.
MachineInstrBuilder buildXor(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_XOR Op0, Op1.
virtual MachineInstrBuilder buildConstant(const DstOp &Res, const ConstantInt &Val)
Build and insert Res = G_CONSTANT Val.
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
Representation of each machine instruction.
A description of a memory reference used in the backend.
const MachinePointerInfo & getPointerInfo() const
LLVM_ABI Align getAlign() const
Return the minimum known alignment in bytes of the actual memory reference.
MachineOperand class - Representation of each machine instruction operand.
Register getReg() const
getReg - Returns the register number.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLT getType(Register Reg) const
Get the low-level type of Reg or LLT{} if Reg is not a generic (target independent) virtual register.
LLVM_ABI void setRegClass(Register Reg, const TargetRegisterClass *RC)
setRegClass - Set the register class of the specified virtual register.
LLVM_ABI Register createGenericVirtualRegister(LLT Ty, StringRef Name="")
Create and return a new generic virtual register with low-level type Ty.
Wrapper class representing virtual and physical registers.
Definition Register.h:20
void assignSPIRVTypeToVReg(SPIRVTypeInst Type, Register VReg, const MachineFunction &MF)
const TargetRegisterClass * getRegClass(SPIRVTypeInst SpvType) const
const Type * getTypeForSPIRVType(SPIRVTypeInst Ty) const
LLT getRegType(SPIRVTypeInst SpvType) const
SPIRVTypeInst getOrCreateSPIRVPointerType(const Type *BaseType, MachineIRBuilder &MIRBuilder, SPIRV::StorageClass::StorageClass SC)
SPIRVTypeInst getScalarOrVectorComponentType(SPIRVTypeInst Type) const
SPIRVTypeInst getOrCreateSPIRVType(const Type *Type, MachineInstr &I, SPIRV::AccessQualifier::AccessQualifier AQ, bool EmitIR)
SPIRVTypeInst getSPIRVTypeForVReg(Register VReg, const MachineFunction *MF=nullptr) const
SPIRVLegalizerInfo(const SPIRVSubtarget &ST)
bool legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI, LostDebugLocObserver &LocObserver) const override
Called for instructions with the Custom LegalizationAction.
bool legalizeIntrinsic(LegalizerHelper &Helper, MachineInstr &MI) const override
SPIRVGlobalRegistry * getSPIRVGlobalRegistry() const
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:343
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
static LLVM_ABI VectorType * get(Type *ElementType, ElementCount EC)
This static method is the primary way to construct an VectorType.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
LLVM_ABI LegalityPredicate isScalar(unsigned TypeIdx)
True iff the specified type index is a scalar.
LLVM_ABI LegalityPredicate numElementsNotPow2(unsigned TypeIdx)
True iff the specified type index is a vector whose element count is not a power of 2.
LLVM_ABI LegalityPredicate vectorElementCountIsLessThanOrEqualTo(unsigned TypeIdx, unsigned Size)
True iff the specified type index is a vector with a number of elements that's less than or equal to ...
LLVM_ABI LegalityPredicate typeInSet(unsigned TypeIdx, std::initializer_list< LLT > TypesInit)
True iff the given type index is one of the specified types.
LLVM_ABI LegalityPredicate vectorElementCountIsGreaterThan(unsigned TypeIdx, unsigned Size)
True iff the specified type index is a vector with a number of elements that's greater than the given...
Predicate any(Predicate P0, Predicate P1)
True iff P0 or P1 are true.
LegalityPredicate typeIsNot(unsigned TypeIdx, LLT Type)
True iff the given type index is not the specified type.
Predicate all(Predicate P0, Predicate P1)
True iff P0 and P1 are true.
LLVM_ABI LegalityPredicate typeIs(unsigned TypeIdx, LLT TypesInit)
True iff the given type index is the specified type.
LLVM_ABI LegalizeMutation changeElementCountTo(unsigned TypeIdx, unsigned FromTypeIdx)
Keep the same scalar or element type as TypeIdx, but take the number of elements from FromTypeIdx.
LLVM_ABI LegalizeMutation changeElementSizeTo(unsigned TypeIdx, unsigned FromTypeIdx)
Change the scalar size or element size to have the same scalar size as type index FromIndex.
Invariant opcodes: All instruction sets have these as their low opcodes.
This is an optimization pass for GlobalISel generic memory operations.
LLVM_ABI const llvm::fltSemantics & getFltSemanticForLLT(LLT Ty)
Get the appropriate floating point arithmetic semantic based on the bit size of the given scalar LLT.
std::function< bool(const LegalityQuery &)> LegalityPredicate
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition MathExtras.h:279
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209
const std::set< unsigned > & getTypeFoldingSupportedOpcodes()
int64_t foldImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:201
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
The LegalityQuery object bundles together all the information that's needed to decide whether a given...
ArrayRef< LLT > Types
This class contains a discriminated union of information about pointers in memory operands,...
MachinePointerInfo getWithOffset(int64_t O) const