LLVM 23.0.0git
SPIRVLegalizerInfo.cpp
Go to the documentation of this file.
1//===- SPIRVLegalizerInfo.cpp --- SPIR-V Legalization Rules ------*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the targeting of the Machinelegalizer class for SPIR-V.
10//
11//===----------------------------------------------------------------------===//
12
13#include "SPIRVLegalizerInfo.h"
14#include "SPIRV.h"
15#include "SPIRVGlobalRegistry.h"
16#include "SPIRVSubtarget.h"
17#include "SPIRVUtils.h"
24#include "llvm/IR/IntrinsicsSPIRV.h"
25#include "llvm/Support/Debug.h"
27
28using namespace llvm;
29using namespace llvm::LegalizeActions;
30using namespace llvm::LegalityPredicates;
31
32#define DEBUG_TYPE "spirv-legalizer"
33
34LegalityPredicate typeOfExtendedScalars(unsigned TypeIdx, bool IsExtendedInts) {
35 return [IsExtendedInts, TypeIdx](const LegalityQuery &Query) {
36 const LLT Ty = Query.Types[TypeIdx];
37 return IsExtendedInts && Ty.isValid() && Ty.isScalar();
38 };
39}
40
42 using namespace TargetOpcode;
43
44 this->ST = &ST;
45 GR = ST.getSPIRVGlobalRegistry();
46
47 const LLT s1 = LLT::scalar(1);
48 const LLT s8 = LLT::scalar(8);
49 const LLT s16 = LLT::scalar(16);
50 const LLT s32 = LLT::scalar(32);
51 const LLT s64 = LLT::scalar(64);
52 const LLT s128 = LLT::scalar(128);
53
54 const LLT v16s64 = LLT::fixed_vector(16, 64);
55 const LLT v16s32 = LLT::fixed_vector(16, 32);
56 const LLT v16s16 = LLT::fixed_vector(16, 16);
57 const LLT v16s8 = LLT::fixed_vector(16, 8);
58 const LLT v16s1 = LLT::fixed_vector(16, 1);
59
60 const LLT v8s64 = LLT::fixed_vector(8, 64);
61 const LLT v8s32 = LLT::fixed_vector(8, 32);
62 const LLT v8s16 = LLT::fixed_vector(8, 16);
63 const LLT v8s8 = LLT::fixed_vector(8, 8);
64 const LLT v8s1 = LLT::fixed_vector(8, 1);
65
66 const LLT v4s64 = LLT::fixed_vector(4, 64);
67 const LLT v4s32 = LLT::fixed_vector(4, 32);
68 const LLT v4s16 = LLT::fixed_vector(4, 16);
69 const LLT v4s8 = LLT::fixed_vector(4, 8);
70 const LLT v4s1 = LLT::fixed_vector(4, 1);
71
72 const LLT v3s64 = LLT::fixed_vector(3, 64);
73 const LLT v3s32 = LLT::fixed_vector(3, 32);
74 const LLT v3s16 = LLT::fixed_vector(3, 16);
75 const LLT v3s8 = LLT::fixed_vector(3, 8);
76 const LLT v3s1 = LLT::fixed_vector(3, 1);
77
78 const LLT v2s64 = LLT::fixed_vector(2, 64);
79 const LLT v2s32 = LLT::fixed_vector(2, 32);
80 const LLT v2s16 = LLT::fixed_vector(2, 16);
81 const LLT v2s8 = LLT::fixed_vector(2, 8);
82 const LLT v2s1 = LLT::fixed_vector(2, 1);
83
84 const unsigned PSize = ST.getPointerSize();
85 const LLT p0 = LLT::pointer(0, PSize); // Function
86 const LLT p1 = LLT::pointer(1, PSize); // CrossWorkgroup
87 const LLT p2 = LLT::pointer(2, PSize); // UniformConstant
88 const LLT p3 = LLT::pointer(3, PSize); // Workgroup
89 const LLT p4 = LLT::pointer(4, PSize); // Generic
90 const LLT p5 =
91 LLT::pointer(5, PSize); // Input, SPV_INTEL_usm_storage_classes (Device)
92 const LLT p6 = LLT::pointer(6, PSize); // SPV_INTEL_usm_storage_classes (Host)
93 const LLT p7 = LLT::pointer(7, PSize); // Input
94 const LLT p8 = LLT::pointer(8, PSize); // Output
95 const LLT p9 =
96 LLT::pointer(9, PSize); // CodeSectionINTEL, SPV_INTEL_function_pointers
97 const LLT p10 = LLT::pointer(10, PSize); // Private
98 const LLT p11 = LLT::pointer(11, PSize); // StorageBuffer
99 const LLT p12 = LLT::pointer(12, PSize); // Uniform
100 const LLT p13 = LLT::pointer(13, PSize); // PushConstant
101
102 // TODO: remove copy-pasting here by using concatenation in some way.
103 auto allPtrsScalarsAndVectors = {
104 p0, p1, p2, p3, p4, p5, p6, p7, p8,
105 p9, p10, p11, p12, p13, s1, s8, s16, s32,
106 s64, s128, v2s1, v2s8, v2s16, v2s32, v2s64, v3s1, v3s8,
107 v3s16, v3s32, v3s64, v4s1, v4s8, v4s16, v4s32, v4s64, v8s1,
108 v8s8, v8s16, v8s32, v8s64, v16s1, v16s8, v16s16, v16s32, v16s64};
109
110 auto allVectors = {v2s1, v2s8, v2s16, v2s32, v2s64, v3s1, v3s8,
111 v3s16, v3s32, v3s64, v4s1, v4s8, v4s16, v4s32,
112 v4s64, v8s1, v8s8, v8s16, v8s32, v8s64, v16s1,
113 v16s8, v16s16, v16s32, v16s64};
114
115 auto allShaderVectors = {v2s1, v2s8, v2s16, v2s32, v2s64,
116 v3s1, v3s8, v3s16, v3s32, v3s64,
117 v4s1, v4s8, v4s16, v4s32, v4s64};
118
119 auto allScalars = {s1, s8, s16, s32, s64};
120
121 auto allScalarsAndVectors = {
122 s1, s8, s16, s32, s64, s128, v2s1, v2s8,
123 v2s16, v2s32, v2s64, v3s1, v3s8, v3s16, v3s32, v3s64,
124 v4s1, v4s8, v4s16, v4s32, v4s64, v8s1, v8s8, v8s16,
125 v8s32, v8s64, v16s1, v16s8, v16s16, v16s32, v16s64};
126
127 auto allIntScalarsAndVectors = {
128 s8, s16, s32, s64, s128, v2s8, v2s16, v2s32, v2s64,
129 v3s8, v3s16, v3s32, v3s64, v4s8, v4s16, v4s32, v4s64, v8s8,
130 v8s16, v8s32, v8s64, v16s8, v16s16, v16s32, v16s64};
131
132 auto allBoolScalarsAndVectors = {s1, v2s1, v3s1, v4s1, v8s1, v16s1};
133
134 auto allIntScalars = {s8, s16, s32, s64, s128};
135
136 auto allFloatScalarsAndF16Vector2AndVector4s = {s16, s32, s64, v2s16, v4s16};
137
138 auto allFloatScalars = {s16, s32, s64};
139
140 auto allFloatScalarsAndVectors = {
141 s16, s32, s64, v2s16, v2s32, v2s64, v3s16, v3s32, v3s64,
142 v4s16, v4s32, v4s64, v8s16, v8s32, v8s64, v16s16, v16s32, v16s64};
143
144 auto allShaderFloatVectors = {v2s16, v2s32, v2s64, v3s16, v3s32,
145 v3s64, v4s16, v4s32, v4s64};
146
147 auto allFloatVectors = {v2s16, v2s32, v2s64, v3s16, v3s32,
148 v3s64, v4s16, v4s32, v4s64, v8s16,
149 v8s32, v8s64, v16s16, v16s32, v16s64};
150
151 auto &allowedFloatVectorTypes =
152 ST.isShader() ? allShaderFloatVectors : allFloatVectors;
153
154 auto allFloatAndIntScalarsAndPtrs = {s8, s16, s32, s64, p0, p1,
155 p2, p3, p4, p5, p6, p7,
156 p8, p9, p10, p11, p12, p13};
157
158 auto allPtrs = {p0, p1, p2, p3, p4, p5, p6, p7, p8, p9, p10, p11, p12, p13};
159
160 auto &allowedVectorTypes = ST.isShader() ? allShaderVectors : allVectors;
161
162 bool IsExtendedInts =
163 ST.canUseExtension(
164 SPIRV::Extension::SPV_ALTERA_arbitrary_precision_integers) ||
165 ST.canUseExtension(SPIRV::Extension::SPV_KHR_bit_instructions) ||
166 ST.canUseExtension(SPIRV::Extension::SPV_INTEL_int4);
167 auto extendedScalarsAndVectors =
168 [IsExtendedInts](const LegalityQuery &Query) {
169 const LLT Ty = Query.Types[0];
170 return IsExtendedInts && Ty.isValid() && !Ty.isPointerOrPointerVector();
171 };
172 auto extendedScalarsAndVectorsProduct = [IsExtendedInts](
173 const LegalityQuery &Query) {
174 const LLT Ty1 = Query.Types[0], Ty2 = Query.Types[1];
175 return IsExtendedInts && Ty1.isValid() && Ty2.isValid() &&
176 !Ty1.isPointerOrPointerVector() && !Ty2.isPointerOrPointerVector();
177 };
178 auto extendedPtrsScalarsAndVectors =
179 [IsExtendedInts](const LegalityQuery &Query) {
180 const LLT Ty = Query.Types[0];
181 return IsExtendedInts && Ty.isValid();
182 };
183
184 // The universal validation rules in the SPIR-V specification state that
185 // vector sizes are typically limited to 2, 3, or 4. However, larger vector
186 // sizes (8 and 16) are enabled when the Kernel capability is present. For
187 // shader execution models, vector sizes are strictly limited to 4. In
188 // non-shader contexts, vector sizes of 8 and 16 are also permitted, but
189 // arbitrary sizes (e.g., 6 or 11) are not.
190 uint32_t MaxVectorSize = ST.isShader() ? 4 : 16;
191 LLVM_DEBUG(dbgs() << "MaxVectorSize: " << MaxVectorSize << "\n");
192
193 for (auto Opc : getTypeFoldingSupportedOpcodes()) {
194 switch (Opc) {
195 case G_EXTRACT_VECTOR_ELT:
196 case G_UREM:
197 case G_SREM:
198 case G_UDIV:
199 case G_SDIV:
200 case G_FREM:
201 break;
202 default:
204 .customFor(allScalars)
205 .customFor(allowedVectorTypes)
209 0, ElementCount::getFixed(MaxVectorSize)))
210 .custom();
211 break;
212 }
213 }
214
215 getActionDefinitionsBuilder({G_UREM, G_SREM, G_SDIV, G_UDIV, G_FREM})
216 .customFor(allScalars)
217 .customFor(allowedVectorTypes)
221 0, ElementCount::getFixed(MaxVectorSize)))
222 .custom();
223
224 getActionDefinitionsBuilder({G_FMA, G_STRICT_FMA})
225 .legalFor(allScalars)
226 .legalFor(allowedVectorTypes)
230 0, ElementCount::getFixed(MaxVectorSize)))
231 .alwaysLegal();
232
233 getActionDefinitionsBuilder(G_INTRINSIC_W_SIDE_EFFECTS).custom();
234
235 getActionDefinitionsBuilder(G_SHUFFLE_VECTOR)
236 .legalForCartesianProduct(allowedVectorTypes, allowedVectorTypes)
238 .lowerIf(vectorElementCountIsGreaterThan(0, MaxVectorSize))
240 .lowerIf(vectorElementCountIsGreaterThan(1, MaxVectorSize));
241
242 getActionDefinitionsBuilder(G_EXTRACT_VECTOR_ELT)
246 1, ElementCount::getFixed(MaxVectorSize)))
247 .custom();
248
249 getActionDefinitionsBuilder(G_INSERT_VECTOR_ELT)
253 0, ElementCount::getFixed(MaxVectorSize)))
254 .custom();
255
256 // Illegal G_UNMERGE_VALUES instructions should be handled
257 // during the combine phase.
258 getActionDefinitionsBuilder(G_BUILD_VECTOR)
260
261 // When entering the legalizer, there should be no G_BITCAST instructions.
262 // They should all be calls to the `spv_bitcast` intrinsic. The call to
263 // the intrinsic will be converted to a G_BITCAST during legalization if
264 // the vectors are not legal. After using the rules to legalize a G_BITCAST,
265 // we turn it back into a call to the intrinsic with a custom rule to avoid
266 // potential machine verifier failures.
272 0, ElementCount::getFixed(MaxVectorSize)))
273 .lowerIf(vectorElementCountIsGreaterThan(1, MaxVectorSize))
274 .custom();
275
276 // If the result is still illegal, the combiner should be able to remove it.
277 getActionDefinitionsBuilder(G_CONCAT_VECTORS)
278 .legalForCartesianProduct(allowedVectorTypes, allowedVectorTypes);
279
280 getActionDefinitionsBuilder(G_SPLAT_VECTOR)
281 .legalFor(allowedVectorTypes)
285 .alwaysLegal();
286
287 // Vector Reduction Operations
289 {G_VECREDUCE_SMIN, G_VECREDUCE_SMAX, G_VECREDUCE_UMIN, G_VECREDUCE_UMAX,
290 G_VECREDUCE_ADD, G_VECREDUCE_MUL, G_VECREDUCE_FMUL, G_VECREDUCE_FMIN,
291 G_VECREDUCE_FMAX, G_VECREDUCE_FMINIMUM, G_VECREDUCE_FMAXIMUM,
292 G_VECREDUCE_OR, G_VECREDUCE_AND, G_VECREDUCE_XOR})
293 .legalFor(allowedVectorTypes)
294 .scalarize(1)
295 .lower();
296
297 getActionDefinitionsBuilder({G_VECREDUCE_SEQ_FADD, G_VECREDUCE_SEQ_FMUL})
298 .scalarize(2)
299 .lower();
300
301 // Illegal G_UNMERGE_VALUES instructions should be handled
302 // during the combine phase.
303 getActionDefinitionsBuilder(G_UNMERGE_VALUES)
305
306 getActionDefinitionsBuilder({G_MEMCPY, G_MEMCPY_INLINE, G_MEMMOVE})
307 .unsupportedIf(LegalityPredicates::any(typeIs(0, p9), typeIs(1, p9)))
308 .legalIf(all(typeInSet(0, allPtrs), typeInSet(1, allPtrs)));
309
310 getActionDefinitionsBuilder({G_MEMSET, G_MEMSET_INLINE})
311 .unsupportedIf(typeIs(0, p9))
312 .legalIf(all(typeInSet(0, allPtrs), typeInSet(1, allIntScalars)));
313
314 getActionDefinitionsBuilder(G_ADDRSPACE_CAST)
315 .legalForCartesianProduct(allPtrs, allPtrs);
316
317 // Should we be legalizing bad scalar sizes like s5 here instead
318 // of handling them in the instruction selector?
319 getActionDefinitionsBuilder({G_LOAD, G_STORE})
320 .unsupportedIf(typeIs(1, p9))
321 .legalForCartesianProduct(allowedVectorTypes, allPtrs)
322 .legalForCartesianProduct(allPtrs, allPtrs)
323 .legalIf(isScalar(0))
324 .custom();
325
326 getActionDefinitionsBuilder({G_SMIN, G_SMAX, G_UMIN, G_UMAX, G_ABS,
327 G_BITREVERSE, G_SADDSAT, G_UADDSAT, G_SSUBSAT,
328 G_USUBSAT, G_SCMP, G_UCMP})
329 .legalFor(allIntScalarsAndVectors)
330 .legalIf(extendedScalarsAndVectors);
331
332 getActionDefinitionsBuilder({G_SSHLSAT, G_USHLSAT}).lower();
333
334 getActionDefinitionsBuilder(G_STRICT_FLDEXP)
335 .legalForCartesianProduct(allFloatScalarsAndVectors, allIntScalars);
336
337 getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
338 .legalForCartesianProduct(allIntScalarsAndVectors,
339 allFloatScalarsAndVectors);
340
341 getActionDefinitionsBuilder({G_FPTOSI_SAT, G_FPTOUI_SAT})
342 .legalForCartesianProduct(allIntScalarsAndVectors,
343 allFloatScalarsAndVectors);
344
345 getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
346 .legalForCartesianProduct(allFloatScalarsAndVectors,
347 allScalarsAndVectors);
348
350 .legalForCartesianProduct(allIntScalarsAndVectors)
351 .legalIf(extendedScalarsAndVectorsProduct);
352
353 // Extensions.
354 getActionDefinitionsBuilder({G_TRUNC, G_ZEXT, G_SEXT, G_ANYEXT})
355 .legalForCartesianProduct(allScalarsAndVectors)
356 .legalIf(extendedScalarsAndVectorsProduct);
357
359 .legalFor(allPtrsScalarsAndVectors)
360 .legalIf(extendedPtrsScalarsAndVectors)
364 0, ElementCount::getFixed(MaxVectorSize)));
365
367 all(typeInSet(0, allPtrsScalarsAndVectors),
368 typeInSet(1, allPtrsScalarsAndVectors)));
369
370 getActionDefinitionsBuilder({G_IMPLICIT_DEF, G_FREEZE})
371 .legalFor({s1, s128})
372 .legalFor(allFloatAndIntScalarsAndPtrs)
373 .legalFor(allowedVectorTypes)
374 .legalIf([](const LegalityQuery &Query) {
375 return Query.Types[0].isPointerVector();
376 })
377 .moreElementsToNextPow2(0)
378 .fewerElementsIf(vectorElementCountIsGreaterThan(0, MaxVectorSize),
380 0, ElementCount::getFixed(MaxVectorSize)));
381
382 getActionDefinitionsBuilder({G_STACKSAVE, G_STACKRESTORE}).alwaysLegal();
383
385 .legalForCartesianProduct(allPtrs, allIntScalars)
386 .legalIf(
387 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)))
388 .legalIf([](const LegalityQuery &Query) {
389 const LLT DstTy = Query.Types[0];
390 const LLT SrcTy = Query.Types[1];
391 return DstTy.isPointerVector() && SrcTy.isVector() &&
392 !SrcTy.isPointer() &&
393 DstTy.getNumElements() == SrcTy.getNumElements();
394 });
396 .legalForCartesianProduct(allIntScalars, allPtrs)
397 .legalIf(
398 all(typeOfExtendedScalars(0, IsExtendedInts), typeInSet(1, allPtrs)))
399 .legalIf([](const LegalityQuery &Query) {
400 const LLT DstTy = Query.Types[0];
401 const LLT SrcTy = Query.Types[1];
402 return SrcTy.isPointerVector() && DstTy.isVector() &&
403 !DstTy.isPointer() &&
404 DstTy.getNumElements() == SrcTy.getNumElements();
405 });
407 .legalForCartesianProduct(allPtrs, allIntScalars)
408 .legalIf(
409 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)));
410
412 .legalForCartesianProduct(allPtrs, allIntScalars)
413 .legalIf(
414 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)))
415 .legalIf([](const LegalityQuery &Query) {
416 const LLT PtrTy = Query.Types[0];
417 const LLT MaskTy = Query.Types[1];
418 return PtrTy.isPointerVector() && MaskTy.isVector() &&
419 !MaskTy.isPointer() &&
420 PtrTy.getNumElements() == MaskTy.getNumElements();
421 });
422
423 // ST.canDirectlyComparePointers() for pointer args is supported in
424 // legalizeCustom().
427 all(typeIs(0, p9), typeInSet(1, allPtrs), typeIsNot(1, p9)),
428 all(typeInSet(0, allPtrs), typeIsNot(0, p9), typeIs(1, p9))))
429 .legalIf([IsExtendedInts](const LegalityQuery &Query) {
430 const LLT Ty = Query.Types[1];
431 return IsExtendedInts && Ty.isValid() && !Ty.isPointerOrPointerVector();
432 })
433 .customIf(all(typeInSet(0, allBoolScalarsAndVectors),
434 typeInSet(1, allPtrsScalarsAndVectors)));
435
437 all(typeInSet(0, allBoolScalarsAndVectors),
438 typeInSet(1, allFloatScalarsAndVectors)));
439
440 getActionDefinitionsBuilder({G_ATOMICRMW_OR, G_ATOMICRMW_ADD, G_ATOMICRMW_AND,
441 G_ATOMICRMW_MAX, G_ATOMICRMW_MIN,
442 G_ATOMICRMW_SUB, G_ATOMICRMW_XOR,
443 G_ATOMICRMW_UMAX, G_ATOMICRMW_UMIN})
444 .legalForCartesianProduct(allIntScalars, allPtrs);
445
447 {G_ATOMICRMW_FADD, G_ATOMICRMW_FSUB, G_ATOMICRMW_FMIN, G_ATOMICRMW_FMAX})
448 .legalForCartesianProduct(allFloatScalarsAndF16Vector2AndVector4s,
449 allPtrs);
450
451 getActionDefinitionsBuilder(G_ATOMICRMW_XCHG)
452 .legalForCartesianProduct(allFloatAndIntScalarsAndPtrs, allPtrs);
453
454 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG_WITH_SUCCESS).lower();
455 // TODO: add proper legalization rules.
456 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG).alwaysLegal();
457
458 getActionDefinitionsBuilder({G_UADDO, G_USUBO, G_UMULO, G_SMULO})
459 .alwaysLegal();
460
461 getActionDefinitionsBuilder({G_SADDO, G_SSUBO}).lower();
462
463 // s64 is unsupported because lowering widens to s128, which SPIR-V does not
464 // have.
465 getActionDefinitionsBuilder({G_SMULFIX, G_UMULFIX})
466 .unsupportedFor({s64})
467 .lower();
468
469 getActionDefinitionsBuilder({G_LROUND, G_LLROUND})
470 .legalForCartesianProduct(allFloatScalarsAndVectors,
471 allIntScalarsAndVectors);
472
473 // FP conversions.
474 getActionDefinitionsBuilder({G_FPTRUNC, G_FPEXT})
475 .legalForCartesianProduct(allFloatScalarsAndVectors);
476
477 // Pointer-handling.
478 getActionDefinitionsBuilder(G_FRAME_INDEX).legalFor({p0});
479
480 getActionDefinitionsBuilder(G_GLOBAL_VALUE).legalFor(allPtrs);
481
482 // Control-flow. In some cases (e.g. constants) s1 may be promoted to s32.
484 getActionDefinitionsBuilder(G_BRCOND).legalFor({s1, s32});
485
487 allFloatScalarsAndVectors, {s32, v2s32, v3s32, v4s32, v8s32, v16s32});
488
489 // TODO: Review the target OpenCL and GLSL Extended Instruction Set specs to
490 // tighten these requirements. Many of these math functions are only legal on
491 // specific bitwidths, so they are not selectable for
492 // allFloatScalarsAndVectors.
493 // clang-format off
494 getActionDefinitionsBuilder({G_STRICT_FSQRT,
495 G_FPOW,
496 G_FEXP,
497 G_FMODF,
498 G_FSINCOS,
499 G_FEXP2,
500 G_FEXP10,
501 G_FLOG,
502 G_FLOG2,
503 G_FLOG10,
504 G_FABS,
505 G_FMINNUM,
506 G_FMAXNUM,
507 G_FCEIL,
508 G_FCOS,
509 G_FSIN,
510 G_FTAN,
511 G_FACOS,
512 G_FASIN,
513 G_FATAN,
514 G_FATAN2,
515 G_FCOSH,
516 G_FSINH,
517 G_FTANH,
518 G_FSQRT,
519 G_FFLOOR,
520 G_FRINT,
521 G_FNEARBYINT,
522 G_INTRINSIC_ROUND,
523 G_INTRINSIC_TRUNC,
524 G_FMINIMUM,
525 G_FMAXIMUM,
526 G_INTRINSIC_ROUNDEVEN})
527 .legalFor(allFloatScalars)
528 .legalFor(allowedFloatVectorTypes)
532 0, ElementCount::getFixed(MaxVectorSize)));
533 // clang-format on
534
535 getActionDefinitionsBuilder(G_FCOPYSIGN)
536 .legalForCartesianProduct(allFloatScalarsAndVectors,
537 allFloatScalarsAndVectors);
538
540 allFloatScalarsAndVectors, allIntScalarsAndVectors);
541
542 if (ST.canUseExtInstSet(SPIRV::InstructionSet::OpenCL_std)) {
544 {G_CTTZ, G_CTTZ_ZERO_POISON, G_CTLZ, G_CTLZ_ZERO_POISON})
545 .legalForCartesianProduct(allIntScalarsAndVectors,
546 allIntScalarsAndVectors);
547
548 // Struct return types become a single scalar, so cannot easily legalize.
549 getActionDefinitionsBuilder({G_SMULH, G_UMULH}).alwaysLegal();
550 }
551
552 getActionDefinitionsBuilder(G_IS_FPCLASS).custom();
553
554 getActionDefinitionsBuilder({G_INTRINSIC, G_INTRINSIC_CONVERGENT,
555 G_INTRINSIC_CONVERGENT_W_SIDE_EFFECTS})
556 .alwaysLegal();
558 getActionDefinitionsBuilder({G_TRAP, G_DEBUGTRAP, G_UBSANTRAP}).alwaysLegal();
559
561 verify(*ST.getInstrInfo());
562}
563
566 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
567 Register DstReg = MI.getOperand(0).getReg();
568 Register SrcReg = MI.getOperand(1).getReg();
569 Register IdxReg = MI.getOperand(2).getReg();
570
571 MIRBuilder
572 .buildIntrinsic(Intrinsic::spv_extractelt, ArrayRef<Register>{DstReg})
573 .addUse(SrcReg)
574 .addUse(IdxReg);
575 MI.eraseFromParent();
576 return true;
577}
578
581 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
582 Register DstReg = MI.getOperand(0).getReg();
583 Register SrcReg = MI.getOperand(1).getReg();
584 Register ValReg = MI.getOperand(2).getReg();
585 Register IdxReg = MI.getOperand(3).getReg();
586
587 MIRBuilder
588 .buildIntrinsic(Intrinsic::spv_insertelt, ArrayRef<Register>{DstReg})
589 .addUse(SrcReg)
590 .addUse(ValReg)
591 .addUse(IdxReg);
592 MI.eraseFromParent();
593 return true;
594}
595
597 LegalizerHelper &Helper,
600 Register ConvReg = MRI.createGenericVirtualRegister(ConvTy);
601 MRI.setRegClass(ConvReg, GR->getRegClass(SpvType));
602 GR->assignSPIRVTypeToVReg(SpvType, ConvReg, Helper.MIRBuilder.getMF());
603 Helper.MIRBuilder.buildInstr(TargetOpcode::G_PTRTOINT)
604 .addDef(ConvReg)
605 .addUse(Reg);
606 return ConvReg;
607}
608
609static bool needsVectorLegalization(const LLT &Ty, const SPIRVSubtarget &ST) {
610 if (!Ty.isVector())
611 return false;
612 unsigned NumElements = Ty.getNumElements();
613 unsigned MaxVectorSize = ST.isShader() ? 4 : 16;
614 return (NumElements > 4 && !isPowerOf2_32(NumElements)) ||
615 NumElements > MaxVectorSize;
616}
617
620 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
621 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
622 Register DstReg = MI.getOperand(0).getReg();
623 Register PtrReg = MI.getOperand(1).getReg();
624 LLT DstTy = MRI.getType(DstReg);
625
626 if (!DstTy.isVector())
627 return true;
628
629 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
630 if (!needsVectorLegalization(DstTy, ST))
631 return true;
632
633 SmallVector<Register, 8> SplitRegs;
634 LLT EltTy = DstTy.getElementType();
635 unsigned NumElts = DstTy.getNumElements();
636
637 LLT PtrTy = MRI.getType(PtrReg);
638 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
639
640 for (unsigned i = 0; i < NumElts; ++i) {
641 auto Idx = MIRBuilder.buildConstant(LLT::scalar(32), i);
642 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
643
644 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
645 .addImm(1) // InBounds
646 .addUse(PtrReg)
647 .addUse(Zero.getReg(0))
648 .addUse(Idx.getReg(0));
649
650 MachinePointerInfo EltPtrInfo;
651 Align EltAlign = Align(1);
652 if (!MI.memoperands_empty()) {
653 MachineMemOperand *MMO = *MI.memoperands_begin();
654 EltPtrInfo =
655 MMO->getPointerInfo().getWithOffset(i * EltTy.getSizeInBytes());
656 EltAlign = commonAlignment(MMO->getAlign(), i * EltTy.getSizeInBytes());
657 }
658
659 Register EltReg = MRI.createGenericVirtualRegister(EltTy);
660 MIRBuilder.buildLoad(EltReg, EltPtr, EltPtrInfo, EltAlign);
661 SplitRegs.push_back(EltReg);
662 }
663
664 MIRBuilder.buildBuildVector(DstReg, SplitRegs);
665 MI.eraseFromParent();
666 return true;
667}
668
671 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
672 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
673 Register ValReg = MI.getOperand(0).getReg();
674 Register PtrReg = MI.getOperand(1).getReg();
675 LLT ValTy = MRI.getType(ValReg);
676
677 assert(ValTy.isVector() && "Expected vector store");
678
679 SmallVector<Register, 8> SplitRegs;
680 LLT EltTy = ValTy.getElementType();
681 unsigned NumElts = ValTy.getNumElements();
682
683 for (unsigned i = 0; i < NumElts; ++i)
684 SplitRegs.push_back(MRI.createGenericVirtualRegister(EltTy));
685
686 MIRBuilder.buildUnmerge(SplitRegs, ValReg);
687
688 LLT PtrTy = MRI.getType(PtrReg);
689 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
690
691 for (unsigned i = 0; i < NumElts; ++i) {
692 auto Idx = MIRBuilder.buildConstant(LLT::scalar(32), i);
693 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
694
695 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
696 .addImm(1) // InBounds
697 .addUse(PtrReg)
698 .addUse(Zero.getReg(0))
699 .addUse(Idx.getReg(0));
700
701 MachinePointerInfo EltPtrInfo;
702 Align EltAlign = Align(1);
703 if (!MI.memoperands_empty()) {
704 MachineMemOperand *MMO = *MI.memoperands_begin();
705 EltPtrInfo =
706 MMO->getPointerInfo().getWithOffset(i * EltTy.getSizeInBytes());
707 EltAlign = commonAlignment(MMO->getAlign(), i * EltTy.getSizeInBytes());
708 }
709
710 MIRBuilder.buildStore(SplitRegs[i], EltPtr, EltPtrInfo, EltAlign);
711 }
712
713 MI.eraseFromParent();
714 return true;
715}
716
719 LostDebugLocObserver &LocObserver) const {
720 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
721 switch (MI.getOpcode()) {
722 default:
723 // TODO: implement legalization for other opcodes.
724 return true;
725 case TargetOpcode::G_BITCAST:
726 return legalizeBitcast(Helper, MI);
727 case TargetOpcode::G_EXTRACT_VECTOR_ELT:
728 return legalizeExtractVectorElt(Helper, MI, GR);
729 case TargetOpcode::G_INSERT_VECTOR_ELT:
730 return legalizeInsertVectorElt(Helper, MI, GR);
731 case TargetOpcode::G_INTRINSIC:
732 case TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS:
733 return legalizeIntrinsic(Helper, MI);
734 case TargetOpcode::G_IS_FPCLASS:
735 return legalizeIsFPClass(Helper, MI, LocObserver);
736 case TargetOpcode::G_ICMP: {
737 auto &Op0 = MI.getOperand(2);
738 auto &Op1 = MI.getOperand(3);
739 Register Reg0 = Op0.getReg();
740 Register Reg1 = Op1.getReg();
742 static_cast<CmpInst::Predicate>(MI.getOperand(1).getPredicate());
743 if ((!ST->canDirectlyComparePointers() ||
745 MRI.getType(Reg0).isPointer() && MRI.getType(Reg1).isPointer()) {
746 LLT ConvT = LLT::scalar(ST->getPointerSize());
747 Type *LLVMTy = IntegerType::get(MI.getMF()->getFunction().getContext(),
748 ST->getPointerSize());
749 SPIRVTypeInst SpirvTy = GR->getOrCreateSPIRVType(
750 LLVMTy, Helper.MIRBuilder, SPIRV::AccessQualifier::ReadWrite, true);
751 Op0.setReg(convertPtrToInt(Reg0, ConvT, SpirvTy, Helper, MRI, GR));
752 Op1.setReg(convertPtrToInt(Reg1, ConvT, SpirvTy, Helper, MRI, GR));
753 }
754 return true;
755 }
756 case TargetOpcode::G_LOAD:
757 return legalizeLoad(Helper, MI, GR);
758 case TargetOpcode::G_STORE:
759 return legalizeStore(Helper, MI, GR);
760 }
761}
762
765 Register SrcReg, LLT SrcTy,
766 MachinePointerInfo &PtrInfo, Align &VecAlign) {
767 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
768 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
769
770 VecAlign = Helper.getStackTemporaryAlignment(SrcTy);
771 auto StackTemp = Helper.createStackTemporary(
772 TypeSize::getFixed(SrcTy.getSizeInBytes()), VecAlign, PtrInfo);
773
774 // Set the type of StackTemp to a pointer to an array of the element type.
775 SPIRVTypeInst SpvSrcTy = GR->getSPIRVTypeForVReg(SrcReg);
776 SPIRVTypeInst EltSpvTy = GR->getScalarOrVectorComponentType(SpvSrcTy);
777 const Type *LLVMEltTy = GR->getTypeForSPIRVType(EltSpvTy);
778 const Type *LLVMArrTy =
779 ArrayType::get(const_cast<Type *>(LLVMEltTy), SrcTy.getNumElements());
780 SPIRVTypeInst ArrSpvTy = GR->getOrCreateSPIRVType(
781 LLVMArrTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite, true);
782 SPIRVTypeInst PtrToArrSpvTy = GR->getOrCreateSPIRVPointerType(
783 ArrSpvTy, MIRBuilder, SPIRV::StorageClass::Function);
784
785 Register StackReg = StackTemp.getReg(0);
786 MRI.setRegClass(StackReg, GR->getRegClass(PtrToArrSpvTy));
787 GR->assignSPIRVTypeToVReg(PtrToArrSpvTy, StackReg, MIRBuilder.getMF());
788
789 return StackTemp;
790}
791
794 LLVM_DEBUG(dbgs() << "Found a bitcast instruction\n");
795 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
796 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
797 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
798
799 Register DstReg = MI.getOperand(0).getReg();
800 Register SrcReg = MI.getOperand(2).getReg();
801 LLT DstTy = MRI.getType(DstReg);
802 LLT SrcTy = MRI.getType(SrcReg);
803
804 // If an spv_bitcast needs to be legalized, we convert it to G_BITCAST to
805 // allow using the generic legalization rules.
806 if (needsVectorLegalization(DstTy, ST) ||
807 needsVectorLegalization(SrcTy, ST)) {
808 LLVM_DEBUG(dbgs() << "Replacing with a G_BITCAST\n");
809 MIRBuilder.buildBitcast(DstReg, SrcReg);
810 MI.eraseFromParent();
811 }
812 return true;
813}
814
817 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
818 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
819 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
820
821 Register DstReg = MI.getOperand(0).getReg();
822 LLT DstTy = MRI.getType(DstReg);
823
824 if (needsVectorLegalization(DstTy, ST)) {
825 Register SrcReg = MI.getOperand(2).getReg();
826 Register ValReg = MI.getOperand(3).getReg();
827 LLT SrcTy = MRI.getType(SrcReg);
828 MachineOperand &IdxOperand = MI.getOperand(4);
829
830 if (getImm(IdxOperand, &MRI)) {
831 uint64_t IdxVal = foldImm(IdxOperand, &MRI);
832 if (IdxVal < SrcTy.getNumElements()) {
834 SPIRVTypeInst ElementType =
836 LLT ElementLLTTy = GR->getRegType(ElementType);
837 for (unsigned I = 0, E = SrcTy.getNumElements(); I < E; ++I) {
838 Register Reg = MRI.createGenericVirtualRegister(ElementLLTTy);
839 MRI.setRegClass(Reg, GR->getRegClass(ElementType));
840 GR->assignSPIRVTypeToVReg(ElementType, Reg, *MI.getMF());
841 Regs.push_back(Reg);
842 }
843 MIRBuilder.buildUnmerge(Regs, SrcReg);
844 Regs[IdxVal] = ValReg;
845 MIRBuilder.buildBuildVector(DstReg, Regs);
846 MI.eraseFromParent();
847 return true;
848 }
849 }
850
851 LLT EltTy = SrcTy.getElementType();
852 Align VecAlign;
853 MachinePointerInfo PtrInfo;
854 auto StackTemp = createStackTemporaryForVector(Helper, GR, SrcReg, SrcTy,
855 PtrInfo, VecAlign);
856
857 MIRBuilder.buildStore(SrcReg, StackTemp, PtrInfo, VecAlign);
858
859 Register IdxReg = IdxOperand.getReg();
860 LLT PtrTy = MRI.getType(StackTemp.getReg(0));
861 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
862 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
863
864 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
865 .addImm(1) // InBounds
866 .addUse(StackTemp.getReg(0))
867 .addUse(Zero.getReg(0))
868 .addUse(IdxReg);
869
871 Align EltAlign = Helper.getStackTemporaryAlignment(EltTy);
872 MIRBuilder.buildStore(ValReg, EltPtr, EltPtrInfo, EltAlign);
873
874 MIRBuilder.buildLoad(DstReg, StackTemp, PtrInfo, VecAlign);
875 MI.eraseFromParent();
876 return true;
877 }
878 return true;
879}
880
883 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
884 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
885 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
886
887 Register SrcReg = MI.getOperand(2).getReg();
888 LLT SrcTy = MRI.getType(SrcReg);
889
890 if (needsVectorLegalization(SrcTy, ST)) {
891 Register DstReg = MI.getOperand(0).getReg();
892 MachineOperand &IdxOperand = MI.getOperand(3);
893
894 if (getImm(IdxOperand, &MRI)) {
895 uint64_t IdxVal = foldImm(IdxOperand, &MRI);
896 if (IdxVal < SrcTy.getNumElements()) {
897 LLT DstTy = MRI.getType(DstReg);
899 SPIRVTypeInst DstSpvTy = GR->getSPIRVTypeForVReg(DstReg);
900 for (unsigned I = 0, E = SrcTy.getNumElements(); I < E; ++I) {
901 if (I == IdxVal) {
902 Regs.push_back(DstReg);
903 } else {
905 MRI.setRegClass(Reg, GR->getRegClass(DstSpvTy));
906 GR->assignSPIRVTypeToVReg(DstSpvTy, Reg, *MI.getMF());
907 Regs.push_back(Reg);
908 }
909 }
910 MIRBuilder.buildUnmerge(Regs, SrcReg);
911 MI.eraseFromParent();
912 return true;
913 }
914 }
915
916 LLT EltTy = SrcTy.getElementType();
917 Align VecAlign;
918 MachinePointerInfo PtrInfo;
919 auto StackTemp = createStackTemporaryForVector(Helper, GR, SrcReg, SrcTy,
920 PtrInfo, VecAlign);
921
922 MIRBuilder.buildStore(SrcReg, StackTemp, PtrInfo, VecAlign);
923
924 Register IdxReg = IdxOperand.getReg();
925 LLT PtrTy = MRI.getType(StackTemp.getReg(0));
926 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
927 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
928
929 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
930 .addImm(1) // InBounds
931 .addUse(StackTemp.getReg(0))
932 .addUse(Zero.getReg(0))
933 .addUse(IdxReg);
934
936 Align EltAlign = Helper.getStackTemporaryAlignment(EltTy);
937 MIRBuilder.buildLoad(DstReg, EltPtr, EltPtrInfo, EltAlign);
938
939 MI.eraseFromParent();
940 return true;
941 }
942 return true;
943}
944
947 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
948 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
949 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
950
951 Register DstReg = MI.getOperand(0).getReg();
952 LLT DstTy = MRI.getType(DstReg);
953
954 if (!needsVectorLegalization(DstTy, ST))
955 return true;
956
958 if (MI.getNumOperands() == 2) {
959 // The "null" case: no values are attached.
960 LLT EltTy = DstTy.getElementType();
961 auto Zero = MIRBuilder.buildConstant(EltTy, 0);
962 SPIRVTypeInst SpvDstTy = GR->getSPIRVTypeForVReg(DstReg);
963 SPIRVTypeInst SpvEltTy = GR->getScalarOrVectorComponentType(SpvDstTy);
964 GR->assignSPIRVTypeToVReg(SpvEltTy, Zero.getReg(0), MIRBuilder.getMF());
965 for (unsigned i = 0; i < DstTy.getNumElements(); ++i)
966 SrcRegs.push_back(Zero.getReg(0));
967 } else {
968 for (unsigned i = 2; i < MI.getNumOperands(); ++i) {
969 SrcRegs.push_back(MI.getOperand(i).getReg());
970 }
971 }
972 MIRBuilder.buildBuildVector(DstReg, SrcRegs);
973 MI.eraseFromParent();
974 return true;
975}
976
978 MachineInstr &MI) const {
979 LLVM_DEBUG(dbgs() << "legalizeIntrinsic: " << MI);
980 auto IntrinsicID = cast<GIntrinsic>(MI).getIntrinsicID();
981 switch (IntrinsicID) {
982 case Intrinsic::spv_bitcast:
983 return legalizeSpvBitcast(Helper, MI, GR);
984 case Intrinsic::spv_insertelt:
985 return legalizeSpvInsertElt(Helper, MI, GR);
986 case Intrinsic::spv_extractelt:
987 return legalizeSpvExtractElt(Helper, MI, GR);
988 case Intrinsic::spv_const_composite:
989 return legalizeSpvConstComposite(Helper, MI, GR);
990 }
991 return true;
992}
993
994bool SPIRVLegalizerInfo::legalizeBitcast(LegalizerHelper &Helper,
995 MachineInstr &MI) const {
996 // Once the G_BITCAST is using vectors that are allowed, we turn it back into
997 // an spv_bitcast to avoid verifier problems when the register types are the
998 // same for the source and the result. Note that the SPIR-V types associated
999 // with the bitcast can be different even if the register types are the same.
1000 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
1001 Register DstReg = MI.getOperand(0).getReg();
1002 Register SrcReg = MI.getOperand(1).getReg();
1003 SmallVector<Register, 1> DstRegs = {DstReg};
1004 MIRBuilder.buildIntrinsic(Intrinsic::spv_bitcast, DstRegs).addUse(SrcReg);
1005 MI.eraseFromParent();
1006 return true;
1007}
1008
1009// Note this code was copied from LegalizerHelper::lowerISFPCLASS and adjusted
1010// to ensure that all instructions created during the lowering have SPIR-V types
1011// assigned to them.
1012bool SPIRVLegalizerInfo::legalizeIsFPClass(
1014 LostDebugLocObserver &LocObserver) const {
1015 auto [DstReg, DstTy, SrcReg, SrcTy] = MI.getFirst2RegLLTs();
1016 FPClassTest Mask = static_cast<FPClassTest>(MI.getOperand(2).getImm());
1017
1018 auto &MIRBuilder = Helper.MIRBuilder;
1019 auto &MF = MIRBuilder.getMF();
1020 MachineRegisterInfo &MRI = MF.getRegInfo();
1021
1022 Type *LLVMDstTy =
1023 IntegerType::get(MIRBuilder.getContext(), DstTy.getScalarSizeInBits());
1024 if (DstTy.isVector())
1025 LLVMDstTy = VectorType::get(LLVMDstTy, DstTy.getElementCount());
1026 SPIRVTypeInst SPIRVDstTy = GR->getOrCreateSPIRVType(
1027 LLVMDstTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite,
1028 /*EmitIR*/ true);
1029
1030 unsigned BitSize = SrcTy.getScalarSizeInBits();
1031 const fltSemantics &Semantics = getFltSemanticForLLT(SrcTy.getScalarType());
1032
1033 LLT IntTy = LLT::scalar(BitSize);
1034 Type *LLVMIntTy = IntegerType::get(MIRBuilder.getContext(), BitSize);
1035 if (SrcTy.isVector()) {
1036 IntTy = LLT::vector(SrcTy.getElementCount(), IntTy);
1037 LLVMIntTy = VectorType::get(LLVMIntTy, SrcTy.getElementCount());
1038 }
1039 SPIRVTypeInst SPIRVIntTy = GR->getOrCreateSPIRVType(
1040 LLVMIntTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite,
1041 /*EmitIR*/ true);
1042
1043 // Clang doesn't support capture of structured bindings:
1044 LLT DstTyCopy = DstTy;
1045 const auto assignSPIRVTy = [&](MachineInstrBuilder &&MI) {
1046 // Assign this MI's (assumed only) destination to one of the two types we
1047 // expect: either the G_IS_FPCLASS's destination type, or the integer type
1048 // bitcast from the source type.
1049 LLT MITy = MRI.getType(MI.getReg(0));
1050 assert((MITy == IntTy || MITy == DstTyCopy) &&
1051 "Unexpected LLT type while lowering G_IS_FPCLASS");
1052 SPIRVTypeInst SPVTy = MITy == IntTy ? SPIRVIntTy : SPIRVDstTy;
1053 GR->assignSPIRVTypeToVReg(SPVTy, MI.getReg(0), MF);
1054 return MI;
1055 };
1056
1057 // Helper to build and assign a constant in one go
1058 const auto buildSPIRVConstant = [&](LLT Ty, auto &&C) -> MachineInstrBuilder {
1059 if (!Ty.isFixedVector())
1060 return assignSPIRVTy(MIRBuilder.buildConstant(Ty, C));
1061 auto ScalarC = MIRBuilder.buildConstant(Ty.getScalarType(), C);
1062 assert((Ty == IntTy || Ty == DstTyCopy) &&
1063 "Unexpected LLT type while lowering constant for G_IS_FPCLASS");
1064 SPIRVTypeInst VecEltTy = GR->getOrCreateSPIRVType(
1065 (Ty == IntTy ? LLVMIntTy : LLVMDstTy)->getScalarType(), MIRBuilder,
1066 SPIRV::AccessQualifier::ReadWrite,
1067 /*EmitIR*/ true);
1068 GR->assignSPIRVTypeToVReg(VecEltTy, ScalarC.getReg(0), MF);
1069 return assignSPIRVTy(MIRBuilder.buildSplatBuildVector(Ty, ScalarC));
1070 };
1071
1072 if (Mask == fcNone) {
1073 MIRBuilder.buildCopy(DstReg, buildSPIRVConstant(DstTy, 0));
1074 MI.eraseFromParent();
1075 return true;
1076 }
1077 if (Mask == fcAllFlags) {
1078 MIRBuilder.buildCopy(DstReg, buildSPIRVConstant(DstTy, 1));
1079 MI.eraseFromParent();
1080 return true;
1081 }
1082
1083 // Note that rather than creating a COPY here (between a floating-point and
1084 // integer type of the same size) we create a SPIR-V bitcast immediately. We
1085 // can't create a G_BITCAST because the LLTs are the same, and we can't seem
1086 // to correctly lower COPYs to SPIR-V bitcasts at this moment.
1087 Register ResVReg = MRI.createGenericVirtualRegister(IntTy);
1088 MRI.setRegClass(ResVReg, GR->getRegClass(SPIRVIntTy));
1089 GR->assignSPIRVTypeToVReg(SPIRVIntTy, ResVReg, Helper.MIRBuilder.getMF());
1090 auto AsInt = MIRBuilder.buildInstr(SPIRV::OpBitcast)
1091 .addDef(ResVReg)
1092 .addUse(GR->getSPIRVTypeID(SPIRVIntTy))
1093 .addUse(SrcReg);
1094 AsInt = assignSPIRVTy(std::move(AsInt));
1095
1096 // Various masks.
1097 APInt SignBit = APInt::getSignMask(BitSize);
1098 APInt ValueMask = APInt::getSignedMaxValue(BitSize); // All bits but sign.
1099 APInt Inf = APFloat::getInf(Semantics).bitcastToAPInt(); // Exp and int bit.
1100 APInt ExpMask = Inf;
1101 APInt AllOneMantissa = APFloat::getLargest(Semantics).bitcastToAPInt() & ~Inf;
1102 APInt QNaNBitMask =
1103 APInt::getOneBitSet(BitSize, AllOneMantissa.getActiveBits() - 1);
1104 APInt InversionMask = APInt::getAllOnes(DstTy.getScalarSizeInBits());
1105
1106 auto SignBitC = buildSPIRVConstant(IntTy, SignBit);
1107 auto ValueMaskC = buildSPIRVConstant(IntTy, ValueMask);
1108 auto InfC = buildSPIRVConstant(IntTy, Inf);
1109 auto ExpMaskC = buildSPIRVConstant(IntTy, ExpMask);
1110 auto ZeroC = buildSPIRVConstant(IntTy, 0);
1111
1112 auto Abs = assignSPIRVTy(MIRBuilder.buildAnd(IntTy, AsInt, ValueMaskC));
1113 auto Sign = assignSPIRVTy(
1114 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_NE, DstTy, AsInt, Abs));
1115
1116 auto Res = buildSPIRVConstant(DstTy, 0);
1117
1118 const auto appendToRes = [&](MachineInstrBuilder &&ToAppend) {
1119 Res = assignSPIRVTy(
1120 MIRBuilder.buildOr(DstTyCopy, Res, assignSPIRVTy(std::move(ToAppend))));
1121 };
1122
1123 // Tests that involve more than one class should be processed first.
1124 if ((Mask & fcFinite) == fcFinite) {
1125 // finite(V) ==> abs(V) u< exp_mask
1126 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, Abs,
1127 ExpMaskC));
1128 Mask &= ~fcFinite;
1129 } else if ((Mask & fcFinite) == fcPosFinite) {
1130 // finite(V) && V > 0 ==> V u< exp_mask
1131 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, AsInt,
1132 ExpMaskC));
1133 Mask &= ~fcPosFinite;
1134 } else if ((Mask & fcFinite) == fcNegFinite) {
1135 // finite(V) && V < 0 ==> abs(V) u< exp_mask && signbit == 1
1136 auto Cmp = assignSPIRVTy(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT,
1137 DstTy, Abs, ExpMaskC));
1138 appendToRes(MIRBuilder.buildAnd(DstTy, Cmp, Sign));
1139 Mask &= ~fcNegFinite;
1140 }
1141
1142 if (FPClassTest PartialCheck = Mask & (fcZero | fcSubnormal)) {
1143 // fcZero | fcSubnormal => test all exponent bits are 0
1144 // TODO: Handle sign bit specific cases
1145 // TODO: Handle inverted case
1146 if (PartialCheck == (fcZero | fcSubnormal)) {
1147 auto ExpBits = assignSPIRVTy(MIRBuilder.buildAnd(IntTy, AsInt, ExpMaskC));
1148 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1149 ExpBits, ZeroC));
1150 Mask &= ~PartialCheck;
1151 }
1152 }
1153
1154 // Check for individual classes.
1155 if (FPClassTest PartialCheck = Mask & fcZero) {
1156 if (PartialCheck == fcPosZero)
1157 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1158 AsInt, ZeroC));
1159 else if (PartialCheck == fcZero)
1160 appendToRes(
1161 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy, Abs, ZeroC));
1162 else // fcNegZero
1163 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1164 AsInt, SignBitC));
1165 }
1166
1167 if (FPClassTest PartialCheck = Mask & fcSubnormal) {
1168 // issubnormal(V) ==> unsigned(abs(V) - 1) u< (all mantissa bits set)
1169 // issubnormal(V) && V>0 ==> unsigned(V - 1) u< (all mantissa bits set)
1170 auto V = (PartialCheck == fcPosSubnormal) ? AsInt : Abs;
1171 auto OneC = buildSPIRVConstant(IntTy, 1);
1172 auto VMinusOne = MIRBuilder.buildSub(IntTy, V, OneC);
1173 auto SubnormalRes = assignSPIRVTy(
1174 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, VMinusOne,
1175 buildSPIRVConstant(IntTy, AllOneMantissa)));
1176 if (PartialCheck == fcNegSubnormal)
1177 SubnormalRes = MIRBuilder.buildAnd(DstTy, SubnormalRes, Sign);
1178 appendToRes(std::move(SubnormalRes));
1179 }
1180
1181 if (FPClassTest PartialCheck = Mask & fcInf) {
1182 if (PartialCheck == fcPosInf)
1183 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1184 AsInt, InfC));
1185 else if (PartialCheck == fcInf)
1186 appendToRes(
1187 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy, Abs, InfC));
1188 else { // fcNegInf
1189 APInt NegInf = APFloat::getInf(Semantics, true).bitcastToAPInt();
1190 auto NegInfC = buildSPIRVConstant(IntTy, NegInf);
1191 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1192 AsInt, NegInfC));
1193 }
1194 }
1195
1196 if (FPClassTest PartialCheck = Mask & fcNan) {
1197 auto InfWithQnanBitC =
1198 buildSPIRVConstant(IntTy, std::move(Inf) | QNaNBitMask);
1199 if (PartialCheck == fcNan) {
1200 // isnan(V) ==> abs(V) u> int(inf)
1201 appendToRes(
1202 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGT, DstTy, Abs, InfC));
1203 } else if (PartialCheck == fcQNan) {
1204 // isquiet(V) ==> abs(V) u>= (unsigned(Inf) | quiet_bit)
1205 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGE, DstTy, Abs,
1206 InfWithQnanBitC));
1207 } else { // fcSNan
1208 // issignaling(V) ==> abs(V) u> unsigned(Inf) &&
1209 // abs(V) u< (unsigned(Inf) | quiet_bit)
1210 auto IsNan = assignSPIRVTy(
1211 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGT, DstTy, Abs, InfC));
1212 auto IsNotQnan = assignSPIRVTy(MIRBuilder.buildICmp(
1213 CmpInst::Predicate::ICMP_ULT, DstTy, Abs, InfWithQnanBitC));
1214 appendToRes(MIRBuilder.buildAnd(DstTy, IsNan, IsNotQnan));
1215 }
1216 }
1217
1218 if (FPClassTest PartialCheck = Mask & fcNormal) {
1219 // isnormal(V) ==> (0 u< exp u< max_exp) ==> (unsigned(exp-1) u<
1220 // (max_exp-1))
1221 APInt ExpLSB = ExpMask & ~(ExpMask.shl(1));
1222 auto ExpMinusOne = assignSPIRVTy(
1223 MIRBuilder.buildSub(IntTy, Abs, buildSPIRVConstant(IntTy, ExpLSB)));
1224 APInt MaxExpMinusOne = std::move(ExpMask) - ExpLSB;
1225 auto NormalRes = assignSPIRVTy(
1226 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, ExpMinusOne,
1227 buildSPIRVConstant(IntTy, MaxExpMinusOne)));
1228 if (PartialCheck == fcNegNormal)
1229 NormalRes = MIRBuilder.buildAnd(DstTy, NormalRes, Sign);
1230 else if (PartialCheck == fcPosNormal) {
1231 auto PosSign = assignSPIRVTy(MIRBuilder.buildXor(
1232 DstTy, Sign, buildSPIRVConstant(DstTy, InversionMask)));
1233 NormalRes = MIRBuilder.buildAnd(DstTy, NormalRes, PosSign);
1234 }
1235 appendToRes(std::move(NormalRes));
1236 }
1237
1238 MIRBuilder.buildCopy(DstReg, Res);
1239 MI.eraseFromParent();
1240 return true;
1241}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static void scalarize(Instruction *I, SmallVectorImpl< Instruction * > &Worklist)
Declares convenience wrapper classes for interpreting MachineInstr instances as specific generic oper...
IRTranslator LLVM IR MI
#define I(x, y, z)
Definition MD5.cpp:57
This file declares the MachineIRBuilder class.
Register Reg
Promote Memory to Register
Definition Mem2Reg.cpp:110
ppc ctr loops verify
const SmallVectorImpl< MachineOperand > & Cond
static bool legalizeSpvInsertElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool needsVectorLegalization(const LLT &Ty, const SPIRVSubtarget &ST)
static MachineInstrBuilder createStackTemporaryForVector(LegalizerHelper &Helper, SPIRVGlobalRegistry *GR, Register SrcReg, LLT SrcTy, MachinePointerInfo &PtrInfo, Align &VecAlign)
static Register convertPtrToInt(Register Reg, LLT ConvTy, SPIRVTypeInst SpvType, LegalizerHelper &Helper, MachineRegisterInfo &MRI, SPIRVGlobalRegistry *GR)
LegalityPredicate typeOfExtendedScalars(unsigned TypeIdx, bool IsExtendedInts)
static bool legalizeExtractVectorElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeStore(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvExtractElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvBitcast(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvConstComposite(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeLoad(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeInsertVectorElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
#define LLVM_DEBUG(...)
Definition Debug.h:119
APInt bitcastToAPInt() const
Definition APFloat.h:1436
static APFloat getLargest(const fltSemantics &Sem, bool Negative=false)
Returns the largest finite number in the given semantics.
Definition APFloat.h:1203
static APFloat getInf(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Infinity.
Definition APFloat.h:1163
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition APInt.h:235
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition APInt.h:230
unsigned getActiveBits() const
Compute the number of active bits in the value.
Definition APInt.h:1535
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition APInt.h:880
static APInt getOneBitSet(unsigned numBits, unsigned BitNo)
Return an APInt with exactly one bit set in the result.
Definition APInt.h:240
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
static LLVM_ABI ArrayType * get(Type *ElementType, uint64_t NumElements)
This static method is the primary way to construct an ArrayType.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:740
@ ICMP_UGE
unsigned greater or equal
Definition InstrTypes.h:764
@ ICMP_UGT
unsigned greater than
Definition InstrTypes.h:763
@ ICMP_ULT
unsigned less than
Definition InstrTypes.h:765
@ ICMP_NE
not equal
Definition InstrTypes.h:762
static constexpr ElementCount getFixed(ScalarTy MinVal)
Definition TypeSize.h:309
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:348
static constexpr LLT vector(ElementCount EC, unsigned ScalarSizeInBits)
Get a low-level vector of some number of elements and element width.
LLT getScalarType() const
constexpr bool isPointerVector() const
static constexpr LLT scalar(unsigned SizeInBits)
Get a low-level scalar or aggregate "bag of bits".
constexpr bool isValid() const
constexpr uint16_t getNumElements() const
Returns the number of elements in a vector LLT.
constexpr bool isVector() const
static constexpr LLT pointer(unsigned AddressSpace, unsigned SizeInBits)
Get a low-level pointer in the given address space.
constexpr bool isPointer() const
constexpr unsigned getAddressSpace() const
static constexpr LLT fixed_vector(unsigned NumElements, unsigned ScalarSizeInBits)
Get a low-level fixed-width vector of some number of elements and element width.
constexpr bool isPointerOrPointerVector() const
constexpr bool isFixedVector() const
Returns true if the LLT is a fixed vector.
constexpr TypeSize getSizeInBytes() const
Returns the total size of the type in bytes, i.e.
LLT getElementType() const
Returns the vector's element type. Only valid for vector types.
LLVM_ABI void computeTables()
Compute any ancillary tables needed to quickly decide how an operation should be handled.
LegalizeRuleSet & legalFor(std::initializer_list< LLT > Types)
The instruction is legal when type index 0 is any type in the given list.
LegalizeRuleSet & fewerElementsIf(LegalityPredicate Predicate, LegalizeMutation Mutation)
Remove elements to reach the type selected by the mutation if the predicate is true.
LegalizeRuleSet & moreElementsToNextPow2(unsigned TypeIdx)
Add more elements to the vector to reach the next power of two.
LegalizeRuleSet & lower()
The instruction is lowered.
LegalizeRuleSet & scalarizeIf(LegalityPredicate Predicate, unsigned TypeIdx)
LegalizeRuleSet & lowerIf(LegalityPredicate Predicate)
The instruction is lowered if predicate is true.
LegalizeRuleSet & custom()
Unconditionally custom lower.
LegalizeRuleSet & unsupportedIf(LegalityPredicate Predicate)
LegalizeRuleSet & alwaysLegal()
LegalizeRuleSet & scalarize(unsigned TypeIdx)
LegalizeRuleSet & legalForCartesianProduct(std::initializer_list< LLT > Types)
The instruction is legal when type indexes 0 and 1 are both in the given list.
LegalizeRuleSet & legalIf(LegalityPredicate Predicate)
The instruction is legal if predicate is true.
LegalizeRuleSet & customFor(std::initializer_list< LLT > Types)
LLVM_ABI MachineInstrBuilder createStackTemporary(TypeSize Bytes, Align Alignment, MachinePointerInfo &PtrInfo)
Create a stack temporary based on the size in bytes and the alignment.
MachineIRBuilder & MIRBuilder
Expose MIRBuilder so clients can set their own RecordInsertInstruction functions.
LLVM_ABI Align getStackTemporaryAlignment(LLT Type, Align MinAlign=Align()) const
Return the alignment to use for a stack temporary object with the given type.
LegalizeRuleSet & getActionDefinitionsBuilder(unsigned Opcode)
Get the action definition builder for the given opcode.
const LegacyLegalizerInfo & getLegacyLegalizerInfo() const
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Helper class to build MachineInstr.
LLVMContext & getContext() const
MachineInstrBuilder buildUnmerge(ArrayRef< LLT > Res, const SrcOp &Op)
Build and insert Res0, ... = G_UNMERGE_VALUES Op.
MachineInstrBuilder buildAnd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_AND Op0, Op1.
MachineInstrBuilder buildICmp(CmpInst::Predicate Pred, const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_ICMP Pred, Op0, Op1.
MachineInstrBuilder buildSub(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_SUB Op0, Op1.
MachineInstrBuilder buildIntrinsic(Intrinsic::ID ID, ArrayRef< Register > Res, bool HasSideEffects, bool isConvergent)
Build and insert a G_INTRINSIC instruction.
MachineInstrBuilder buildSplatBuildVector(const DstOp &Res, const SrcOp &Src)
Build and insert Res = G_BUILD_VECTOR with Src replicated to fill the number of elements.
MachineInstrBuilder buildBuildVector(const DstOp &Res, ArrayRef< Register > Ops)
Build and insert Res = G_BUILD_VECTOR Op0, ...
MachineInstrBuilder buildLoad(const DstOp &Res, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert Res = G_LOAD Addr, MMO.
MachineInstrBuilder buildStore(const SrcOp &Val, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert G_STORE Val, Addr, MMO.
MachineInstrBuilder buildInstr(unsigned Opcode)
Build and insert <empty> = Opcode <empty>.
MachineFunction & getMF()
Getter for the function we currently build.
MachineInstrBuilder buildBitcast(const DstOp &Dst, const SrcOp &Src)
Build and insert Dst = G_BITCAST Src.
MachineRegisterInfo * getMRI()
Getter for MRI.
MachineInstrBuilder buildOr(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_OR Op0, Op1.
MachineInstrBuilder buildCopy(const DstOp &Res, const SrcOp &Op)
Build and insert Res = COPY Op.
MachineInstrBuilder buildXor(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_XOR Op0, Op1.
virtual MachineInstrBuilder buildConstant(const DstOp &Res, const ConstantInt &Val)
Build and insert Res = G_CONSTANT Val.
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
Representation of each machine instruction.
A description of a memory reference used in the backend.
const MachinePointerInfo & getPointerInfo() const
LLVM_ABI Align getAlign() const
Return the minimum known alignment in bytes of the actual memory reference.
MachineOperand class - Representation of each machine instruction operand.
Register getReg() const
getReg - Returns the register number.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLT getType(Register Reg) const
Get the low-level type of Reg or LLT{} if Reg is not a generic (target independent) virtual register.
LLVM_ABI void setRegClass(Register Reg, const TargetRegisterClass *RC)
setRegClass - Set the register class of the specified virtual register.
LLVM_ABI Register createGenericVirtualRegister(LLT Ty, StringRef Name="")
Create and return a new generic virtual register with low-level type Ty.
Wrapper class representing virtual and physical registers.
Definition Register.h:20
void assignSPIRVTypeToVReg(SPIRVTypeInst Type, Register VReg, const MachineFunction &MF)
const TargetRegisterClass * getRegClass(SPIRVTypeInst SpvType) const
const Type * getTypeForSPIRVType(SPIRVTypeInst Ty) const
LLT getRegType(SPIRVTypeInst SpvType) const
SPIRVTypeInst getOrCreateSPIRVPointerType(const Type *BaseType, MachineIRBuilder &MIRBuilder, SPIRV::StorageClass::StorageClass SC)
SPIRVTypeInst getScalarOrVectorComponentType(SPIRVTypeInst Type) const
SPIRVTypeInst getOrCreateSPIRVType(const Type *Type, MachineInstr &I, SPIRV::AccessQualifier::AccessQualifier AQ, bool EmitIR)
SPIRVTypeInst getSPIRVTypeForVReg(Register VReg, const MachineFunction *MF=nullptr) const
SPIRVLegalizerInfo(const SPIRVSubtarget &ST)
bool legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI, LostDebugLocObserver &LocObserver) const override
Called for instructions with the Custom LegalizationAction.
bool legalizeIntrinsic(LegalizerHelper &Helper, MachineInstr &MI) const override
SPIRVGlobalRegistry * getSPIRVGlobalRegistry() const
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:343
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
static LLVM_ABI VectorType * get(Type *ElementType, ElementCount EC)
This static method is the primary way to construct an VectorType.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
LLVM_ABI LegalityPredicate isScalar(unsigned TypeIdx)
True iff the specified type index is a scalar.
LLVM_ABI LegalityPredicate numElementsNotPow2(unsigned TypeIdx)
True iff the specified type index is a vector whose element count is not a power of 2.
LLVM_ABI LegalityPredicate vectorElementCountIsLessThanOrEqualTo(unsigned TypeIdx, unsigned Size)
True iff the specified type index is a vector with a number of elements that's less than or equal to ...
LLVM_ABI LegalityPredicate typeInSet(unsigned TypeIdx, std::initializer_list< LLT > TypesInit)
True iff the given type index is one of the specified types.
LLVM_ABI LegalityPredicate vectorElementCountIsGreaterThan(unsigned TypeIdx, unsigned Size)
True iff the specified type index is a vector with a number of elements that's greater than the given...
Predicate any(Predicate P0, Predicate P1)
True iff P0 or P1 are true.
LegalityPredicate typeIsNot(unsigned TypeIdx, LLT Type)
True iff the given type index is not the specified type.
Predicate all(Predicate P0, Predicate P1)
True iff P0 and P1 are true.
LLVM_ABI LegalityPredicate typeIs(unsigned TypeIdx, LLT TypesInit)
True iff the given type index is the specified type.
LLVM_ABI LegalizeMutation changeElementCountTo(unsigned TypeIdx, unsigned FromTypeIdx)
Keep the same scalar or element type as TypeIdx, but take the number of elements from FromTypeIdx.
LLVM_ABI LegalizeMutation changeElementSizeTo(unsigned TypeIdx, unsigned FromTypeIdx)
Change the scalar size or element size to have the same scalar size as type index FromIndex.
Invariant opcodes: All instruction sets have these as their low opcodes.
This is an optimization pass for GlobalISel generic memory operations.
LLVM_ABI const llvm::fltSemantics & getFltSemanticForLLT(LLT Ty)
Get the appropriate floating point arithmetic semantic based on the bit size of the given scalar LLT.
std::function< bool(const LegalityQuery &)> LegalityPredicate
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition MathExtras.h:279
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209
const std::set< unsigned > & getTypeFoldingSupportedOpcodes()
int64_t foldImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:201
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
The LegalityQuery object bundles together all the information that's needed to decide whether a given...
ArrayRef< LLT > Types
This class contains a discriminated union of information about pointers in memory operands,...
MachinePointerInfo getWithOffset(int64_t O) const