35#include "llvm/IR/IntrinsicsWebAssembly.h"
42#define DEBUG_TYPE "wasm-lower"
47 auto MVTPtr = Subtarget->hasAddr64() ? MVT::i64 : MVT::i32;
61 Subtarget->hasAddr64() ? WebAssembly::SP64 : WebAssembly::SP32);
67 if (Subtarget->hasSIMD128()) {
75 if (Subtarget->hasFP16()) {
78 if (Subtarget->hasReferenceTypes()) {
81 if (Subtarget->hasExceptionHandling()) {
90 for (
auto T : {MVT::i32, MVT::i64, MVT::f32, MVT::f64}) {
94 if (Subtarget->hasSIMD128()) {
95 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,
101 if (Subtarget->hasFP16()) {
105 if (Subtarget->hasReferenceTypes()) {
108 for (
auto T : {MVT::externref, MVT::funcref, MVT::Other}) {
129 for (
auto T : {MVT::f32, MVT::f64, MVT::v4f32, MVT::v2f64, MVT::v8f16}) {
130 if (!Subtarget->hasFP16() &&
T == MVT::v8f16) {
143 if (
MVT(
T).isVector())
157 if (
T != MVT::v8f16) {
170 for (
auto T : {MVT::i32, MVT::i64})
172 if (Subtarget->hasSIMD128())
173 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64})
177 if (Subtarget->hasWideArithmetic()) {
185 if (Subtarget->hasNontrappingFPToInt())
187 for (
auto T : {MVT::i32, MVT::i64})
190 if (Subtarget->hasRelaxedSIMD()) {
193 {MVT::v4f32, MVT::v2f64},
Custom);
196 if (Subtarget->hasSIMD128()) {
230 for (
auto T : {MVT::v16i8, MVT::v8i16})
234 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64})
238 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,
242 if (Subtarget->hasFP16())
246 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,
250 if (Subtarget->hasFP16())
254 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,
262 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64})
267 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,
277 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64})
282 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32})
292 for (
auto T : {MVT::v8i16, MVT::v4i32, MVT::v2i64})
298 for (
auto T : {MVT::v4f32, MVT::v2f64})
308 for (
auto T : {MVT::v2i64, MVT::v2f64})
314 if (Subtarget->hasFP16()) {
326 if (Subtarget->hasFP16()) {
330 if (Subtarget->hasRelaxedSIMD()) {
345 if (!Subtarget->hasSignExt()) {
347 auto Action = Subtarget->hasSIMD128() ?
Custom :
Expand;
348 for (
auto T : {MVT::i8, MVT::i16, MVT::i32})
364 for (
auto T : {MVT::i32, MVT::i64, MVT::f32, MVT::f64})
368 if (Subtarget->hasReferenceTypes())
370 for (
auto T : {MVT::externref, MVT::funcref})
375 {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64, MVT::v2f64})
391 if (Subtarget->hasSIMD128()) {
392 for (
auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64, MVT::v4f32,
395 if (
MVT(
T) != MemT) {
434 return MVT::externref;
443 return MVT::externref;
450WebAssemblyTargetLowering::shouldExpandAtomicRMWInIR(
467bool WebAssemblyTargetLowering::shouldScalarizeBinop(
SDValue VecOp)
const {
487FastISel *WebAssemblyTargetLowering::createFastISel(
493MVT WebAssemblyTargetLowering::getScalarShiftAmountTy(
const DataLayout & ,
504 "32-bit shift counts ought to be enough for anyone");
509 "Unable to represent scalar shift amount type");
519 bool IsUnsigned,
bool Int64,
520 bool Float64,
unsigned LoweredOpcode) {
526 unsigned Abs = Float64 ? WebAssembly::ABS_F64 : WebAssembly::ABS_F32;
527 unsigned FConst = Float64 ? WebAssembly::CONST_F64 : WebAssembly::CONST_F32;
528 unsigned LT = Float64 ? WebAssembly::LT_F64 : WebAssembly::LT_F32;
529 unsigned GE = Float64 ? WebAssembly::GE_F64 : WebAssembly::GE_F32;
530 unsigned IConst = Int64 ? WebAssembly::CONST_I64 : WebAssembly::CONST_I32;
531 unsigned Eqz = WebAssembly::EQZ_I32;
532 unsigned And = WebAssembly::AND_I32;
533 int64_t Limit = Int64 ?
INT64_MIN : INT32_MIN;
534 int64_t Substitute = IsUnsigned ? 0 : Limit;
535 double CmpVal = IsUnsigned ? -(double)Limit * 2.0 : -(double)Limit;
546 F->insert(It, FalseMBB);
547 F->insert(It, TrueMBB);
548 F->insert(It, DoneMBB);
551 DoneMBB->
splice(DoneMBB->
begin(), BB, std::next(
MI.getIterator()), BB->
end());
559 unsigned Tmp0, Tmp1, CmpReg, EqzReg, FalseReg, TrueReg;
560 Tmp0 =
MRI.createVirtualRegister(
MRI.getRegClass(InReg));
561 Tmp1 =
MRI.createVirtualRegister(
MRI.getRegClass(InReg));
562 CmpReg =
MRI.createVirtualRegister(&WebAssembly::I32RegClass);
563 EqzReg =
MRI.createVirtualRegister(&WebAssembly::I32RegClass);
564 FalseReg =
MRI.createVirtualRegister(
MRI.getRegClass(OutReg));
565 TrueReg =
MRI.createVirtualRegister(
MRI.getRegClass(OutReg));
567 MI.eraseFromParent();
581 Tmp1 =
MRI.createVirtualRegister(
MRI.getRegClass(InReg));
583 MRI.createVirtualRegister(&WebAssembly::I32RegClass);
584 Register AndReg =
MRI.createVirtualRegister(&WebAssembly::I32RegClass);
624 if (Def->getOpcode() == WebAssembly::CONST_I32 ||
625 Def->getOpcode() == WebAssembly::CONST_I64) {
626 if (Def->getOperand(1).getImm() == 0) {
628 MI.eraseFromParent();
632 unsigned MemoryCopy =
633 Int64 ? WebAssembly::MEMORY_COPY_A64 : WebAssembly::MEMORY_COPY_A32;
640 MI.eraseFromParent();
651 unsigned Eqz = Int64 ? WebAssembly::EQZ_I64 : WebAssembly::EQZ_I32;
652 unsigned MemoryCopy =
653 Int64 ? WebAssembly::MEMORY_COPY_A64 : WebAssembly::MEMORY_COPY_A32;
664 F->insert(It, TrueMBB);
665 F->insert(It, DoneMBB);
668 DoneMBB->
splice(DoneMBB->
begin(), BB, std::next(
MI.getIterator()), BB->
end());
678 EqzReg =
MRI.createVirtualRegister(&WebAssembly::I32RegClass);
681 MI.eraseFromParent();
715 if (Def->getOpcode() == WebAssembly::CONST_I32 ||
716 Def->getOpcode() == WebAssembly::CONST_I64) {
717 if (Def->getOperand(1).getImm() == 0) {
719 MI.eraseFromParent();
723 unsigned MemoryFill =
724 Int64 ? WebAssembly::MEMORY_FILL_A64 : WebAssembly::MEMORY_FILL_A32;
730 MI.eraseFromParent();
741 unsigned Eqz = Int64 ? WebAssembly::EQZ_I64 : WebAssembly::EQZ_I32;
742 unsigned MemoryFill =
743 Int64 ? WebAssembly::MEMORY_FILL_A64 : WebAssembly::MEMORY_FILL_A32;
754 F->insert(It, TrueMBB);
755 F->insert(It, DoneMBB);
758 DoneMBB->
splice(DoneMBB->
begin(), BB, std::next(
MI.getIterator()), BB->
end());
768 EqzReg =
MRI.createVirtualRegister(&WebAssembly::I32RegClass);
771 MI.eraseFromParent();
793 CallResults.
getOpcode() == WebAssembly::RET_CALL_RESULTS);
797 bool IsRetCall = CallResults.
getOpcode() == WebAssembly::RET_CALL_RESULTS;
799 bool IsFuncrefCall =
false;
805 IsFuncrefCall = (TRC == &WebAssembly::FUNCREFRegClass);
810 if (IsIndirect && IsRetCall) {
811 CallOp = WebAssembly::RET_CALL_INDIRECT;
812 }
else if (IsIndirect) {
813 CallOp = WebAssembly::CALL_INDIRECT;
814 }
else if (IsRetCall) {
815 CallOp = WebAssembly::RET_CALL;
817 CallOp = WebAssembly::CALL;
846 for (
auto Def : CallResults.
defs())
870 for (
auto Use : CallParams.
uses())
886 if (IsIndirect && IsFuncrefCall) {
898 BuildMI(MF,
DL,
TII.get(WebAssembly::REF_NULL_FUNCREF), RegFuncref);
902 BuildMI(MF,
DL,
TII.get(WebAssembly::TABLE_SET_FUNCREF))
914 const TargetInstrInfo &
TII = *Subtarget->getInstrInfo();
917 switch (
MI.getOpcode()) {
920 case WebAssembly::FP_TO_SINT_I32_F32:
922 WebAssembly::I32_TRUNC_S_F32);
923 case WebAssembly::FP_TO_UINT_I32_F32:
925 WebAssembly::I32_TRUNC_U_F32);
926 case WebAssembly::FP_TO_SINT_I64_F32:
928 WebAssembly::I64_TRUNC_S_F32);
929 case WebAssembly::FP_TO_UINT_I64_F32:
931 WebAssembly::I64_TRUNC_U_F32);
932 case WebAssembly::FP_TO_SINT_I32_F64:
934 WebAssembly::I32_TRUNC_S_F64);
935 case WebAssembly::FP_TO_UINT_I32_F64:
937 WebAssembly::I32_TRUNC_U_F64);
938 case WebAssembly::FP_TO_SINT_I64_F64:
940 WebAssembly::I64_TRUNC_S_F64);
941 case WebAssembly::FP_TO_UINT_I64_F64:
943 WebAssembly::I64_TRUNC_U_F64);
944 case WebAssembly::MEMCPY_A32:
946 case WebAssembly::MEMCPY_A64:
948 case WebAssembly::MEMSET_A32:
950 case WebAssembly::MEMSET_A64:
952 case WebAssembly::CALL_RESULTS:
953 case WebAssembly::RET_CALL_RESULTS:
958std::pair<unsigned, const TargetRegisterClass *>
959WebAssemblyTargetLowering::getRegForInlineAsmConstraint(
963 if (Constraint.
size() == 1) {
964 switch (Constraint[0]) {
966 assert(VT != MVT::iPTR &&
"Pointer MVT not expected here");
967 if (Subtarget->hasSIMD128() && VT.
isVector()) {
969 return std::make_pair(0U, &WebAssembly::V128RegClass);
973 return std::make_pair(0U, &WebAssembly::I32RegClass);
975 return std::make_pair(0U, &WebAssembly::I64RegClass);
980 return std::make_pair(0U, &WebAssembly::F32RegClass);
982 return std::make_pair(0U, &WebAssembly::F64RegClass);
996bool WebAssemblyTargetLowering::isCheapToSpeculateCttz(
Type *Ty)
const {
1001bool WebAssemblyTargetLowering::isCheapToSpeculateCtlz(
Type *Ty)
const {
1006bool WebAssemblyTargetLowering::isLegalAddressingMode(
const DataLayout &
DL,
1008 Type *Ty,
unsigned AS,
1013 if (AM.BaseOffs < 0)
1024bool WebAssemblyTargetLowering::allowsMisalignedMemoryAccesses(
1038bool WebAssemblyTargetLowering::isIntDivCheap(
EVT VT,
1039 AttributeList Attr)
const {
1045bool WebAssemblyTargetLowering::isVectorLoadExtDesirable(
SDValue ExtVal)
const {
1048 return (ExtT == MVT::v8i16 && MemT == MVT::v8i8) ||
1049 (ExtT == MVT::v4i32 && MemT == MVT::v4i16) ||
1050 (ExtT == MVT::v2i64 && MemT == MVT::v2i32);
1053bool WebAssemblyTargetLowering::isOffsetFoldingLegal(
1056 const GlobalValue *GV = GA->
getGlobal();
1060EVT WebAssemblyTargetLowering::getSetCCResultType(
const DataLayout &
DL,
1073void WebAssemblyTargetLowering::getTgtMemIntrinsic(
1077 switch (Intrinsic) {
1078 case Intrinsic::wasm_memory_atomic_notify:
1080 Info.memVT = MVT::i32;
1081 Info.ptrVal =
I.getArgOperand(0);
1093 case Intrinsic::wasm_memory_atomic_wait32:
1095 Info.memVT = MVT::i32;
1096 Info.ptrVal =
I.getArgOperand(0);
1102 case Intrinsic::wasm_memory_atomic_wait64:
1104 Info.memVT = MVT::i64;
1105 Info.ptrVal =
I.getArgOperand(0);
1111 case Intrinsic::wasm_loadf16_f32:
1113 Info.memVT = MVT::f16;
1114 Info.ptrVal =
I.getArgOperand(0);
1120 case Intrinsic::wasm_storef16_f32:
1122 Info.memVT = MVT::f16;
1123 Info.ptrVal =
I.getArgOperand(1);
1134void WebAssemblyTargetLowering::computeKnownBitsForTargetNode(
1137 switch (
Op.getOpcode()) {
1141 unsigned IntNo =
Op.getConstantOperandVal(0);
1145 case Intrinsic::wasm_bitmask: {
1147 EVT VT =
Op.getOperand(1).getSimpleValueType();
1150 Known.
Zero |= ZeroMask;
1156 case WebAssemblyISD::EXTEND_LOW_U:
1157 case WebAssemblyISD::EXTEND_HIGH_U: {
1162 if (VT == MVT::v8i8 || VT == MVT::v16i8) {
1166 }
else if (VT == MVT::v4i16 || VT == MVT::v8i16) {
1170 }
else if (VT == MVT::v2i32 || VT == MVT::v4i32) {
1180 case WebAssemblyISD::I64_ADD128:
1181 if (
Op.getResNo() == 1) {
1192WebAssemblyTargetLowering::getPreferredVectorAction(
MVT VT)
const {
1198 if (EltVT == MVT::i8 || EltVT == MVT::i16 || EltVT == MVT::i32 ||
1199 EltVT == MVT::i64 || EltVT == MVT::f32 || EltVT == MVT::f64)
1206bool WebAssemblyTargetLowering::isFMAFasterThanFMulAndFAdd(
1208 if (!Subtarget->hasFP16() || !VT.
isVector())
1218bool WebAssemblyTargetLowering::shouldSimplifyDemandedVectorElts(
1219 SDValue Op,
const TargetLoweringOpt &TLO)
const {
1272WebAssemblyTargetLowering::LowerCall(CallLoweringInfo &CLI,
1274 SelectionDAG &DAG = CLI.DAG;
1284 "WebAssembly doesn't support language-specific or target-specific "
1285 "calling conventions yet");
1286 if (CLI.IsPatchPoint)
1287 fail(
DL, DAG,
"WebAssembly doesn't support patch point yet");
1289 if (CLI.IsTailCall) {
1290 auto NoTail = [&](
const char *Msg) {
1291 if (CLI.CB && CLI.CB->isMustTailCall())
1293 CLI.IsTailCall =
false;
1296 if (!Subtarget->hasTailCall())
1297 NoTail(
"WebAssembly 'tail-call' feature not enabled");
1301 NoTail(
"WebAssembly does not support varargs tail calls");
1306 Type *RetTy =
F.getReturnType();
1311 bool TypesMatch = CallerRetTys.
size() == CalleeRetTys.
size() &&
1312 std::equal(CallerRetTys.
begin(), CallerRetTys.
end(),
1313 CalleeRetTys.
begin());
1315 NoTail(
"WebAssembly tail call requires caller and callee return types to "
1320 for (
auto &Arg : CLI.CB->args()) {
1321 Value *Val = Arg.get();
1326 Src =
GEP->getPointerOperand();
1333 "WebAssembly does not support tail calling with stack arguments");
1340 SmallVectorImpl<ISD::InputArg> &Ins = CLI.Ins;
1341 SmallVectorImpl<ISD::OutputArg> &Outs = CLI.Outs;
1342 SmallVectorImpl<SDValue> &OutVals = CLI.OutVals;
1348 Outs[0].Flags.isSRet()) {
1353 bool HasSwiftSelfArg =
false;
1354 bool HasSwiftErrorArg =
false;
1355 unsigned NumFixedArgs = 0;
1356 for (
unsigned I = 0;
I < Outs.
size(); ++
I) {
1357 const ISD::OutputArg &Out = Outs[
I];
1362 fail(
DL, DAG,
"WebAssembly hasn't implemented nest arguments");
1364 fail(
DL, DAG,
"WebAssembly hasn't implemented inalloca arguments");
1366 fail(
DL, DAG,
"WebAssembly hasn't implemented cons regs arguments");
1368 fail(
DL, DAG,
"WebAssembly hasn't implemented cons regs last arguments");
1377 Chain = DAG.
getMemcpy(Chain,
DL, FINode, OutVal, SizeNode,
1380 nullptr, std::nullopt, MachinePointerInfo(),
1381 MachinePointerInfo());
1388 bool IsVarArg = CLI.IsVarArg;
1397 if (!HasSwiftSelfArg) {
1399 ISD::ArgFlagsTy
Flags;
1400 Flags.setSwiftSelf();
1401 ISD::OutputArg Arg(Flags, PtrVT, EVT(PtrVT), PtrTy, 0, 0);
1402 CLI.Outs.push_back(Arg);
1404 CLI.OutVals.push_back(ArgVal);
1406 if (!HasSwiftErrorArg) {
1408 ISD::ArgFlagsTy
Flags;
1409 Flags.setSwiftError();
1410 ISD::OutputArg Arg(Flags, PtrVT, EVT(PtrVT), PtrTy, 0, 0);
1411 CLI.Outs.push_back(Arg);
1413 CLI.OutVals.push_back(ArgVal);
1419 CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs, *DAG.
getContext());
1424 for (
unsigned I = NumFixedArgs;
I < Outs.
size(); ++
I) {
1425 const ISD::OutputArg &Out = Outs[
I];
1428 assert(VT != MVT::iPTR &&
"Legalized args should be concrete");
1433 CCInfo.AllocateStack(Layout.getTypeAllocSize(Ty), Alignment);
1440 unsigned NumBytes = CCInfo.getAlignedCallFrameSize();
1443 if (IsVarArg && NumBytes) {
1446 MaybeAlign StackAlign = Layout.getStackAlignment();
1447 assert(StackAlign &&
"data layout string is missing stack alignment");
1453 assert(ArgLocs[ValNo].getValNo() == ValNo &&
1454 "ArgLocs should remain in order and only hold varargs args");
1455 unsigned Offset = ArgLocs[ValNo++].getLocMemOffset();
1463 if (!Chains.
empty())
1465 }
else if (IsVarArg) {
1483 Ops.push_back(Chain);
1484 Ops.push_back(Callee);
1489 IsVarArg ? OutVals.
begin() + NumFixedArgs : OutVals.
end());
1492 Ops.push_back(FINode);
1495 for (
const auto &In : Ins) {
1496 assert(!
In.Flags.isByVal() &&
"byval is not valid for return values");
1497 assert(!
In.Flags.isNest() &&
"nest is not valid for return values");
1498 if (
In.Flags.isInAlloca())
1499 fail(
DL, DAG,
"WebAssembly hasn't implemented inalloca return values");
1500 if (
In.Flags.isInConsecutiveRegs())
1501 fail(
DL, DAG,
"WebAssembly hasn't implemented cons regs return values");
1502 if (
In.Flags.isInConsecutiveRegsLast())
1504 "WebAssembly hasn't implemented cons regs last return values");
1513 CLI.CB->getCalledOperand()->getType())) {
1528 WebAssemblyISD::TABLE_SET,
DL, DAG.
getVTList(MVT::Other), TableSetOps,
1533 CLI.CB->getCalledOperand()->getPointerAlignment(DAG.
getDataLayout()),
1539 if (CLI.IsTailCall) {
1541 SDVTList NodeTys = DAG.
getVTList(MVT::Other, MVT::Glue);
1546 SDVTList InTyList = DAG.
getVTList(InTys);
1549 for (
size_t I = 0;
I < Ins.size(); ++
I)
1556bool WebAssemblyTargetLowering::CanLowerReturn(
1559 const Type *RetTy)
const {
1564SDValue WebAssemblyTargetLowering::LowerReturn(
1570 "MVP WebAssembly can only return up to one value");
1572 fail(
DL, DAG,
"WebAssembly doesn't support non-C calling conventions");
1575 RetOps.append(OutVals.
begin(), OutVals.
end());
1576 Chain = DAG.
getNode(WebAssemblyISD::RETURN,
DL, MVT::Other, RetOps);
1579 for (
const ISD::OutputArg &Out : Outs) {
1584 fail(
DL, DAG,
"WebAssembly hasn't implemented inalloca results");
1586 fail(
DL, DAG,
"WebAssembly hasn't implemented cons regs results");
1588 fail(
DL, DAG,
"WebAssembly hasn't implemented cons regs last results");
1594SDValue WebAssemblyTargetLowering::LowerFormalArguments(
1599 fail(
DL, DAG,
"WebAssembly doesn't support non-C calling conventions");
1602 auto *MFI = MF.
getInfo<WebAssemblyFunctionInfo>();
1608 bool HasSwiftErrorArg =
false;
1609 bool HasSwiftSelfArg =
false;
1610 for (
const ISD::InputArg &In : Ins) {
1611 HasSwiftSelfArg |=
In.Flags.isSwiftSelf();
1612 HasSwiftErrorArg |=
In.Flags.isSwiftError();
1613 if (
In.Flags.isInAlloca())
1614 fail(
DL, DAG,
"WebAssembly hasn't implemented inalloca arguments");
1615 if (
In.Flags.isNest())
1616 fail(
DL, DAG,
"WebAssembly hasn't implemented nest arguments");
1617 if (
In.Flags.isInConsecutiveRegs())
1618 fail(
DL, DAG,
"WebAssembly hasn't implemented cons regs arguments");
1619 if (
In.Flags.isInConsecutiveRegsLast())
1620 fail(
DL, DAG,
"WebAssembly hasn't implemented cons regs last arguments");
1629 MFI->addParam(
In.VT);
1638 if (!HasSwiftSelfArg) {
1639 MFI->addParam(PtrVT);
1641 if (!HasSwiftErrorArg) {
1642 MFI->addParam(PtrVT);
1651 MFI->setVarargBufferVreg(VarargVreg);
1653 Chain,
DL, VarargVreg,
1654 DAG.
getNode(WebAssemblyISD::ARGUMENT,
DL, PtrVT,
1656 MFI->addParam(PtrVT);
1668 assert(MFI->getParams().size() == Params.
size() &&
1669 std::equal(MFI->getParams().begin(), MFI->getParams().end(),
1675void WebAssemblyTargetLowering::ReplaceNodeResults(
1677 switch (
N->getOpcode()) {
1692 Results.push_back(Replace128Op(
N, DAG));
1696 "ReplaceNodeResults not implemented for this op for WebAssembly!");
1707 switch (
Op.getOpcode()) {
1712 return LowerFrameIndex(
Op, DAG);
1714 return LowerGlobalAddress(
Op, DAG);
1716 return LowerGlobalTLSAddress(
Op, DAG);
1718 return LowerExternalSymbol(
Op, DAG);
1720 return LowerJumpTable(
Op, DAG);
1722 return LowerBR_JT(
Op, DAG);
1724 return LowerVASTART(
Op, DAG);
1727 fail(
DL, DAG,
"WebAssembly hasn't implemented computed gotos");
1730 return LowerRETURNADDR(
Op, DAG);
1732 return LowerFRAMEADDR(
Op, DAG);
1734 return LowerCopyToReg(
Op, DAG);
1737 return LowerAccessVectorElement(
Op, DAG);
1741 return LowerIntrinsic(
Op, DAG);
1743 return LowerSIGN_EXTEND_INREG(
Op, DAG);
1747 return LowerEXTEND_VECTOR_INREG(
Op, DAG);
1749 return LowerBUILD_VECTOR(
Op, DAG);
1751 return LowerVECTOR_SHUFFLE(
Op, DAG);
1753 return LowerSETCC(
Op, DAG);
1757 return LowerShift(
Op, DAG);
1760 return LowerFP_TO_INT_SAT(
Op, DAG);
1763 return LowerFMIN(
Op, DAG);
1766 return LowerFMAX(
Op, DAG);
1768 return LowerLoad(
Op, DAG);
1770 return LowerStore(
Op, DAG);
1779 return LowerMUL_LOHI(
Op, DAG);
1781 return LowerUADDO(
Op, DAG);
1796 return std::nullopt;
1815 SDVTList Tys = DAG.
getVTList(MVT::Other);
1827 SDVTList Tys = DAG.
getVTList(MVT::Other);
1829 return DAG.
getNode(WebAssemblyISD::LOCAL_SET,
DL, Tys,
Ops);
1834 "Encountered an unlowerable store to the wasm_var address space",
1850 "unexpected offset when loading from webassembly global",
false);
1861 "unexpected offset when loading from webassembly local",
false);
1865 return DAG.
getNode(WebAssemblyISD::LOCAL_GET,
DL, {LocalVT, MVT::Other},
1871 "Encountered an unlowerable load from the wasm_var address space",
1879 assert(Subtarget->hasWideArithmetic());
1880 assert(
Op.getValueType() == MVT::i64);
1883 switch (
Op.getOpcode()) {
1885 Opcode = WebAssemblyISD::I64_MUL_WIDE_U;
1888 Opcode = WebAssemblyISD::I64_MUL_WIDE_S;
1909 assert(Subtarget->hasWideArithmetic());
1910 assert(
Op.getValueType() == MVT::i64);
1917 DAG.
getNode(WebAssemblyISD::I64_ADD128,
DL,
1927 assert(Subtarget->hasWideArithmetic());
1928 assert(
N->getValueType(0) == MVT::i128);
1931 switch (
N->getOpcode()) {
1933 Opcode = WebAssemblyISD::I64_ADD128;
1936 Opcode = WebAssemblyISD::I64_SUB128;
1951 LHS_0, LHS_1, RHS_0, RHS_1);
1968 EVT VT = Src.getValueType();
1970 : WebAssembly::COPY_I64,
1973 return Op.getNode()->getNumValues() == 1
1992 if (!Subtarget->getTargetTriple().isOSEmscripten()) {
1994 "Non-Emscripten WebAssembly hasn't implemented "
1995 "__builtin_return_address");
1999 unsigned Depth =
Op.getConstantOperandVal(0);
2001 return makeLibCall(DAG, RTLIB::RETURN_ADDRESS,
Op.getValueType(),
2002 {DAG.getConstant(Depth, DL, MVT::i32)}, CallOptions,
DL)
2011 if (
Op.getConstantOperandVal(0) > 0)
2015 EVT VT =
Op.getValueType();
2022WebAssemblyTargetLowering::LowerGlobalTLSAddress(
SDValue Op,
2028 if (!MF.
getSubtarget<WebAssemblySubtarget>().hasBulkMemory())
2032 const GlobalValue *GV = GA->
getGlobal();
2037 auto model = Subtarget->getTargetTriple().isOSEmscripten()
2052 auto GlobalGet = PtrVT == MVT::i64 ? WebAssembly::GLOBAL_GET_I64
2053 : WebAssembly::GLOBAL_GET_I32;
2064 DAG.
getNode(WebAssemblyISD::WrapperREL,
DL, PtrVT, TLSOffset);
2071 EVT VT =
Op.getValueType();
2072 return DAG.
getNode(WebAssemblyISD::Wrapper,
DL, VT,
2082 EVT VT =
Op.getValueType();
2084 "Unexpected target flags on generic GlobalAddressSDNode");
2086 fail(
DL, DAG,
"Invalid address space for WebAssembly target");
2089 const GlobalValue *GV = GA->
getGlobal();
2097 const char *BaseName;
2106 DAG.
getNode(WebAssemblyISD::Wrapper,
DL, PtrVT,
2110 WebAssemblyISD::WrapperREL,
DL, VT,
2119 return DAG.
getNode(WebAssemblyISD::Wrapper,
DL, VT,
2125WebAssemblyTargetLowering::LowerExternalSymbol(
SDValue Op,
2129 EVT VT =
Op.getValueType();
2130 assert(ES->getTargetFlags() == 0 &&
2131 "Unexpected target flags on generic ExternalSymbolSDNode");
2132 return DAG.
getNode(WebAssemblyISD::Wrapper,
DL, VT,
2155 Ops.push_back(Chain);
2156 Ops.push_back(Index);
2162 for (
auto *
MBB : MBBs)
2169 return DAG.
getNode(WebAssemblyISD::BR_TABLE,
DL, MVT::Other,
Ops);
2181 MFI->getVarargBufferVreg(), PtrVT);
2182 return DAG.
getStore(
Op.getOperand(0),
DL, ArgN,
Op.getOperand(1),
2183 MachinePointerInfo(SV));
2190 switch (
Op.getOpcode()) {
2193 IntNo =
Op.getConstantOperandVal(1);
2196 IntNo =
Op.getConstantOperandVal(0);
2207 case Intrinsic::wasm_lsda: {
2216 DAG.
getNode(WebAssemblyISD::Wrapper,
DL, PtrVT,
2219 DAG.
getNode(WebAssemblyISD::WrapperREL,
DL, PtrVT, Node);
2223 return DAG.
getNode(WebAssemblyISD::Wrapper,
DL, PtrVT, Node);
2226 case Intrinsic::wasm_shuffle: {
2232 while (
OpIdx < 18) {
2241 return DAG.
getNode(WebAssemblyISD::SHUFFLE,
DL,
Op.getValueType(),
Ops);
2244 case Intrinsic::thread_pointer: {
2246 auto GlobalGet = PtrVT == MVT::i64 ? WebAssembly::GLOBAL_GET_I64
2247 : WebAssembly::GLOBAL_GET_I32;
2258WebAssemblyTargetLowering::LowerSIGN_EXTEND_INREG(
SDValue Op,
2268 assert(!Subtarget->hasSignExt() && Subtarget->hasSIMD128());
2272 const SDValue &Extract =
Op.getOperand(0);
2276 MVT ExtractedLaneT =
2280 if (ExtractedVecT == VecT)
2287 unsigned IndexVal =
Index->getAsZExtVal();
2306 assert((UserOpc == WebAssemblyISD::EXTEND_LOW_U ||
2307 UserOpc == WebAssemblyISD::EXTEND_LOW_S) &&
2308 "expected extend_low");
2313 size_t FirstIdx = Mask.size() / 2;
2314 for (
size_t i = 0; i < Mask.size() / 2; ++i) {
2315 if (Mask[i] !=
static_cast<int>(FirstIdx + i)) {
2321 unsigned Opc = UserOpc == WebAssemblyISD::EXTEND_LOW_S
2322 ? WebAssemblyISD::EXTEND_HIGH_S
2323 : WebAssemblyISD::EXTEND_HIGH_U;
2326 ShuffleSrc = DAG.
getBitcast(
Op.getValueType(), ShuffleSrc);
2332WebAssemblyTargetLowering::LowerEXTEND_VECTOR_INREG(
SDValue Op,
2335 EVT VT =
Op.getValueType();
2337 EVT SrcVT = Src.getValueType();
2344 "Unexpected extension factor.");
2347 if (Scale != 2 && Scale != 4 && Scale != 8)
2351 switch (
Op.getOpcode()) {
2356 Ext = WebAssemblyISD::EXTEND_LOW_U;
2359 Ext = WebAssemblyISD::EXTEND_LOW_S;
2370 while (Scale != 1) {
2384 if (
Op.getValueType() != MVT::v2f64)
2388 unsigned &Index) ->
bool {
2389 switch (
Op.getOpcode()) {
2391 Opcode = WebAssemblyISD::CONVERT_LOW_S;
2394 Opcode = WebAssemblyISD::CONVERT_LOW_U;
2397 Opcode = WebAssemblyISD::PROMOTE_LOW;
2403 auto ExtractVector =
Op.getOperand(0);
2410 SrcVec = ExtractVector.getOperand(0);
2411 Index = ExtractVector.getConstantOperandVal(1);
2415 unsigned LHSOpcode, RHSOpcode, LHSIndex, RHSIndex;
2417 if (!GetConvertedLane(
Op.getOperand(0), LHSOpcode, LHSSrcVec, LHSIndex) ||
2418 !GetConvertedLane(
Op.getOperand(1), RHSOpcode, RHSSrcVec, RHSIndex))
2421 if (LHSOpcode != RHSOpcode)
2425 switch (LHSOpcode) {
2426 case WebAssemblyISD::CONVERT_LOW_S:
2427 case WebAssemblyISD::CONVERT_LOW_U:
2428 ExpectedSrcVT = MVT::v4i32;
2430 case WebAssemblyISD::PROMOTE_LOW:
2431 ExpectedSrcVT = MVT::v4f32;
2437 auto Src = LHSSrcVec;
2438 if (LHSIndex != 0 || RHSIndex != 1 || LHSSrcVec != RHSSrcVec) {
2441 ExpectedSrcVT,
DL, LHSSrcVec, RHSSrcVec,
2442 {
static_cast<int>(LHSIndex),
static_cast<int>(RHSIndex) + 4, -1, -1});
2444 return DAG.
getNode(LHSOpcode,
DL, MVT::v2f64, Src);
2449 MVT VT =
Op.getSimpleValueType();
2450 if (VT == MVT::v8f16) {
2465 const EVT VecT =
Op.getValueType();
2466 const EVT LaneT =
Op.getOperand(0).getValueType();
2468 bool CanSwizzle = VecT == MVT::v16i8;
2489 auto GetSwizzleSrcs = [](
size_t I,
const SDValue &Lane) {
2493 const SDValue &SwizzleSrc = Lane->getOperand(0);
2494 const SDValue &IndexExt = Lane->getOperand(1);
2504 Index->getConstantOperandVal(1) !=
I)
2506 return std::make_pair(SwizzleSrc, SwizzleIndices);
2513 auto GetShuffleSrc = [&](
const SDValue &Lane) {
2518 if (Lane->getOperand(0).getValueType().getVectorNumElements() >
2521 return Lane->getOperand(0);
2524 using ValueEntry = std::pair<SDValue, size_t>;
2527 using SwizzleEntry = std::pair<std::pair<SDValue, SDValue>,
size_t>;
2530 using ShuffleEntry = std::pair<SDValue, size_t>;
2533 auto AddCount = [](
auto &Counts,
const auto &Val) {
2536 if (CountIt == Counts.end()) {
2537 Counts.emplace_back(Val, 1);
2543 auto GetMostCommon = [](
auto &Counts) {
2545 assert(CommonIt != Counts.end() &&
"Unexpected all-undef build_vector");
2549 size_t NumConstantLanes = 0;
2552 for (
size_t I = 0;
I < Lanes; ++
I) {
2557 AddCount(SplatValueCounts, Lane);
2561 if (
auto ShuffleSrc = GetShuffleSrc(Lane))
2562 AddCount(ShuffleCounts, ShuffleSrc);
2564 auto SwizzleSrcs = GetSwizzleSrcs(
I, Lane);
2565 if (SwizzleSrcs.first)
2566 AddCount(SwizzleCounts, SwizzleSrcs);
2571 size_t NumSplatLanes;
2572 std::tie(SplatValue, NumSplatLanes) = GetMostCommon(SplatValueCounts);
2576 size_t NumSwizzleLanes = 0;
2577 if (SwizzleCounts.
size())
2578 std::forward_as_tuple(std::tie(SwizzleSrc, SwizzleIndices),
2579 NumSwizzleLanes) = GetMostCommon(SwizzleCounts);
2583 SDValue ShuffleSrc1, ShuffleSrc2;
2584 size_t NumShuffleLanes = 0;
2585 if (ShuffleCounts.
size()) {
2586 std::tie(ShuffleSrc1, NumShuffleLanes) = GetMostCommon(ShuffleCounts);
2588 [&](
const auto &Pair) {
return Pair.first == ShuffleSrc1; });
2590 if (ShuffleCounts.
size()) {
2591 size_t AdditionalShuffleLanes;
2592 std::tie(ShuffleSrc2, AdditionalShuffleLanes) =
2593 GetMostCommon(ShuffleCounts);
2594 NumShuffleLanes += AdditionalShuffleLanes;
2599 std::function<bool(
size_t,
const SDValue &)> IsLaneConstructed;
2602 if (NumSwizzleLanes >= NumShuffleLanes &&
2603 NumSwizzleLanes >= NumConstantLanes && NumSwizzleLanes >= NumSplatLanes) {
2606 auto Swizzled = std::make_pair(SwizzleSrc, SwizzleIndices);
2607 IsLaneConstructed = [&, Swizzled](
size_t I,
const SDValue &Lane) {
2608 return Swizzled == GetSwizzleSrcs(
I, Lane);
2610 }
else if (NumShuffleLanes >= NumConstantLanes &&
2611 NumShuffleLanes >= NumSplatLanes) {
2621 assert(LaneSize > DestLaneSize);
2622 Scale1 = LaneSize / DestLaneSize;
2628 assert(LaneSize > DestLaneSize);
2629 Scale2 = LaneSize / DestLaneSize;
2634 assert(DestLaneCount <= 16);
2635 for (
size_t I = 0;
I < DestLaneCount; ++
I) {
2637 SDValue Src = GetShuffleSrc(Lane);
2638 if (Src == ShuffleSrc1) {
2640 }
else if (Src && Src == ShuffleSrc2) {
2646 ArrayRef<int> MaskRef(Mask, DestLaneCount);
2648 IsLaneConstructed = [&](size_t,
const SDValue &Lane) {
2649 auto Src = GetShuffleSrc(Lane);
2650 return Src == ShuffleSrc1 || (Src && Src == ShuffleSrc2);
2652 }
else if (NumConstantLanes >= NumSplatLanes) {
2654 for (
const SDValue &Lane :
Op->op_values()) {
2660 uint64_t LaneBits = 128 / Lanes;
2663 Const->getAPIntValue().trunc(LaneBits).getZExtValue(),
2664 SDLoc(Lane), LaneT));
2680 if (NumSplatLanes == 1 &&
Op->getOperand(0) == SplatValue &&
2681 (DestLaneSize == 32 || DestLaneSize == 64)) {
2688 IsLaneConstructed = [&SplatValue](
size_t _,
const SDValue &Lane) {
2689 return Lane == SplatValue;
2694 assert(IsLaneConstructed);
2697 for (
size_t I = 0;
I < Lanes; ++
I) {
2699 if (!Lane.
isUndef() && !IsLaneConstructed(
I, Lane))
2708WebAssemblyTargetLowering::LowerVECTOR_SHUFFLE(
SDValue Op,
2712 MVT VecType =
Op.getOperand(0).getSimpleValueType();
2723 for (
int M : Mask) {
2724 for (
size_t J = 0; J < LaneBytes; ++J) {
2728 uint64_t ByteIndex =
M == -1 ? J : (uint64_t)M * LaneBytes + J;
2733 return DAG.
getNode(WebAssemblyISD::SHUFFLE,
DL,
Op.getValueType(),
Ops);
2741 assert(
Op->getOperand(0)->getSimpleValueType(0) == MVT::v2i64);
2746 auto MakeLane = [&](
unsigned I) {
2752 {MakeLane(0), MakeLane(1)});
2756WebAssemblyTargetLowering::LowerAccessVectorElement(
SDValue Op,
2773 EVT LaneT =
Op.getSimpleValueType().getVectorElementType();
2775 if (LaneT.
bitsGE(MVT::i32))
2779 size_t NumLanes =
Op.getSimpleValueType().getVectorNumElements();
2781 unsigned ShiftOpcode =
Op.getOpcode();
2787 for (
size_t i = 0; i < NumLanes; ++i) {
2790 SDValue ShiftedValue = ShiftedElements[i];
2795 DAG.
getNode(ShiftOpcode,
DL, MVT::i32, ShiftedValue, MaskedShiftValue));
2805 assert(
Op.getSimpleValueType().isVector());
2807 uint64_t LaneBits =
Op.getValueType().getScalarSizeInBits();
2808 auto ShiftVal =
Op.getOperand(1);
2811 auto SkipImpliedMask = [](
SDValue MaskOp, uint64_t MaskBits) {
2822 MaskVal == MaskBits)
2829 if (ConstantRHS && ConstantRHS->getAPIntValue() == MaskBits)
2837 ShiftVal = SkipImpliedMask(ShiftVal, LaneBits - 1);
2843 ShiftVal = SkipImpliedMask(ShiftVal, LaneBits - 1);
2848 switch (
Op.getOpcode()) {
2850 Opcode = WebAssemblyISD::VEC_SHL;
2853 Opcode = WebAssemblyISD::VEC_SHR_S;
2856 Opcode = WebAssemblyISD::VEC_SHR_U;
2862 return DAG.
getNode(Opcode,
DL,
Op.getValueType(),
Op.getOperand(0), ShiftVal);
2867 EVT ResT =
Op.getValueType();
2870 if ((ResT == MVT::i32 || ResT == MVT::i64) &&
2871 (SatVT == MVT::i32 || SatVT == MVT::i64))
2874 if (ResT == MVT::v4i32 && SatVT == MVT::i32)
2877 if (ResT == MVT::v8i16 && SatVT == MVT::i16)
2884 return (
Op->getFlags().hasNoNaNs() ||
2887 (
Op->getFlags().hasNoSignedZeros() ||
2895 return DAG.
getNode(WebAssemblyISD::RELAXED_FMIN, SDLoc(
Op),
2896 Op.getValueType(),
Op.getOperand(0),
Op.getOperand(1));
2904 return DAG.
getNode(WebAssemblyISD::RELAXED_FMAX, SDLoc(
Op),
2905 Op.getValueType(),
Op.getOperand(0),
Op.getOperand(1));
2915 auto &DAG = DCI.
DAG;
2922 SDValue Bitcast =
N->getOperand(0);
2925 if (!
N->getOperand(1).isUndef())
2927 SDValue CastOp = Bitcast.getOperand(0);
2929 EVT DstType = Bitcast.getValueType();
2930 if (!SrcType.is128BitVector() ||
2931 SrcType.getVectorNumElements() != DstType.getVectorNumElements())
2934 SrcType,
SDLoc(
N), CastOp, DAG.
getUNDEF(SrcType), Shuffle->getMask());
2944 auto &DAG = DCI.
DAG;
2948 EVT InVT =
N->getOperand(0)->getValueType(0);
2949 EVT ResVT =
N->getValueType(0);
2951 if (ResVT == MVT::v4f32 && (InVT == MVT::v4i16 || InVT == MVT::v4i8))
2953 else if (ResVT == MVT::v2f64 && (InVT == MVT::v2i16 || InVT == MVT::v2i8))
2967 auto &DAG = DCI.
DAG;
2971 EVT VT =
N->getValueType(0);
2985 auto &DAG = DCI.
DAG;
2991 auto Extract =
N->getOperand(0);
2996 if (IndexNode ==
nullptr)
2998 auto Index = IndexNode->getZExtValue();
3002 EVT ResVT =
N->getValueType(0);
3003 if (ResVT == MVT::v8i16) {
3005 Source.getValueType() != MVT::v16i8 || (Index != 0 && Index != 8))
3007 }
else if (ResVT == MVT::v4i32) {
3009 Source.getValueType() != MVT::v8i16 || (Index != 0 && Index != 4))
3011 }
else if (ResVT == MVT::v2i64) {
3013 Source.getValueType() != MVT::v4i32 || (Index != 0 && Index != 2))
3020 bool IsLow = Index == 0;
3022 unsigned Op = IsSext ? (IsLow ? WebAssemblyISD::EXTEND_LOW_S
3023 : WebAssemblyISD::EXTEND_HIGH_S)
3024 : (IsLow ? WebAssemblyISD::EXTEND_LOW_U
3025 : WebAssemblyISD::EXTEND_HIGH_U);
3032 auto &DAG = DCI.
DAG;
3034 auto GetWasmConversionOp = [](
unsigned Op) {
3037 return WebAssemblyISD::TRUNC_SAT_ZERO_S;
3039 return WebAssemblyISD::TRUNC_SAT_ZERO_U;
3041 return WebAssemblyISD::DEMOTE_ZERO;
3046 auto IsZeroSplat = [](
SDValue SplatVal) {
3048 APInt SplatValue, SplatUndef;
3049 unsigned SplatBitSize;
3054 Splat->isConstantSplat(SplatValue, SplatUndef, SplatBitSize,
3072 EVT ExpectedConversionType;
3075 switch (ConversionOp) {
3079 ExpectedConversionType = MVT::v2i32;
3083 ExpectedConversionType = MVT::v2f32;
3089 if (
N->getValueType(0) != ResVT)
3092 if (
Conversion.getValueType() != ExpectedConversionType)
3096 if (Source.getValueType() != MVT::v2f64)
3099 if (!IsZeroSplat(
N->getOperand(1)) ||
3100 N->getOperand(1).getValueType() != ExpectedConversionType)
3103 unsigned Op = GetWasmConversionOp(ConversionOp);
3119 auto ConversionOp =
N->getOpcode();
3120 switch (ConversionOp) {
3132 if (
N->getValueType(0) != ResVT)
3135 auto Concat =
N->getOperand(0);
3136 if (
Concat.getValueType() != MVT::v4f64)
3139 auto Source =
Concat.getOperand(0);
3140 if (Source.getValueType() != MVT::v2f64)
3143 if (!IsZeroSplat(
Concat.getOperand(1)) ||
3144 Concat.getOperand(1).getValueType() != MVT::v2f64)
3147 unsigned Op = GetWasmConversionOp(ConversionOp);
3153 const SDLoc &
DL,
unsigned VectorWidth) {
3161 unsigned ElemsPerChunk = VectorWidth / ElVT.
getSizeInBits();
3166 IdxVal &= ~(ElemsPerChunk - 1);
3171 Vec->
ops().slice(IdxVal, ElemsPerChunk));
3183 EVT SrcVT = In.getValueType();
3201 EVT InVT = MVT::i16, OutVT = MVT::i8;
3206 unsigned SubSizeInBits = SrcSizeInBits / 2;
3208 OutVT =
EVT::getVectorVT(Ctx, OutVT, SubSizeInBits / OutVT.getSizeInBits());
3234 auto &DAG = DCI.
DAG;
3237 EVT InVT = In.getValueType();
3241 EVT OutVT =
N->getValueType(0);
3248 if (!((InSVT == MVT::i16 || InSVT == MVT::i32 || InSVT == MVT::i64) &&
3249 (OutSVT == MVT::i8 || OutSVT == MVT::i16) && OutVT.
is128BitVector()))
3262 auto &DAG = DCI.
DAG;
3265 EVT VT =
N->getValueType(0);
3266 EVT SrcVT = Src.getValueType();
3277 if (NumElts == 2 || NumElts == 4 || NumElts == 8 || NumElts == 16) {
3280 {DAG.getConstant(Intrinsic::wasm_bitmask, DL, MVT::i32),
3281 DAG.getSExtOrTrunc(N->getOperand(0), DL,
3282 SrcVT.changeVectorElementType(
3283 *DAG.getContext(), Width))}),
3288 if (NumElts == 32 || NumElts == 64) {
3314 MVT ReturnType = VectorsToShuffle.
size() == 2 ? MVT::i32 : MVT::i64;
3317 for (
SDValue V : VectorsToShuffle) {
3318 ReturningInteger = DAG.
getNode(
3327 return ReturningInteger;
3342 if (
N->getNumOperands() < 2 ||
3346 EVT LT =
LHS.getValueType();
3347 if (LT.getScalarSizeInBits() > 128 / LT.getVectorNumElements())
3350 auto CombineSetCC = [&
N, &DAG](Intrinsic::WASMIntrinsics InPre,
3352 Intrinsic::WASMIntrinsics InPost) {
3353 if (
N->getConstantOperandVal(0) != InPre)
3364 {DAG.getConstant(InPost, DL, MVT::i32), LHS}),
3367 Ret = DAG.
getNOT(
DL, Ret, MVT::i1);
3372 Intrinsic::wasm_alltrue))
3375 Intrinsic::wasm_anytrue))
3378 Intrinsic::wasm_anytrue))
3381 Intrinsic::wasm_alltrue))
3387template <
int MatchRHS,
ISD::CondCode MatchCond,
bool RequiresNegate,
3402 {DAG.getConstant(Intrin, DL, MVT::i32),
3403 DAG.getSExtOrTrunc(LHS->getOperand(0), DL, VecVT)}),
3406 Ret = DAG.
getNOT(
DL, Ret, MVT::i1);
3419 EVT VT =
N->getValueType(0);
3420 EVT OpVT =
X.getValueType();
3424 Attribute::NoImplicitFloat))
3430 !Subtarget->
hasSIMD128() || !isIntEqualitySetCC(CC))
3434 auto IsVectorBitCastCheap = [](
SDValue X) {
3439 if (!IsVectorBitCastCheap(
X) || !IsVectorBitCastCheap(
Y))
3449 : Intrinsic::wasm_anytrue,
3463 EVT VT =
N->getValueType(0);
3474 EVT FromVT =
LHS->getOperand(0).getValueType();
3479 if (NumElts != 2 && NumElts != 4 && NumElts != 8 && NumElts != 16)
3485 auto &DAG = DCI.
DAG;
3516 EVT VT =
N->getValueType(0);
3517 if (VT != MVT::v8i32 && VT != MVT::v16i32)
3523 if (
LHS.getOpcode() !=
RHS.getOpcode())
3530 if (
LHS->getOperand(0).getValueType() !=
RHS->getOperand(0).getValueType())
3533 EVT FromVT =
LHS->getOperand(0).getValueType();
3535 if (EltTy != MVT::i8)
3563 unsigned ExtendLowOpc =
3564 IsSigned ? WebAssemblyISD::EXTEND_LOW_S : WebAssemblyISD::EXTEND_LOW_U;
3565 unsigned ExtendHighOpc =
3566 IsSigned ? WebAssemblyISD::EXTEND_HIGH_S : WebAssemblyISD::EXTEND_HIGH_U;
3568 auto GetExtendLow = [&DAG, &
DL, &ExtendLowOpc](
EVT VT,
SDValue Op) {
3575 if (NumElts == 16) {
3576 SDValue LowLHS = GetExtendLow(MVT::v8i16, ExtendInLHS);
3577 SDValue LowRHS = GetExtendLow(MVT::v8i16, ExtendInRHS);
3583 GetExtendLow(MVT::v4i32, MulLow),
3585 GetExtendLow(MVT::v4i32, MulHigh),
3594 SDValue Lo = GetExtendLow(MVT::v4i32, MulLow);
3604 EVT VT =
N->getValueType(0);
3613 if (VT != MVT::v8i8 && VT != MVT::v16i8)
3620 EVT MulVT = MVT::v8i16;
3622 if (VT == MVT::v8i8) {
3628 DAG.
getNode(WebAssemblyISD::EXTEND_LOW_U,
DL, MulVT, PromotedLHS);
3630 DAG.
getNode(WebAssemblyISD::EXTEND_LOW_U,
DL, MulVT, PromotedRHS);
3635 MVT::v16i8,
DL, MulLow, DAG.
getUNDEF(MVT::v16i8),
3636 {0, 2, 4, 6, 8, 10, 12, 14, -1, -1, -1, -1, -1, -1, -1, -1});
3639 assert(VT == MVT::v16i8 &&
"Expected v16i8");
3643 DAG.
getNode(WebAssemblyISD::EXTEND_HIGH_U,
DL, MulVT,
LHS);
3645 DAG.
getNode(WebAssemblyISD::EXTEND_HIGH_U,
DL, MulVT,
RHS);
3654 VT,
DL, MulLow, MulHigh,
3655 {0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30});
3663 EVT InVT = In.getValueType();
3668 if (NumElems < RequiredNumElems) {
3675 EVT OutVT =
N->getValueType(0);
3680 if (OutElTy != MVT::i8 && OutElTy != MVT::i16)
3687 EVT FPVT =
N->getOperand(0)->getValueType(0);
3705 EVT NarrowedVT = OutElTy == MVT::i8 ? MVT::v16i8 : MVT::v8i16;
3718WebAssemblyTargetLowering::PerformDAGCombine(
SDNode *
N,
3719 DAGCombinerInfo &DCI)
const {
3720 switch (
N->getOpcode()) {
unsigned const MachineRegisterInfo * MRI
static SDValue performMulCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const AArch64Subtarget *Subtarget)
static SDValue performTruncateCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI)
static SDValue performSETCCCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI, SelectionDAG &DAG)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis false
Function Alias Analysis Results
static void fail(const SDLoc &DL, SelectionDAG &DAG, const Twine &Msg, SDValue Val={})
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
const HexagonInstrInfo * TII
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
Register const TargetRegisterInfo * TRI
Promote Memory to Register
MachineInstr unsigned OpIdx
static SDValue performVECTOR_SHUFFLECombine(SDNode *N, SelectionDAG &DAG, const RISCVSubtarget &Subtarget, const RISCVTargetLowering &TLI)
static SDValue combineVectorSizedSetCCEquality(EVT VT, SDValue X, SDValue Y, ISD::CondCode CC, const SDLoc &DL, SelectionDAG &DAG, const RISCVSubtarget &Subtarget)
Try to map an integer comparison with size > XLEN to vector instructions before type legalization spl...
const SmallVectorImpl< MachineOperand > & Cond
Contains matchers for matching SelectionDAG nodes and values.
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")
static MachineBasicBlock * LowerFPToInt(MachineInstr &MI, DebugLoc DL, MachineBasicBlock *BB, const TargetInstrInfo &TII, bool IsUnsigned, bool Int64, bool Float64, unsigned LoweredOpcode)
static bool callingConvSupported(CallingConv::ID CallConv)
static SDValue TryWideExtMulCombine(SDNode *N, SelectionDAG &DAG)
static MachineBasicBlock * LowerMemcpy(MachineInstr &MI, DebugLoc DL, MachineBasicBlock *BB, const TargetInstrInfo &TII, bool Int64)
static std::optional< unsigned > IsWebAssemblyLocal(SDValue Op, SelectionDAG &DAG)
static SDValue performVectorExtendCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
static SDValue performVectorNonNegToFPCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
static SDValue unrollVectorShift(SDValue Op, SelectionDAG &DAG)
static SDValue performAnyAllCombine(SDNode *N, SelectionDAG &DAG)
static MachineBasicBlock * LowerCallResults(MachineInstr &CallResults, DebugLoc DL, MachineBasicBlock *BB, const WebAssemblySubtarget *Subtarget, const TargetInstrInfo &TII)
static SDValue TryMatchTrue(SDNode *N, EVT VecVT, SelectionDAG &DAG)
static SDValue GetExtendHigh(SDValue Op, unsigned UserOpc, EVT VT, SelectionDAG &DAG)
SDValue performConvertFPCombine(SDNode *N, SelectionDAG &DAG)
static SDValue performVectorTruncZeroCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
static bool IsWebAssemblyGlobal(SDValue Op)
static MachineBasicBlock * LowerMemset(MachineInstr &MI, DebugLoc DL, MachineBasicBlock *BB, const TargetInstrInfo &TII, bool Int64)
static bool HasNoSignedZerosOrNaNs(SDValue Op, SelectionDAG &DAG)
SDValue DoubleVectorWidth(SDValue In, unsigned RequiredNumElems, SelectionDAG &DAG)
static SDValue performVectorExtendToFPCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
Convert ({u,s}itofp vec) --> ({u,s}itofp ({s,z}ext vec)) so it doesn't get split up into scalar instr...
static SDValue LowerConvertLow(SDValue Op, SelectionDAG &DAG)
static SDValue extractSubVector(SDValue Vec, unsigned IdxVal, SelectionDAG &DAG, const SDLoc &DL, unsigned VectorWidth)
static SDValue performBitcastCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
static SDValue truncateVectorWithNARROW(EVT DstVT, SDValue In, const SDLoc &DL, SelectionDAG &DAG)
This file defines the interfaces that WebAssembly uses to lower LLVM code into a selection DAG.
This file provides WebAssembly-specific target descriptions.
This file declares WebAssembly-specific per-machine-function information.
This file declares the WebAssembly-specific subclass of TargetSubtarget.
This file declares the WebAssembly-specific subclass of TargetMachine.
This file contains the declaration of the WebAssembly-specific type parsing utility functions.
This file contains the declaration of the WebAssembly-specific utility functions.
static constexpr int Concat[]
Class for arbitrary precision integers.
void setBitsFrom(unsigned loBit)
Set the top bits starting from loBit.
static APInt getLowBitsSet(unsigned numBits, unsigned loBitsSet)
Constructs an APInt value that has the bottom loBitsSet bits set.
static APInt getHighBitsSet(unsigned numBits, unsigned hiBitsSet)
Constructs an APInt value that has the top hiBitsSet bits set.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
an instruction that atomically reads a memory location, combines it with another value,...
BinOp getOperation() const
LLVM Basic Block Representation.
static CCValAssign getMem(unsigned ValNo, MVT ValVT, int64_t Offset, MVT LocVT, LocInfo HTP, bool IsCustom=false)
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
uint64_t getNumOperands() const
A parsed version of the target data layout string in and methods for querying it.
Diagnostic information for unsupported feature in backend.
This is a fast-path instruction selection class that generates poor code and doesn't support illegal ...
FunctionLoweringInfo - This contains information that is global to a function that is used when lower...
FunctionType * getFunctionType() const
Returns the FunctionType for me.
LLVMContext & getContext() const
getContext - Return a reference to the LLVMContext associated with this function.
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
int64_t getOffset() const
LLVM_ABI unsigned getAddressSpace() const
unsigned getTargetFlags() const
const GlobalValue * getGlobal() const
ThreadLocalMode getThreadLocalMode() const
Type * getValueType() const
unsigned getTargetFlags() const
This is an important class for using LLVM in a threaded context.
LLVM_ABI void diagnose(const DiagnosticInfo &DI)
Report a message to the currently installed diagnostic handler.
Tracks which library functions to use for a particular subtarget.
const SDValue & getBasePtr() const
const SDValue & getOffset() const
Describe properties that are true of each instruction in the target description file.
bool is128BitVector() const
Return true if this is a 128-bit vector type.
@ INVALID_SIMPLE_VALUE_TYPE
static auto integer_fixedlen_vector_valuetypes()
MVT changeVectorElementType(MVT EltVT) const
Return a VT for a vector type whose attributes match ourselves with the exception of the element type...
unsigned getVectorNumElements() const
bool isVector() const
Return true if this is a vector value type.
bool isInteger() const
Return true if this is an integer or a vector integer type.
static auto integer_valuetypes()
TypeSize getSizeInBits() const
Returns the size of the specified MVT in bits.
static auto fixedlen_vector_valuetypes()
bool isFixedLengthVector() const
static MVT getVectorVT(MVT VT, unsigned NumElements)
MVT getVectorElementType() const
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
static MVT getIntegerVT(unsigned BitWidth)
LLVM_ABI void transferSuccessorsAndUpdatePHIs(MachineBasicBlock *FromMBB)
Transfers all the successors, as in transferSuccessors, and update PHI operands in the successor bloc...
LLVM_ABI instr_iterator insert(instr_iterator I, MachineInstr *M)
Insert MI into the instruction list before I, possibly inside a bundle.
const BasicBlock * getBasicBlock() const
Return the LLVM basic block that this instance corresponded to originally.
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
iterator insertAfter(iterator I, MachineInstr *MI)
Insert MI into the instruction list after I.
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
LLVM_ABI int CreateStackObject(uint64_t Size, Align Alignment, bool isSpillSlot, const AllocaInst *Alloca=nullptr, uint8_t ID=0)
Create a new statically sized stack object, returning a nonnegative identifier to represent it.
void setFrameAddressIsTaken(bool T)
unsigned getFunctionNumber() const
getFunctionNumber - Return a unique ID for the current function.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
const char * createExternalSymbolName(StringRef Name)
Allocate a string and populate it with the given external symbol name.
MCContext & getContext() const
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
const DataLayout & getDataLayout() const
Return the DataLayout attached to the Module associated to this MF.
Function & getFunction()
Return the LLVM function that this machine code represents.
BasicBlockListType::iterator iterator
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
const MachineJumpTableInfo * getJumpTableInfo() const
getJumpTableInfo - Return the jump table info object for the current function.
const MachineInstrBuilder & addReg(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & add(const MachineOperand &MO) const
const MachineInstrBuilder & addSym(MCSymbol *Sym, unsigned char TargetFlags=0) const
const MachineInstrBuilder & addFPImm(const ConstantFP *Val) const
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
MachineInstr * getInstr() const
If conversion operators fail, use this method to get the MachineInstr explicitly.
Representation of each machine instruction.
mop_range defs()
Returns all explicit operands that are register definitions.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
LLVM_ABI void addOperand(MachineFunction &MF, const MachineOperand &Op)
Add the specified operand to the instruction.
mop_range uses()
Returns all operands which may be register uses.
LLVM_ABI void eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
LLVM_ABI void removeOperand(unsigned OpNo)
Erase an operand from an instruction, leaving it with one fewer operand than it started with.
const MachineOperand & getOperand(unsigned i) const
const std::vector< MachineJumpTableEntry > & getJumpTables() const
Flags
Flags values. These may be or'd together.
@ MOVolatile
The memory access is volatile.
@ MOLoad
The memory access reads data.
@ MOStore
The memory access writes data.
MachineOperand class - Representation of each machine instruction operand.
bool isReg() const
isReg - Tests if this is a MO_Register operand.
void setIsKill(bool Val=true)
Register getReg() const
getReg - Returns the register number.
bool isFI() const
isFI - Tests if this is a MO_FrameIndex operand.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLVM_ABI Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
void addLiveIn(MCRegister Reg, Register vreg=Register())
addLiveIn - Add the specified register as a live-in.
unsigned getAddressSpace() const
Return the address space for the associated pointer.
MachineMemOperand * getMemOperand() const
Return the unique MachineMemOperand object describing the memory reference performed by operation.
const SDValue & getChain() const
EVT getMemoryVT() const
Return the type of the in-memory value.
static PointerType * getUnqual(Type *ElementType)
This constructs a pointer to an object of the specified type in the default address space (address sp...
Wrapper class representing virtual and physical registers.
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Represents one node in the SelectionDAG.
ArrayRef< SDUse > ops() const
unsigned getOpcode() const
Return the SelectionDAG opcode value for this node.
uint64_t getAsZExtVal() const
Helper method returns the zero-extended integer value of a ConstantSDNode.
const SDValue & getOperand(unsigned Num) const
uint64_t getConstantOperandVal(unsigned Num) const
Helper method returns the integer value of a ConstantSDNode operand.
EVT getValueType(unsigned ResNo) const
Return the type of a specified result.
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
SDNode * getNode() const
get the SDNode which holds the desired result
SDValue getValue(unsigned R) const
EVT getValueType() const
Return the ValueType of the referenced return value.
const SDValue & getOperand(unsigned i) const
MVT getSimpleValueType() const
Return the simple ValueType of the referenced return value.
unsigned getOpcode() const
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
SDValue getTargetGlobalAddress(const GlobalValue *GV, const SDLoc &DL, EVT VT, int64_t offset=0, unsigned TargetFlags=0)
SDValue getCopyToReg(SDValue Chain, const SDLoc &dl, Register Reg, SDValue N)
LLVM_ABI SDValue getMergeValues(ArrayRef< SDValue > Ops, const SDLoc &dl)
Create a MERGE_VALUES node from the given operands.
LLVM_ABI SDVTList getVTList(EVT VT)
Return an SDVTList that represents the list of values specified.
LLVM_ABI SDValue getShiftAmountConstant(uint64_t Val, EVT VT, const SDLoc &DL)
LLVM_ABI SDValue getSplatValue(SDValue V, bool LegalTypes=false)
If V is a splat vector, return its scalar source operand by extracting that element from the source v...
LLVM_ABI MachineSDNode * getMachineNode(unsigned Opcode, const SDLoc &dl, EVT VT)
These are used for target selectors to create a new node with specified return type(s),...
LLVM_ABI void ExtractVectorElements(SDValue Op, SmallVectorImpl< SDValue > &Args, unsigned Start=0, unsigned Count=0, EVT EltVT=EVT())
Append the extracted elements from Start to Count out of the vector Op in Args.
LLVM_ABI SDValue UnrollVectorOp(SDNode *N, unsigned ResNE=0)
Utility function used by legalize and lowering to "unroll" a vector operation by splitting out the sc...
LLVM_ABI SDValue getConstantFP(double Val, const SDLoc &DL, EVT VT, bool isTarget=false)
Create a ConstantFPSDNode wrapping a constant value.
LLVM_ABI SDValue getMemIntrinsicNode(unsigned Opcode, const SDLoc &dl, SDVTList VTList, ArrayRef< SDValue > Ops, EVT MemVT, MachinePointerInfo PtrInfo, Align Alignment, MachineMemOperand::Flags Flags=MachineMemOperand::MOLoad|MachineMemOperand::MOStore, LocationSize Size=LocationSize::precise(0), const AAMDNodes &AAInfo=AAMDNodes())
Creates a MemIntrinsicNode that may produce a result and takes a list of operands.
SDValue getSetCC(const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, ISD::CondCode Cond, SDValue Chain=SDValue(), bool IsSignaling=false, SDNodeFlags Flags={})
Helper function to make it easier to build SetCC's if you just have an ISD::CondCode instead of an SD...
LLVM_ABI SDValue getMemcpy(SDValue Chain, const SDLoc &dl, SDValue Dst, SDValue Src, SDValue Size, Align Alignment, bool isVol, bool AlwaysInline, const CallInst *CI, std::optional< bool > OverrideTailCall, MachinePointerInfo DstPtrInfo, MachinePointerInfo SrcPtrInfo, const AAMDNodes &AAInfo=AAMDNodes(), BatchAAResults *BatchAA=nullptr)
LLVM_ABI SDValue getNOT(const SDLoc &DL, SDValue Val, EVT VT)
Create a bitwise NOT operation as (XOR Val, -1).
SDValue getTargetJumpTable(int JTI, EVT VT, unsigned TargetFlags=0)
SDValue getUNDEF(EVT VT)
Return an UNDEF node. UNDEF does not have a useful SDLoc.
SDValue getBuildVector(EVT VT, const SDLoc &DL, ArrayRef< SDValue > Ops)
Return an ISD::BUILD_VECTOR node.
LLVM_ABI SDValue getBitcast(EVT VT, SDValue V)
Return a bitcast using the SDLoc of the value operand, and casting to the provided type.
SDValue getCopyFromReg(SDValue Chain, const SDLoc &dl, Register Reg, EVT VT)
const DataLayout & getDataLayout() const
SDValue getTargetFrameIndex(int FI, EVT VT)
LLVM_ABI SDValue getConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
Create a ConstantSDNode wrapping a constant value.
LLVM_ABI SDValue getStore(SDValue Chain, const SDLoc &dl, SDValue Val, SDValue Ptr, MachinePointerInfo PtrInfo, Align Alignment, MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes())
Helper function to build ISD::STORE nodes.
LLVM_ABI bool SignBitIsZero(SDValue Op, unsigned Depth=0) const
Return true if the sign bit of Op is known to be zero.
LLVM_ABI SDValue getBasicBlock(MachineBasicBlock *MBB)
const TargetMachine & getTarget() const
LLVM_ABI SDValue getAnyExtOrTrunc(SDValue Op, const SDLoc &DL, EVT VT)
Convert Op, which must be of integer type, to the integer type VT, by either any-extending or truncat...
LLVM_ABI bool isKnownNeverZeroFloat(SDValue Op) const
Test whether the given floating point SDValue is known to never be positive or negative zero.
LLVM_ABI SDValue getIntPtrConstant(uint64_t Val, const SDLoc &DL, bool isTarget=false)
LLVM_ABI SDValue getValueType(EVT)
LLVM_ABI SDValue getNode(unsigned Opcode, const SDLoc &DL, EVT VT, ArrayRef< SDUse > Ops)
Gets or creates the specified node.
LLVM_ABI bool isKnownNeverNaN(SDValue Op, const APInt &DemandedElts, bool SNaN=false, unsigned Depth=0) const
Test whether the given SDValue (or all elements of it, if it is a vector) is known to never be NaN in...
SDValue getTargetConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isOpaque=false)
MachineFunction & getMachineFunction() const
SDValue getPOISON(EVT VT)
Return a POISON node. POISON does not have a useful SDLoc.
SDValue getSplatBuildVector(EVT VT, const SDLoc &DL, SDValue Op)
Return a splat ISD::BUILD_VECTOR node, consisting of Op splatted to all elements.
LLVM_ABI SDValue getFrameIndex(int FI, EVT VT, bool isTarget=false)
LLVM_ABI SDValue getZExtOrTrunc(SDValue Op, const SDLoc &DL, EVT VT)
Convert Op, which must be of integer type, to the integer type VT, by either zero-extending or trunca...
LLVMContext * getContext() const
LLVM_ABI SDValue getTargetExternalSymbol(const char *Sym, EVT VT, unsigned TargetFlags=0)
LLVM_ABI SDValue getMCSymbol(MCSymbol *Sym, EVT VT)
SDValue getEntryNode() const
Return the token chain corresponding to the entry of the function.
LLVM_ABI SDValue getVectorShuffle(EVT VT, const SDLoc &dl, SDValue N1, SDValue N2, ArrayRef< int > Mask)
Return an ISD::VECTOR_SHUFFLE node.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
const SDValue & getBasePtr() const
const SDValue & getOffset() const
const SDValue & getValue() const
StringRef - Represent a constant reference to a string, i.e.
constexpr size_t size() const
size - Get the string size.
TargetInstrInfo - Interface to description of machine instruction set.
Provides information about what library functions are available for the current target.
void setBooleanVectorContents(BooleanContent Ty)
Specify how the target extends the result of a vector boolean value from a vector of i1 to a wider ty...
void setOperationAction(unsigned Op, MVT VT, LegalizeAction Action)
Indicate that the specified operation does not work with the specified type and indicate what to do a...
virtual const TargetRegisterClass * getRegClassFor(MVT VT, bool isDivergent=false) const
Return the register class that should be used for the specified value type.
const TargetMachine & getTargetMachine() const
unsigned MaxLoadsPerMemcmp
Specify maximum number of load instructions per memcmp call.
LegalizeTypeAction
This enum indicates whether a types are legal for a target, and if not, what action should be used to...
void setMaxAtomicSizeInBitsSupported(unsigned SizeInBits)
Set the maximum atomic operation size supported by the backend.
virtual TargetLoweringBase::LegalizeTypeAction getPreferredVectorAction(MVT VT) const
Return the preferred vector type legalization action.
void setBooleanContents(BooleanContent Ty)
Specify how the target extends the result of integer and floating point boolean values from i1 to a w...
void computeRegisterProperties(const TargetRegisterInfo *TRI)
Once all of the register classes are added, this allows us to compute derived properties we expose.
void addRegisterClass(MVT VT, const TargetRegisterClass *RC)
Add the specified register class as an available regclass for the specified value type.
virtual MVT getPointerTy(const DataLayout &DL, uint32_t AS=0) const
Return the pointer type for the given address space, defaults to the pointer type from the data layou...
void setMinimumJumpTableEntries(unsigned Val)
Indicate the minimum number of blocks to generate jump tables.
void setPartialReduceMLAAction(unsigned Opc, MVT AccVT, MVT InputVT, LegalizeAction Action)
Indicate how a PARTIAL_REDUCE_U/SMLA node with Acc type AccVT and Input type InputVT should be treate...
void setTruncStoreAction(MVT ValVT, MVT MemVT, LegalizeAction Action)
Indicate that the specified truncating store does not work with the specified type and indicate what ...
@ ZeroOrOneBooleanContent
@ ZeroOrNegativeOneBooleanContent
unsigned MaxLoadsPerMemcmpOptSize
Likewise for functions with the OptSize attribute.
virtual bool isBinOp(unsigned Opcode) const
Return true if the node is a math/logic binary operator.
void setStackPointerRegisterToSaveRestore(Register R)
If set to a physical register, this specifies the register that llvm.savestack/llvm....
AtomicExpansionKind
Enum that specifies what an atomic load/AtomicRMWInst is expanded to, if at all.
void setCondCodeAction(ArrayRef< ISD::CondCode > CCs, MVT VT, LegalizeAction Action)
Indicate that the specified condition code is or isn't supported on the target and indicate what to d...
void setTargetDAGCombine(ArrayRef< ISD::NodeType > NTs)
Targets should invoke this method for each target independent node that they want to provide a custom...
void setLoadExtAction(unsigned ExtType, MVT ValVT, MVT MemVT, LegalizeAction Action)
Indicate that the specified load with extension does not work with the specified type and indicate wh...
virtual MVT getPointerMemTy(const DataLayout &DL, uint32_t AS=0) const
Return the in-memory pointer type for the given address space, defaults to the pointer type from the ...
void setSchedulingPreference(Sched::Preference Pref)
Specify the target scheduling preference.
bool isOperationLegalOrCustomOrPromote(unsigned Op, EVT VT, bool LegalOnly=false) const
Return true if the specified operation is legal on this target or can be made legal with custom lower...
bool isPositionIndependent() const
virtual std::pair< unsigned, const TargetRegisterClass * > getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const
Given a physical register constraint (e.g.
TargetLowering(const TargetLowering &)=delete
virtual bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const
Return true if folding a constant offset with the given GlobalAddress is legal.
std::pair< SDValue, SDValue > makeLibCall(SelectionDAG &DAG, RTLIB::LibcallImpl LibcallImpl, EVT RetVT, ArrayRef< SDValue > Ops, MakeLibCallOptions CallOptions, const SDLoc &dl, SDValue Chain=SDValue()) const
Returns a pair of (return value, chain).
Primary interface to the complete machine description for the target machine.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
The instances of the Type class are immutable: once they are created, they are never changed.
bool isFunctionTy() const
True if this is an instance of FunctionType.
static LLVM_ABI Type * getDoubleTy(LLVMContext &C)
static LLVM_ABI Type * getFloatTy(LLVMContext &C)
A Use represents the edge between a Value definition and its users.
LLVM_ABI const Value * stripPointerCastsAndAliases() const
Strip off pointer casts, all-zero GEPs, address space casts, and aliases.
static std::optional< unsigned > getLocalForStackObject(MachineFunction &MF, int FrameIndex)
bool hasCallIndirectOverlong() const
bool hasReferenceTypes() const
WebAssemblyTargetLowering(const TargetMachine &TM, const WebAssemblySubtarget &STI)
MVT getPointerTy(const DataLayout &DL, uint32_t AS=0) const override
Return the pointer type for the given address space, defaults to the pointer type from the data layou...
MVT getPointerMemTy(const DataLayout &DL, uint32_t AS=0) const override
Return the in-memory pointer type for the given address space, defaults to the pointer type from the ...
self_iterator getIterator()
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
@ Swift
Calling convention for Swift.
@ PreserveMost
Used for runtime calls that preserves most registers.
@ CXX_FAST_TLS
Used for access functions.
@ WASM_EmscriptenInvoke
For emscripten __invoke_* functions.
@ Cold
Attempts to make code in the caller as efficient as possible under the assumption that the call is no...
@ PreserveAll
Used for runtime calls that preserves (almost) all registers.
@ Fast
Attempts to make calls as fast as possible (e.g.
@ C
The default llvm calling convention, compatible with C.
@ SETCC
SetCC operator - This evaluates to a true value iff the condition is true.
@ STACKRESTORE
STACKRESTORE has two operands, an input chain and a pointer to restore to it returns an output chain.
@ STACKSAVE
STACKSAVE - STACKSAVE has one operand, an input chain.
@ PARTIAL_REDUCE_SMLA
PARTIAL_REDUCE_[U|S]MLA(Accumulator, Input1, Input2) The partial reduction nodes sign or zero extend ...
@ SMUL_LOHI
SMUL_LOHI/UMUL_LOHI - Multiply two integers of type iN, producing a signed/unsigned value of type i[2...
@ BSWAP
Byte Swap and Counting operators.
@ VAEND
VAEND, VASTART - VAEND and VASTART have three operands: an input chain, pointer, and a SRCVALUE.
@ ADDC
Carry-setting nodes for multiple precision addition and subtraction.
@ ADD
Simple integer binary arithmetic operators.
@ LOAD
LOAD and STORE have token chains as their first operand, then the same operands as an LLVM load/store...
@ FMA
FMA - Perform a * b + c with no intermediate rounding step.
@ INTRINSIC_VOID
OUTCHAIN = INTRINSIC_VOID(INCHAIN, INTRINSICID, arg1, arg2, ...) This node represents a target intrin...
@ SINT_TO_FP
[SU]INT_TO_FP - These operators convert integers (whose interpreted sign depends on the first letter)...
@ CONCAT_VECTORS
CONCAT_VECTORS(VECTOR0, VECTOR1, ...) - Given a number of values of vector type with the same length ...
@ ABS
ABS - Determine the unsigned absolute value of a signed integer value of the same bitwidth.
@ SIGN_EXTEND_VECTOR_INREG
SIGN_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register sign-extension of the low ...
@ SDIVREM
SDIVREM/UDIVREM - Divide two integers and produce both a quotient and remainder result.
@ FP16_TO_FP
FP16_TO_FP, FP_TO_FP16 - These operators are used to perform promotions and truncation for half-preci...
@ FMULADD
FMULADD - Performs a * b + c, with, or without, intermediate rounding.
@ BITCAST
BITCAST - This operator converts between integer, vector and FP values, as if the value was stored to...
@ BUILD_PAIR
BUILD_PAIR - This is the opposite of EXTRACT_ELEMENT in some ways.
@ BUILTIN_OP_END
BUILTIN_OP_END - This must be the last enum value in this list.
@ SIGN_EXTEND
Conversion operators.
@ SCALAR_TO_VECTOR
SCALAR_TO_VECTOR(VAL) - This represents the operation of loading a scalar value into element 0 of the...
@ FSINCOS
FSINCOS - Compute both fsin and fcos as a single operation.
@ BR_CC
BR_CC - Conditional branch.
@ BRIND
BRIND - Indirect branch.
@ BR_JT
BR_JT - Jumptable branch.
@ SSUBSAT
RESULT = [US]SUBSAT(LHS, RHS) - Perform saturation subtraction on 2 integers with the same bit width ...
@ EXTRACT_ELEMENT
EXTRACT_ELEMENT - This is used to get the lower or upper (determined by a Constant,...
@ SPLAT_VECTOR
SPLAT_VECTOR(VAL) - Returns a vector with the scalar value VAL duplicated in all lanes.
@ VACOPY
VACOPY - VACOPY has 5 operands: an input chain, a destination pointer, a source pointer,...
@ MULHU
MULHU/MULHS - Multiply high - Multiply two integers of type iN, producing an unsigned/signed value of...
@ SHL
Shift and rotation operations.
@ VECTOR_SHUFFLE
VECTOR_SHUFFLE(VEC1, VEC2) - Returns a vector, of the same type as VEC1/VEC2.
@ EXTRACT_SUBVECTOR
EXTRACT_SUBVECTOR(VECTOR, IDX) - Returns a subvector from VECTOR.
@ EXTRACT_VECTOR_ELT
EXTRACT_VECTOR_ELT(VECTOR, IDX) - Returns a single element from VECTOR identified by the (potentially...
@ CopyToReg
CopyToReg - This node has three operands: a chain, a register number to set to this value,...
@ ZERO_EXTEND
ZERO_EXTEND - Used for integer types, zeroing the new bits.
@ DEBUGTRAP
DEBUGTRAP - Trap intended to get the attention of a debugger.
@ SELECT_CC
Select with condition operator - This selects between a true value and a false value (ops #2 and #3) ...
@ FMINNUM
FMINNUM/FMAXNUM - Perform floating-point minimum maximum on two values, following IEEE-754 definition...
@ DYNAMIC_STACKALLOC
DYNAMIC_STACKALLOC - Allocate some number of bytes on the stack aligned to a specified boundary.
@ ANY_EXTEND_VECTOR_INREG
ANY_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register any-extension of the low la...
@ SIGN_EXTEND_INREG
SIGN_EXTEND_INREG - This operator atomically performs a SHL/SRA pair to sign extend a small value in ...
@ SMIN
[US]{MIN/MAX} - Binary minimum or maximum of signed or unsigned integers.
@ FP_EXTEND
X = FP_EXTEND(Y) - Extend a smaller FP type into a larger FP type.
@ FRAMEADDR
FRAMEADDR, RETURNADDR - These nodes represent llvm.frameaddress and llvm.returnaddress on the DAG.
@ FMINIMUM
FMINIMUM/FMAXIMUM - NaN-propagating minimum/maximum that also treat -0.0 as less than 0....
@ FP_TO_SINT
FP_TO_[US]INT - Convert a floating point value to a signed or unsigned integer.
@ TargetConstant
TargetConstant* - Like Constant*, but the DAG does not do any folding, simplification,...
@ AND
Bitwise operators - logical and, logical or, logical xor.
@ TRAP
TRAP - Trapping instruction.
@ INTRINSIC_WO_CHAIN
RESULT = INTRINSIC_WO_CHAIN(INTRINSICID, arg1, arg2, ...) This node represents a target intrinsic fun...
@ ADDE
Carry-using nodes for multiple precision addition and subtraction.
@ INSERT_VECTOR_ELT
INSERT_VECTOR_ELT(VECTOR, VAL, IDX) - Returns VECTOR with the element at IDX replaced with VAL.
@ TokenFactor
TokenFactor - This node takes multiple tokens as input and produces a single token result.
@ FP_ROUND
X = FP_ROUND(Y, TRUNC) - Rounding 'Y' from a larger floating point type down to the precision of the ...
@ CLEAR_CACHE
llvm.clear_cache intrinsic Operands: Input Chain, Start Addres, End Address Outputs: Output Chain
@ ZERO_EXTEND_VECTOR_INREG
ZERO_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register zero-extension of the low ...
@ FP_TO_SINT_SAT
FP_TO_[US]INT_SAT - Convert floating point value in operand 0 to a signed or unsigned scalar integer ...
@ TRUNCATE
TRUNCATE - Completely drop the high bits.
@ VAARG
VAARG - VAARG has four operands: an input chain, a pointer, a SRCVALUE, and the alignment.
@ SHL_PARTS
SHL_PARTS/SRA_PARTS/SRL_PARTS - These operators are used for expanded integer shift operations.
@ FCOPYSIGN
FCOPYSIGN(X, Y) - Return the value of X with the sign of Y.
@ SADDSAT
RESULT = [US]ADDSAT(LHS, RHS) - Perform saturation addition on 2 integers with the same bit width (W)...
@ FMINIMUMNUM
FMINIMUMNUM/FMAXIMUMNUM - minimumnum/maximumnum that is same with FMINNUM_IEEE and FMAXNUM_IEEE besid...
@ INTRINSIC_W_CHAIN
RESULT,OUTCHAIN = INTRINSIC_W_CHAIN(INCHAIN, INTRINSICID, arg1, ...) This node represents a target in...
@ BUILD_VECTOR
BUILD_VECTOR(ELT0, ELT1, ELT2, ELT3,...) - Return a fixed-width vector with the specified,...
LLVM_ABI bool isConstantSplatVector(const SDNode *N, APInt &SplatValue)
Node predicates.
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
This namespace contains an enum with a value for every intrinsic/builtin function known by LLVM.
OperandFlags
These are flags set on operands, but should be considered private, all access should go through the M...
CastOperator_match< OpTy, Instruction::BitCast > m_BitCast(const OpTy &Op)
Matches BitCast.
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
is_zero m_Zero()
Match any null constant or a vector with all elements equal to 0.
bool sd_match(SDNode *N, const SelectionDAG *DAG, Pattern &&P)
CondCode_match m_SpecificCondCode(ISD::CondCode CC)
Match a conditional code SDNode with a specific ISD::CondCode.
CondCode_match m_CondCode()
Match any conditional code SDNode.
TernaryOpc_match< T0_P, T1_P, T2_P, true, false > m_c_SetCC(const T0_P &LHS, const T1_P &RHS, const T2_P &CC)
MCSymbolWasm * getOrCreateFunctionTableSymbol(MCContext &Ctx, const WebAssemblySubtarget *Subtarget)
Returns the __indirect_function_table, for use in call_indirect and in function bitcasts.
@ WASM_ADDRESS_SPACE_EXTERNREF
@ WASM_ADDRESS_SPACE_FUNCREF
bool isWebAssemblyFuncrefType(const Type *Ty)
Return true if this is a WebAssembly Funcref Type.
bool isWebAssemblyTableType(const Type *Ty)
Return true if the table represents a WebAssembly table type.
MCSymbolWasm * getOrCreateFuncrefCallTableSymbol(MCContext &Ctx, const WebAssemblySubtarget *Subtarget)
Returns the __funcref_call_table, for use in funcref calls when lowered to table.set + call_indirect.
bool isValidAddressSpace(unsigned AS)
FastISel * createFastISel(FunctionLoweringInfo &funcInfo, const TargetLibraryInfo *libInfo, const LibcallLoweringInfo *libcallLowering)
bool canLowerReturn(size_t ResultSize, const WebAssemblySubtarget *Subtarget)
Returns true if the function's return value(s) can be lowered directly, i.e., not indirectly via a po...
bool isWasmVarAddressSpace(unsigned AS)
NodeAddr< NodeBase * > Node
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
unsigned Log2_32_Ceil(uint32_t Value)
Return the ceil log base 2 of the specified value, 32 if the value is zero.
FunctionAddr VTableAddr Value
void computeSignatureVTs(const FunctionType *Ty, const Function *TargetFunc, const Function &ContextFunc, const TargetMachine &TM, SmallVectorImpl< MVT > &Params, SmallVectorImpl< MVT > &Results)
auto size(R &&Range, std::enable_if_t< std::is_base_of< std::random_access_iterator_tag, typename std::iterator_traits< decltype(Range.begin())>::iterator_category >::value, void > *=nullptr)
Get the size of a range.
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
LLVM_ABI bool isNullConstant(SDValue V)
Returns true if V is a constant integer zero.
LLVM_ABI SDValue peekThroughBitcasts(SDValue V)
Return the non-bitcasted source operand of V if it exists.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
DWARFExpression::Operation Op
auto max_element(R &&Range)
Provide wrappers to std::max_element which take ranges instead of having to pass begin/end explicitly...
constexpr unsigned BitWidth
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
void computeLegalValueVTs(const WebAssemblyTargetLowering &TLI, LLVMContext &Ctx, const DataLayout &DL, Type *Ty, SmallVectorImpl< MVT > &ValueVTs)
constexpr uint64_t NextPowerOf2(uint64_t A)
Returns the next power of two (in 64-bits) that is strictly greater than A.
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
This struct is a compact representation of a valid (non-zero power of two) alignment.
EVT changeVectorElementTypeToInteger() const
Return a vector with the same number of elements as this vector, but with the element type converted ...
bool isSimple() const
Test if the given EVT is simple (as opposed to being extended).
static EVT getVectorVT(LLVMContext &Context, EVT VT, unsigned NumElements, bool IsScalable=false)
Returns the EVT that represents a vector NumElements in length, where each element is of type VT.
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
bool isByteSized() const
Return true if the bit size is a multiple of 8.
uint64_t getScalarSizeInBits() const
EVT changeVectorElementType(LLVMContext &Context, EVT EltVT) const
Return a VT for a vector type whose attributes match ourselves with the exception of the element type...
MVT getSimpleVT() const
Return the SimpleValueType held in the specified simple EVT.
bool is128BitVector() const
Return true if this is a 128-bit vector type.
static EVT getIntegerVT(LLVMContext &Context, unsigned BitWidth)
Returns the EVT that represents an integer with the given number of bits.
uint64_t getFixedSizeInBits() const
Return the size of the specified fixed width value type in bits.
EVT widenIntegerVectorElementType(LLVMContext &Context) const
Return a VT for an integer vector type with the size of the elements doubled.
bool isFixedLengthVector() const
bool isVector() const
Return true if this is a vector value type.
EVT getScalarType() const
If this is a vector type, return the element type, otherwise return this.
bool bitsGE(EVT VT) const
Return true if this has no less bits than VT.
bool is256BitVector() const
Return true if this is a 256-bit vector type.
LLVM_ABI Type * getTypeForEVT(LLVMContext &Context) const
This method returns an LLVM type corresponding to the specified EVT.
EVT getVectorElementType() const
Given a vector type, return the type of each element.
bool isScalarInteger() const
Return true if this is an integer, but not a vector.
unsigned getVectorNumElements() const
Given a vector type, return the number of elements it contains.
EVT getHalfNumVectorElementsVT(LLVMContext &Context) const
bool isInConsecutiveRegs() const
Align getNonZeroOrigAlign() const
bool isSwiftError() const
unsigned getByValSize() const
bool isInConsecutiveRegsLast() const
Align getNonZeroByValAlign() const
unsigned getBitWidth() const
Get the bit width of this value.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
These are IR-level optimization flags that may be propagated to SDNodes.
bool isBeforeLegalize() const
This structure is used to pass arguments to makeLibCall function.