67#define GET_INSTRINFO_CTOR_DTOR
68#include "AArch64GenInstrInfo.inc"
70#define DEBUG_TYPE "AArch64InstrInfo"
72STATISTIC(NumCopyInstrs,
"Number of COPY instructions expanded");
73STATISTIC(NumZCRegMoveInstrsGPR,
"Number of zero-cycle GPR register move "
74 "instructions expanded from canonical COPY");
75STATISTIC(NumZCRegMoveInstrsFPR,
"Number of zero-cycle FPR register move "
76 "instructions expanded from canonical COPY");
77STATISTIC(NumZCZeroingInstrsGPR,
"Number of zero-cycle GPR zeroing "
78 "instructions expanded from canonical COPY");
83 cl::desc(
"Restrict range of CB instructions (DEBUG)"));
87 cl::desc(
"Restrict range of TB[N]Z instructions (DEBUG)"));
91 cl::desc(
"Restrict range of CB[N]Z instructions (DEBUG)"));
95 cl::desc(
"Restrict range of Bcc instructions (DEBUG)"));
99 cl::desc(
"Restrict range of B instructions (DEBUG)"));
103 cl::desc(
"Restrict range of instructions to search for the "
104 "machine-combiner gather pattern optimization"));
109 RI(STI.getTargetTriple(), STI.getHwMode()), Subtarget(STI) {}
119 switch (
MI.getOpcode()) {
130 if (
MI.getOperand(0).getReg() != AArch64::LR)
135 if (
MI.getOperand(0).getImm() == 3 &&
MI.getOperand(1).getImm() == 7 &&
136 MI.getOperand(3).getImm() == 1)
144 bool ModifiesLR =
false;
145 bool ModifiesSP =
false;
149 if (MO.getReg() == AArch64::LR)
151 else if (MO.getReg() == AArch64::SP)
160 if (
MI.mayLoadOrStore()) {
168 if (ModifiesSP || ModifiesLR)
186 auto Op =
MI.getOpcode();
187 if (
Op == AArch64::INLINEASM ||
Op == AArch64::INLINEASM_BR)
188 return getInlineAsmLength(
MI.getOperand(0).getSymbolName(), MAI);
192 if (
MI.isMetaInstruction())
197 unsigned NumBytes = 0;
207 NumBytes =
Desc.getSize() ?
Desc.getSize() : 4;
210 if (!MFI->shouldSignReturnAddress(*MF))
213 auto Method = STI.getAuthenticatedLRCheckMethod(*MF);
221 switch (
Desc.getOpcode()) {
224 return Desc.getSize();
231 case TargetOpcode::STACKMAP:
234 assert(NumBytes % 4 == 0 &&
"Invalid number of NOP bytes requested!");
236 case TargetOpcode::PATCHPOINT:
239 assert(NumBytes % 4 == 0 &&
"Invalid number of NOP bytes requested!");
241 case TargetOpcode::STATEPOINT:
243 assert(NumBytes % 4 == 0 &&
"Invalid number of NOP bytes requested!");
248 case TargetOpcode::PATCHABLE_FUNCTION_ENTER:
253 F.getFnAttributeAsParsedInteger(
"patchable-function-entry", 9) * 4;
255 case TargetOpcode::PATCHABLE_FUNCTION_EXIT:
256 case TargetOpcode::PATCHABLE_TAIL_CALL:
257 case TargetOpcode::PATCHABLE_TYPED_EVENT_CALL:
261 case TargetOpcode::PATCHABLE_EVENT_CALL:
267 NumBytes =
MI.getOperand(1).getImm();
269 case AArch64::MOVaddr:
270 case AArch64::MOVaddrJT:
271 case AArch64::MOVaddrCP:
272 case AArch64::MOVaddrBA:
273 case AArch64::MOVaddrTLS:
274 case AArch64::MOVaddrEXT: {
278 MI.getOperand(1).getTargetFlags(),
279 Subtarget.isTargetMachO(), Insn);
280 NumBytes = Insn.
size() * 4;
284 case AArch64::MOVi32imm:
285 case AArch64::MOVi64imm: {
287 unsigned BitSize =
Desc.getOpcode() == AArch64::MOVi32imm ? 32 : 64;
290 NumBytes = Insn.
size() * 4;
294 case TargetOpcode::BUNDLE:
295 NumBytes = getInstBundleSize(
MI);
331 case AArch64::CBWPri:
332 case AArch64::CBXPri:
333 case AArch64::CBWPrr:
334 case AArch64::CBXPrr:
342 case AArch64::CBBAssertExt:
343 case AArch64::CBHAssertExt:
374 case AArch64::CBWPri:
375 case AArch64::CBXPri:
376 case AArch64::CBBAssertExt:
377 case AArch64::CBHAssertExt:
378 case AArch64::CBWPrr:
379 case AArch64::CBXPrr:
385 int64_t BrOffset)
const {
387 assert(Bits >= 3 &&
"max branch displacement must be enough to jump"
388 "over conditional branch expansion");
389 return isIntN(Bits, BrOffset / 4);
394 switch (
MI.getOpcode()) {
398 return MI.getOperand(0).getMBB();
403 return MI.getOperand(2).getMBB();
409 return MI.getOperand(1).getMBB();
410 case AArch64::CBWPri:
411 case AArch64::CBXPri:
412 case AArch64::CBBAssertExt:
413 case AArch64::CBHAssertExt:
414 case AArch64::CBWPrr:
415 case AArch64::CBXPrr:
416 return MI.getOperand(3).getMBB();
426 assert(RS &&
"RegScavenger required for long branching");
428 "new block should be inserted for expanding unconditional branch");
431 "restore block should be inserted for restoring clobbered registers");
438 "Branch offsets outside of the signed 33-bit range not supported");
449 RS->enterBasicBlockEnd(
MBB);
452 constexpr Register Reg = AArch64::X16;
453 if (!RS->isRegUsed(Reg)) {
454 insertUnconditionalBranch(
MBB, &NewDestBB,
DL);
465 Register Scavenged = RS->FindUnusedReg(&AArch64::GPR64RegClass);
466 if (Scavenged != AArch64::NoRegister) {
467 buildIndirectBranch(Scavenged, NewDestBB);
468 RS->setRegUsed(Scavenged);
477 "Unable to insert indirect branch inside function that has red zone");
500 bool AllowModify)
const {
507 if (
I->getOpcode() == AArch64::SpeculationBarrierISBDSBEndBB ||
508 I->getOpcode() == AArch64::SpeculationBarrierSBEndBB) {
512 if (!isUnpredicatedTerminator(*
I))
519 unsigned LastOpc = LastInst->
getOpcode();
520 if (
I ==
MBB.begin() || !isUnpredicatedTerminator(*--
I)) {
535 unsigned SecondLastOpc = SecondLastInst->
getOpcode();
542 LastInst = SecondLastInst;
544 if (
I ==
MBB.begin() || !isUnpredicatedTerminator(*--
I)) {
549 SecondLastInst = &*
I;
550 SecondLastOpc = SecondLastInst->
getOpcode();
561 LastInst = SecondLastInst;
563 if (
I ==
MBB.begin() || !isUnpredicatedTerminator(*--
I)) {
565 "unreachable unconditional branches removed above");
574 SecondLastInst = &*
I;
575 SecondLastOpc = SecondLastInst->
getOpcode();
579 if (SecondLastInst &&
I !=
MBB.begin() && isUnpredicatedTerminator(*--
I))
595 I->eraseFromParent();
604 I->eraseFromParent();
613 MachineBranchPredicate &MBP,
614 bool AllowModify)
const {
626 assert(MBP.TrueDest &&
"expected!");
627 MBP.FalseDest = FBB ? FBB :
MBB.getNextNode();
629 MBP.ConditionDef =
nullptr;
630 MBP.SingleUseCondition =
false;
640 if (
I ==
MBB.begin())
656 if (
MI.modifiesRegister(AArch64::NZCV,
nullptr)) {
657 MBP.ConditionDef = &
MI;
666 case AArch64::CBNZX: {
670 MBP.Predicate = (
Opc == AArch64::CBNZX ||
Opc == AArch64::CBNZW)
671 ? MachineBranchPredicate::PRED_NE
672 : MachineBranchPredicate::PRED_EQ;
673 Register CondReg = MBP.LHS.getReg();
682 case AArch64::TBNZX: {
703 Cond[1].setImm(AArch64::CBNZW);
706 Cond[1].setImm(AArch64::CBZW);
709 Cond[1].setImm(AArch64::CBNZX);
712 Cond[1].setImm(AArch64::CBZX);
715 Cond[1].setImm(AArch64::TBNZW);
718 Cond[1].setImm(AArch64::TBZW);
721 Cond[1].setImm(AArch64::TBNZX);
724 Cond[1].setImm(AArch64::TBZX);
728 case AArch64::CBWPri:
729 case AArch64::CBXPri:
730 case AArch64::CBBAssertExt:
731 case AArch64::CBHAssertExt:
732 case AArch64::CBWPrr:
733 case AArch64::CBXPrr: {
746 int *BytesRemoved)
const {
756 I->eraseFromParent();
760 if (
I ==
MBB.begin()) {
773 I->eraseFromParent();
780void AArch64InstrInfo::instantiateCondBranch(
805 if (
Cond.size() > 5) {
816 assert(
TBB &&
"insertBranch must not be told to insert a fallthrough");
843 unsigned Opc =
MI.getOpcode();
850 if (
MI.getOperand(0).getReg() == AArch64::WZR ||
851 MI.getOperand(0).getReg() == AArch64::XZR) {
853 dbgs() <<
"Removing always taken branch: " <<
MI);
856 for (
auto *S : Succs)
858 MBB->removeSuccessor(S);
860 while (
MBB->rbegin() != &
MI)
861 MBB->rbegin()->eraseFromParent();
862 MI.eraseFromParent();
872 if (
MI.getOperand(0).getReg() == AArch64::WZR ||
873 MI.getOperand(0).getReg() == AArch64::XZR) {
875 dbgs() <<
"Removing never taken branch: " <<
MI);
877 MI.getParent()->removeSuccessor(
Target);
878 MI.eraseFromParent();
891 if (!
DefMI->isFullCopy())
893 VReg =
DefMI->getOperand(1).getReg();
902 unsigned *NewReg =
nullptr) {
907 bool Is64Bit = AArch64::GPR64allRegClass.hasSubClassEq(MRI.
getRegClass(VReg));
911 switch (
DefMI->getOpcode()) {
912 case AArch64::SUBREG_TO_REG:
916 if (!
DefMI->getOperand(1).isReg())
918 if (!
DefMI->getOperand(2).isImm() ||
919 DefMI->getOperand(2).getImm() != AArch64::sub_32)
922 if (
DefMI->getOpcode() != AArch64::MOVi32imm)
924 if (!
DefMI->getOperand(1).isImm() ||
DefMI->getOperand(1).getImm() != 1)
927 SrcReg = AArch64::XZR;
928 Opc = AArch64::CSINCXr;
931 case AArch64::MOVi32imm:
932 case AArch64::MOVi64imm:
933 if (!
DefMI->getOperand(1).isImm() ||
DefMI->getOperand(1).getImm() != 1)
935 SrcReg = Is64Bit ? AArch64::XZR : AArch64::WZR;
936 Opc = Is64Bit ? AArch64::CSINCXr : AArch64::CSINCWr;
939 case AArch64::ADDSXri:
940 case AArch64::ADDSWri:
942 if (
DefMI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
947 case AArch64::ADDXri:
948 case AArch64::ADDWri:
950 if (!
DefMI->getOperand(2).isImm() ||
DefMI->getOperand(2).getImm() != 1 ||
951 DefMI->getOperand(3).getImm() != 0)
953 SrcReg =
DefMI->getOperand(1).getReg();
954 Opc = Is64Bit ? AArch64::CSINCXr : AArch64::CSINCWr;
957 case AArch64::ORNXrr:
958 case AArch64::ORNWrr: {
961 if (ZReg != AArch64::XZR && ZReg != AArch64::WZR)
963 SrcReg =
DefMI->getOperand(2).getReg();
964 Opc = Is64Bit ? AArch64::CSINVXr : AArch64::CSINVWr;
968 case AArch64::SUBSXrr:
969 case AArch64::SUBSWrr:
971 if (
DefMI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
976 case AArch64::SUBXrr:
977 case AArch64::SUBWrr: {
980 if (ZReg != AArch64::XZR && ZReg != AArch64::WZR)
982 SrcReg =
DefMI->getOperand(2).getReg();
983 Opc = Is64Bit ? AArch64::CSNEGXr : AArch64::CSNEGWr;
989 assert(
Opc && SrcReg &&
"Missing parameters");
1001 int &FalseCycles)
const {
1012 if (!RI.getCommonSubClass(RC, MRI.
getRegClass(DstReg)))
1016 unsigned ExtraCondLat =
Cond.size() != 1;
1020 if (AArch64::GPR64allRegClass.hasSubClassEq(RC) ||
1021 AArch64::GPR32allRegClass.hasSubClassEq(RC)) {
1023 CondCycles = 1 + ExtraCondLat;
1024 TrueCycles = FalseCycles = 1;
1034 if (AArch64::FPR64RegClass.hasSubClassEq(RC) ||
1035 AArch64::FPR32RegClass.hasSubClassEq(RC)) {
1036 CondCycles = 5 + ExtraCondLat;
1037 TrueCycles = FalseCycles = 2;
1054 switch (
Cond.size()) {
1074 case AArch64::CBNZW:
1078 case AArch64::CBNZX:
1109 case AArch64::TBNZW:
1110 case AArch64::TBNZX:
1132 unsigned SubsOpc, SubsDestReg;
1138 case AArch64::CBWPri:
1139 SubsOpc = AArch64::SUBSWri;
1140 SubsDestReg = AArch64::WZR;
1143 case AArch64::CBXPri:
1144 SubsOpc = AArch64::SUBSXri;
1145 SubsDestReg = AArch64::XZR;
1148 case AArch64::CBWPrr:
1149 SubsOpc = AArch64::SUBSWrr;
1150 SubsDestReg = AArch64::WZR;
1153 case AArch64::CBXPrr:
1154 SubsOpc = AArch64::SUBSXrr;
1155 SubsDestReg = AArch64::XZR;
1184 switch (ExtendType) {
1190 "Unexpected compare-and-branch instruction for SXTB shift-extend");
1191 ExtOpc = AArch64::SBFMWri;
1197 "Unexpected compare-and-branch instruction for SXTH shift-extend");
1198 ExtOpc = AArch64::SBFMWri;
1204 "Unexpected compare-and-branch instruction for UXTB shift-extend");
1205 ExtOpc = AArch64::ANDWri;
1211 "Unexpected compare-and-branch instruction for UXTH shift-extend");
1212 ExtOpc = AArch64::ANDWri;
1221 if (ExtOpc != AArch64::ANDWri)
1223 MBBI.addImm(ExtBits);
1251 bool TryFold =
false;
1253 RC = &AArch64::GPR64RegClass;
1254 Opc = AArch64::CSELXr;
1257 RC = &AArch64::GPR32RegClass;
1258 Opc = AArch64::CSELWr;
1261 RC = &AArch64::FPR64RegClass;
1262 Opc = AArch64::FCSELDrrr;
1264 RC = &AArch64::FPR32RegClass;
1265 Opc = AArch64::FCSELSrrr;
1267 assert(RC &&
"Unsupported regclass");
1271 unsigned NewReg = 0;
1294 (FalseReg.
isVirtual() || FalseReg == AArch64::WZR ||
1295 FalseReg == AArch64::XZR) &&
1296 "FalseReg was folded into a non-virtual register other than WZR or XZR");
1313 assert(BitSize == 64 &&
"Only bit sizes of 32 or 64 allowed");
1318 return Is.
size() <= 2;
1323 assert(
MI.isCopy() &&
"Expected COPY instruction");
1329 if (
Reg.isVirtual())
1331 if (
Reg.isPhysical())
1332 return RI.getMinimalPhysRegClass(
Reg);
1337 if (DstRC && SrcRC && !RI.getCommonSubClass(DstRC, SrcRC))
1340 return MI.isAsCheapAsAMove();
1346 if (Subtarget.hasExynosCheapAsMoveHandling()) {
1347 if (isExynosCheapAsMove(
MI))
1349 return MI.isAsCheapAsAMove();
1352 switch (
MI.getOpcode()) {
1354 return MI.isAsCheapAsAMove();
1356 case TargetOpcode::COPY:
1359 case AArch64::ADDWrs:
1360 case AArch64::ADDXrs:
1361 case AArch64::SUBWrs:
1362 case AArch64::SUBXrs:
1363 return Subtarget.hasALULSLFast() &&
MI.getOperand(3).getImm() <= 4;
1368 case AArch64::MOVi32imm:
1370 case AArch64::MOVi64imm:
1375bool AArch64InstrInfo::isFalkorShiftExtFast(
const MachineInstr &
MI) {
1376 switch (
MI.getOpcode()) {
1380 case AArch64::ADDWrs:
1381 case AArch64::ADDXrs:
1382 case AArch64::ADDSWrs:
1383 case AArch64::ADDSXrs: {
1384 unsigned Imm =
MI.getOperand(3).getImm();
1391 case AArch64::ADDWrx:
1392 case AArch64::ADDXrx:
1393 case AArch64::ADDXrx64:
1394 case AArch64::ADDSWrx:
1395 case AArch64::ADDSXrx:
1396 case AArch64::ADDSXrx64: {
1397 unsigned Imm =
MI.getOperand(3).getImm();
1409 case AArch64::SUBWrs:
1410 case AArch64::SUBSWrs: {
1411 unsigned Imm =
MI.getOperand(3).getImm();
1413 return ShiftVal == 0 ||
1417 case AArch64::SUBXrs:
1418 case AArch64::SUBSXrs: {
1419 unsigned Imm =
MI.getOperand(3).getImm();
1421 return ShiftVal == 0 ||
1425 case AArch64::SUBWrx:
1426 case AArch64::SUBXrx:
1427 case AArch64::SUBXrx64:
1428 case AArch64::SUBSWrx:
1429 case AArch64::SUBSXrx:
1430 case AArch64::SUBSXrx64: {
1431 unsigned Imm =
MI.getOperand(3).getImm();
1443 case AArch64::LDRBBroW:
1444 case AArch64::LDRBBroX:
1445 case AArch64::LDRBroW:
1446 case AArch64::LDRBroX:
1447 case AArch64::LDRDroW:
1448 case AArch64::LDRDroX:
1449 case AArch64::LDRHHroW:
1450 case AArch64::LDRHHroX:
1451 case AArch64::LDRHroW:
1452 case AArch64::LDRHroX:
1453 case AArch64::LDRQroW:
1454 case AArch64::LDRQroX:
1455 case AArch64::LDRSBWroW:
1456 case AArch64::LDRSBWroX:
1457 case AArch64::LDRSBXroW:
1458 case AArch64::LDRSBXroX:
1459 case AArch64::LDRSHWroW:
1460 case AArch64::LDRSHWroX:
1461 case AArch64::LDRSHXroW:
1462 case AArch64::LDRSHXroX:
1463 case AArch64::LDRSWroW:
1464 case AArch64::LDRSWroX:
1465 case AArch64::LDRSroW:
1466 case AArch64::LDRSroX:
1467 case AArch64::LDRWroW:
1468 case AArch64::LDRWroX:
1469 case AArch64::LDRXroW:
1470 case AArch64::LDRXroX:
1471 case AArch64::PRFMroW:
1472 case AArch64::PRFMroX:
1473 case AArch64::STRBBroW:
1474 case AArch64::STRBBroX:
1475 case AArch64::STRBroW:
1476 case AArch64::STRBroX:
1477 case AArch64::STRDroW:
1478 case AArch64::STRDroX:
1479 case AArch64::STRHHroW:
1480 case AArch64::STRHHroX:
1481 case AArch64::STRHroW:
1482 case AArch64::STRHroX:
1483 case AArch64::STRQroW:
1484 case AArch64::STRQroX:
1485 case AArch64::STRSroW:
1486 case AArch64::STRSroX:
1487 case AArch64::STRWroW:
1488 case AArch64::STRWroX:
1489 case AArch64::STRXroW:
1490 case AArch64::STRXroX: {
1491 unsigned IsSigned =
MI.getOperand(3).getImm();
1498 unsigned Opc =
MI.getOpcode();
1502 case AArch64::SEH_StackAlloc:
1503 case AArch64::SEH_SaveFPLR:
1504 case AArch64::SEH_SaveFPLR_X:
1505 case AArch64::SEH_SaveReg:
1506 case AArch64::SEH_SaveReg_X:
1507 case AArch64::SEH_SaveRegP:
1508 case AArch64::SEH_SaveRegP_X:
1509 case AArch64::SEH_SaveFReg:
1510 case AArch64::SEH_SaveFReg_X:
1511 case AArch64::SEH_SaveFRegP:
1512 case AArch64::SEH_SaveFRegP_X:
1513 case AArch64::SEH_SetFP:
1514 case AArch64::SEH_AddFP:
1515 case AArch64::SEH_Nop:
1516 case AArch64::SEH_PrologEnd:
1517 case AArch64::SEH_EpilogStart:
1518 case AArch64::SEH_EpilogEnd:
1519 case AArch64::SEH_PACSignLR:
1520 case AArch64::SEH_SaveAnyRegI:
1521 case AArch64::SEH_SaveAnyRegIP:
1522 case AArch64::SEH_SaveAnyRegQP:
1523 case AArch64::SEH_SaveAnyRegQPX:
1524 case AArch64::SEH_AllocZ:
1525 case AArch64::SEH_SaveZReg:
1526 case AArch64::SEH_SavePReg:
1533 unsigned &SubIdx)
const {
1534 switch (
MI.getOpcode()) {
1537 case AArch64::SBFMXri:
1538 case AArch64::UBFMXri:
1541 if (
MI.getOperand(2).getImm() != 0 ||
MI.getOperand(3).getImm() != 31)
1544 SrcReg =
MI.getOperand(1).getReg();
1545 DstReg =
MI.getOperand(0).getReg();
1546 SubIdx = AArch64::sub_32;
1555 int64_t OffsetA = 0, OffsetB = 0;
1556 TypeSize WidthA(0,
false), WidthB(0,
false);
1557 bool OffsetAIsScalable =
false, OffsetBIsScalable =
false;
1578 OffsetAIsScalable == OffsetBIsScalable) {
1579 int LowOffset = OffsetA < OffsetB ? OffsetA : OffsetB;
1580 int HighOffset = OffsetA < OffsetB ? OffsetB : OffsetA;
1581 TypeSize LowWidth = (LowOffset == OffsetA) ? WidthA : WidthB;
1582 if (LowWidth.
isScalable() == OffsetAIsScalable &&
1600 switch (
MI.getOpcode()) {
1603 if (
MI.getOperand(0).getImm() == 0x14)
1610 case AArch64::MSRpstatesvcrImm1:
1617 auto Next = std::next(
MI.getIterator());
1618 return Next !=
MBB->end() &&
Next->isCFIInstruction();
1625 Register &SrcReg2, int64_t &CmpMask,
1626 int64_t &CmpValue)
const {
1630 assert(
MI.getNumOperands() >= 2 &&
"All AArch64 cmps should have 2 operands");
1631 if (!
MI.getOperand(1).isReg() ||
MI.getOperand(1).getSubReg())
1634 switch (
MI.getOpcode()) {
1637 case AArch64::PTEST_PP:
1638 case AArch64::PTEST_PP_ANY:
1639 case AArch64::PTEST_PP_FIRST:
1640 SrcReg =
MI.getOperand(0).getReg();
1641 SrcReg2 =
MI.getOperand(1).getReg();
1642 if (
MI.getOperand(2).getSubReg())
1649 case AArch64::SUBSWrr:
1650 case AArch64::SUBSWrs:
1651 case AArch64::SUBSWrx:
1652 case AArch64::SUBSXrr:
1653 case AArch64::SUBSXrs:
1654 case AArch64::SUBSXrx:
1655 case AArch64::ADDSWrr:
1656 case AArch64::ADDSWrs:
1657 case AArch64::ADDSWrx:
1658 case AArch64::ADDSXrr:
1659 case AArch64::ADDSXrs:
1660 case AArch64::ADDSXrx:
1662 SrcReg =
MI.getOperand(1).getReg();
1663 SrcReg2 =
MI.getOperand(2).getReg();
1666 if (
MI.getOperand(2).getSubReg())
1672 case AArch64::SUBSWri:
1673 case AArch64::ADDSWri:
1674 case AArch64::SUBSXri:
1675 case AArch64::ADDSXri:
1676 SrcReg =
MI.getOperand(1).getReg();
1679 CmpValue =
MI.getOperand(2).getImm();
1681 case AArch64::ANDSWri:
1682 case AArch64::ANDSXri:
1685 SrcReg =
MI.getOperand(1).getReg();
1689 MI.getOperand(2).getImm(),
1690 MI.getOpcode() == AArch64::ANDSWri ? 32 : 64);
1699 assert(
MBB &&
"Can't get MachineBasicBlock here");
1701 assert(MF &&
"Can't get MachineFunction here");
1706 for (
unsigned OpIdx = 0, EndIdx = Instr.getNumOperands();
OpIdx < EndIdx;
1713 if (!OpRegCstraints)
1721 "Operand has register constraints without being a register!");
1724 if (
Reg.isPhysical()) {
1741 bool MIDefinesZeroReg =
false;
1742 if (
MI.definesRegister(AArch64::WZR,
nullptr) ||
1743 MI.definesRegister(AArch64::XZR,
nullptr))
1744 MIDefinesZeroReg =
true;
1746 switch (
MI.getOpcode()) {
1748 return MI.getOpcode();
1749 case AArch64::ADDSWrr:
1750 return AArch64::ADDWrr;
1751 case AArch64::ADDSWri:
1752 return MIDefinesZeroReg ? AArch64::ADDSWri : AArch64::ADDWri;
1753 case AArch64::ADDSWrs:
1754 return MIDefinesZeroReg ? AArch64::ADDSWrs : AArch64::ADDWrs;
1755 case AArch64::ADDSWrx:
1756 return AArch64::ADDWrx;
1757 case AArch64::ADDSXrr:
1758 return AArch64::ADDXrr;
1759 case AArch64::ADDSXri:
1760 return MIDefinesZeroReg ? AArch64::ADDSXri : AArch64::ADDXri;
1761 case AArch64::ADDSXrs:
1762 return MIDefinesZeroReg ? AArch64::ADDSXrs : AArch64::ADDXrs;
1763 case AArch64::ADDSXrx:
1764 return AArch64::ADDXrx;
1765 case AArch64::SUBSWrr:
1766 return AArch64::SUBWrr;
1767 case AArch64::SUBSWri:
1768 return MIDefinesZeroReg ? AArch64::SUBSWri : AArch64::SUBWri;
1769 case AArch64::SUBSWrs:
1770 return MIDefinesZeroReg ? AArch64::SUBSWrs : AArch64::SUBWrs;
1771 case AArch64::SUBSWrx:
1772 return AArch64::SUBWrx;
1773 case AArch64::SUBSXrr:
1774 return AArch64::SUBXrr;
1775 case AArch64::SUBSXri:
1776 return MIDefinesZeroReg ? AArch64::SUBSXri : AArch64::SUBXri;
1777 case AArch64::SUBSXrs:
1778 return MIDefinesZeroReg ? AArch64::SUBSXrs : AArch64::SUBXrs;
1779 case AArch64::SUBSXrx:
1780 return AArch64::SUBXrx;
1795 if (To == To->getParent()->begin())
1800 if (To->getParent() != From->getParent())
1812 Instr.modifiesRegister(AArch64::NZCV,
TRI)) ||
1813 ((AccessToCheck &
AK_Read) && Instr.readsRegister(AArch64::NZCV,
TRI)))
1819std::optional<unsigned>
1823 unsigned MaskOpcode =
Mask->getOpcode();
1824 unsigned PredOpcode = Pred->
getOpcode();
1825 bool PredIsPTestLike = isPTestLikeOpcode(PredOpcode);
1826 bool PredIsWhileLike = isWhileOpcode(PredOpcode);
1828 if (PredIsWhileLike) {
1832 if ((Mask == Pred) && PTest->
getOpcode() == AArch64::PTEST_PP_ANY)
1839 getElementSizeForOpcode(MaskOpcode) ==
1840 getElementSizeForOpcode(PredOpcode))
1846 if (PTest->
getOpcode() == AArch64::PTEST_PP_FIRST &&
1853 if (PredIsPTestLike) {
1858 if ((Mask == Pred) && PTest->
getOpcode() == AArch64::PTEST_PP_ANY)
1866 if (Mask != PTestLikeMask && PTestLikeMask->isFullCopy() &&
1867 PTestLikeMask->getOperand(1).getReg().isVirtual())
1875 getElementSizeForOpcode(MaskOpcode) ==
1876 getElementSizeForOpcode(PredOpcode)) {
1877 if (Mask == PTestLikeMask || PTest->
getOpcode() == AArch64::PTEST_PP_ANY)
1903 uint64_t PredElementSize = getElementSizeForOpcode(PredOpcode);
1905 PTest->
getOpcode() == AArch64::PTEST_PP_ANY))
1913 switch (PredOpcode) {
1914 case AArch64::AND_PPzPP:
1915 case AArch64::BIC_PPzPP:
1916 case AArch64::EOR_PPzPP:
1917 case AArch64::NAND_PPzPP:
1918 case AArch64::NOR_PPzPP:
1919 case AArch64::ORN_PPzPP:
1920 case AArch64::ORR_PPzPP:
1921 case AArch64::BRKA_PPzP:
1922 case AArch64::BRKPA_PPzPP:
1923 case AArch64::BRKB_PPzP:
1924 case AArch64::BRKPB_PPzPP:
1925 case AArch64::RDFFR_PPz: {
1929 if (Mask != PredMask)
1933 case AArch64::BRKN_PPzP: {
1937 if ((MaskOpcode != AArch64::PTRUE_B) ||
1938 (
Mask->getOperand(1).getImm() != 31))
1942 case AArch64::PTRUE_B:
1955bool AArch64InstrInfo::optimizePTestInstr(
1956 MachineInstr *PTest,
unsigned MaskReg,
unsigned PredReg,
1961 if (Pred->
isCopy() && PTest->
getOpcode() == AArch64::PTEST_PP_FIRST) {
1965 if (
Op.isReg() &&
Op.getReg().isVirtual() &&
1966 Op.getSubReg() == AArch64::psub0)
1970 unsigned PredOpcode = Pred->
getOpcode();
1971 auto NewOp = canRemovePTestInstr(PTest, Mask, Pred, MRI);
1987 if (*NewOp != PredOpcode) {
1998 for (; i !=
e; ++i) {
2029 if (DeadNZCVIdx != -1) {
2048 if (CmpInstr.
getOpcode() == AArch64::PTEST_PP ||
2049 CmpInstr.
getOpcode() == AArch64::PTEST_PP_ANY ||
2050 CmpInstr.
getOpcode() == AArch64::PTEST_PP_FIRST)
2051 return optimizePTestInstr(&CmpInstr, SrcReg, SrcReg2, MRI);
2060 if (CmpValue == 0 && substituteCmpToZero(CmpInstr, SrcReg, *MRI))
2062 return (CmpValue == 0 || CmpValue == 1) &&
2063 removeCmpToZeroOrOne(CmpInstr, SrcReg, CmpValue, *MRI);
2071 switch (Instr.getOpcode()) {
2073 return AArch64::INSTRUCTION_LIST_END;
2075 case AArch64::ADDSWrr:
2076 case AArch64::ADDSWri:
2077 case AArch64::ADDSXrr:
2078 case AArch64::ADDSXri:
2079 case AArch64::ADDSWrx:
2080 case AArch64::ADDSXrx:
2081 case AArch64::SUBSWrr:
2082 case AArch64::SUBSWri:
2083 case AArch64::SUBSWrx:
2084 case AArch64::SUBSXrr:
2085 case AArch64::SUBSXri:
2086 case AArch64::SUBSXrx:
2087 case AArch64::ANDSWri:
2088 case AArch64::ANDSWrr:
2089 case AArch64::ANDSWrs:
2090 case AArch64::ANDSXri:
2091 case AArch64::ANDSXrr:
2092 case AArch64::ANDSXrs:
2093 case AArch64::BICSWrr:
2094 case AArch64::BICSXrr:
2095 case AArch64::BICSWrs:
2096 case AArch64::BICSXrs:
2097 return Instr.getOpcode();
2099 case AArch64::ADDWrr:
2100 return AArch64::ADDSWrr;
2101 case AArch64::ADDWri:
2102 return AArch64::ADDSWri;
2103 case AArch64::ADDXrr:
2104 return AArch64::ADDSXrr;
2105 case AArch64::ADDXri:
2106 return AArch64::ADDSXri;
2107 case AArch64::ADDWrx:
2108 return AArch64::ADDSWrx;
2109 case AArch64::ADDXrx:
2110 return AArch64::ADDSXrx;
2111 case AArch64::ADCWr:
2112 return AArch64::ADCSWr;
2113 case AArch64::ADCXr:
2114 return AArch64::ADCSXr;
2115 case AArch64::SUBWrr:
2116 return AArch64::SUBSWrr;
2117 case AArch64::SUBWri:
2118 return AArch64::SUBSWri;
2119 case AArch64::SUBXrr:
2120 return AArch64::SUBSXrr;
2121 case AArch64::SUBXri:
2122 return AArch64::SUBSXri;
2123 case AArch64::SUBWrx:
2124 return AArch64::SUBSWrx;
2125 case AArch64::SUBXrx:
2126 return AArch64::SUBSXrx;
2127 case AArch64::SBCWr:
2128 return AArch64::SBCSWr;
2129 case AArch64::SBCXr:
2130 return AArch64::SBCSXr;
2131 case AArch64::ANDWri:
2132 return AArch64::ANDSWri;
2133 case AArch64::ANDXri:
2134 return AArch64::ANDSXri;
2135 case AArch64::ANDWrr:
2136 return AArch64::ANDSWrr;
2137 case AArch64::ANDWrs:
2138 return AArch64::ANDSWrs;
2139 case AArch64::ANDXrr:
2140 return AArch64::ANDSXrr;
2141 case AArch64::ANDXrs:
2142 return AArch64::ANDSXrs;
2143 case AArch64::BICWrr:
2144 return AArch64::BICSWrr;
2145 case AArch64::BICXrr:
2146 return AArch64::BICSXrr;
2147 case AArch64::BICWrs:
2148 return AArch64::BICSWrs;
2149 case AArch64::BICXrs:
2150 return AArch64::BICSXrs;
2156 for (
auto *BB :
MBB->successors())
2157 if (BB->isLiveIn(AArch64::NZCV))
2164int AArch64InstrInfo::findCondCodeUseOperandIdxForBranchOrSelect(
2166 switch (
Instr.getOpcode()) {
2170 case AArch64::Bcc: {
2171 int Idx =
Instr.findRegisterUseOperandIdx(AArch64::NZCV,
nullptr);
2176 case AArch64::CSINVWr:
2177 case AArch64::CSINVXr:
2178 case AArch64::CSINCWr:
2179 case AArch64::CSINCXr:
2180 case AArch64::CSELWr:
2181 case AArch64::CSELXr:
2182 case AArch64::CSNEGWr:
2183 case AArch64::CSNEGXr:
2184 case AArch64::FCSELSrrr:
2185 case AArch64::FCSELDrrr: {
2186 int Idx =
Instr.findRegisterUseOperandIdx(AArch64::NZCV,
nullptr);
2198 AArch64InstrInfo::findCondCodeUseOperandIdxForBranchOrSelect(Instr);
2200 Instr.getOperand(CCIdx).
getImm())
2253std::optional<UsedNZCV>
2258 if (
MI.getParent() != CmpParent)
2259 return std::nullopt;
2262 return std::nullopt;
2267 if (Instr.readsRegister(AArch64::NZCV, &
TRI)) {
2270 return std::nullopt;
2275 if (Instr.modifiesRegister(AArch64::NZCV, &
TRI))
2278 return NZCVUsedAfterCmp;
2282 return Opcode == AArch64::ADDSWri || Opcode == AArch64::ADDSXri;
2286 return Opcode == AArch64::SUBSWri || Opcode == AArch64::SUBSXri;
2292 case AArch64::ANDSWri:
2293 case AArch64::ANDSWrr:
2294 case AArch64::ANDSWrs:
2295 case AArch64::ANDSXri:
2296 case AArch64::ANDSXrr:
2297 case AArch64::ANDSXrs:
2298 case AArch64::BICSWrr:
2299 case AArch64::BICSXrr:
2300 case AArch64::BICSWrs:
2301 case AArch64::BICSXrs:
2327 const unsigned CmpOpcode = CmpInstr.
getOpcode();
2333 "Caller guarantees that CmpInstr compares with constant 0");
2336 if (!NZVCUsed || NZVCUsed->C)
2359bool AArch64InstrInfo::substituteCmpToZero(
2370 if (NewOpc == AArch64::INSTRUCTION_LIST_END)
2377 MI->setDesc(
get(NewOpc));
2382 MI->addRegisterDefined(AArch64::NZCV, &
TRI);
2394 assert((CmpValue == 0 || CmpValue == 1) &&
2395 "Only comparisons to 0 or 1 considered for removal!");
2398 unsigned MIOpc =
MI.getOpcode();
2399 if (MIOpc == AArch64::CSINCWr) {
2400 if (
MI.getOperand(1).getReg() != AArch64::WZR ||
2401 MI.getOperand(2).getReg() != AArch64::WZR)
2403 }
else if (MIOpc == AArch64::CSINCXr) {
2404 if (
MI.getOperand(1).getReg() != AArch64::XZR ||
2405 MI.getOperand(2).getReg() != AArch64::XZR)
2415 if (
MI.findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
true) != -1)
2419 const unsigned CmpOpcode = CmpInstr.
getOpcode();
2421 if (CmpValue && !IsSubsRegImm)
2423 if (!CmpValue && !IsSubsRegImm && !
isADDSRegImm(CmpOpcode))
2428 if (MIUsedNZCV.
C || MIUsedNZCV.
V)
2431 std::optional<UsedNZCV> NZCVUsedAfterCmp =
2435 if (!NZCVUsedAfterCmp || NZCVUsedAfterCmp->C || NZCVUsedAfterCmp->V)
2438 if ((MIUsedNZCV.
Z && NZCVUsedAfterCmp->N) ||
2439 (MIUsedNZCV.
N && NZCVUsedAfterCmp->Z))
2442 if (MIUsedNZCV.
N && !CmpValue)
2484bool AArch64InstrInfo::removeCmpToZeroOrOne(
2491 SmallVector<MachineInstr *, 4> CCUseInstrs;
2492 bool IsInvertCC =
false;
2500 for (MachineInstr *CCUseInstr : CCUseInstrs) {
2501 int Idx = findCondCodeUseOperandIdxForBranchOrSelect(*CCUseInstr);
2502 assert(Idx >= 0 &&
"Unexpected instruction using CC.");
2503 MachineOperand &CCOperand = CCUseInstr->getOperand(Idx);
2512bool AArch64InstrInfo::expandPostRAPseudo(
MachineInstr &
MI)
const {
2513 if (
MI.getOpcode() != TargetOpcode::LOAD_STACK_GUARD &&
2514 MI.getOpcode() != AArch64::CATCHRET)
2517 MachineBasicBlock &
MBB = *
MI.getParent();
2519 auto TRI = Subtarget.getRegisterInfo();
2522 if (
MI.getOpcode() == AArch64::CATCHRET) {
2524 const TargetInstrInfo *
TII =
2526 MachineBasicBlock *TargetMBB =
MI.getOperand(0).getMBB();
2531 FirstEpilogSEH = std::prev(FirstEpilogSEH);
2533 FirstEpilogSEH = std::next(FirstEpilogSEH);
2548 if (
M.getStackProtectorGuard() ==
"sysreg") {
2549 const AArch64SysReg::SysReg *SrcReg =
2550 AArch64SysReg::lookupSysRegByName(
M.getStackProtectorGuardReg());
2558 int Offset =
M.getStackProtectorGuardOffset();
2609 const GlobalValue *GV =
2612 unsigned OpFlags = Subtarget.ClassifyGlobalReference(GV, TM);
2615 unsigned GuardWidth =
M.getStackProtectorGuardValueWidth().value_or(
2616 Subtarget.isTargetILP32() ? 4 : 8);
2617 if (GuardWidth != 4 && GuardWidth != 8)
2622 if (GuardWidth == 4) {
2623 unsigned Reg32 =
TRI->getSubReg(
Reg, AArch64::sub_32);
2637 if (GuardWidth == 4)
2671 if (GuardWidth == 4) {
2672 unsigned Reg32 =
TRI->getSubReg(
Reg, AArch64::sub_32);
2695 switch (
MI.getOpcode()) {
2698 case AArch64::MOVZWi:
2699 case AArch64::MOVZXi:
2700 if (
MI.getOperand(1).isImm() &&
MI.getOperand(1).getImm() == 0) {
2701 assert(
MI.getDesc().getNumOperands() == 3 &&
2702 MI.getOperand(2).getImm() == 0 &&
"invalid MOVZi operands");
2706 case AArch64::ANDWri:
2707 return MI.getOperand(1).getReg() == AArch64::WZR;
2708 case AArch64::ANDXri:
2709 return MI.getOperand(1).getReg() == AArch64::XZR;
2710 case TargetOpcode::COPY:
2711 return MI.getOperand(1).getReg() == AArch64::WZR;
2719 switch (
MI.getOpcode()) {
2722 case TargetOpcode::COPY: {
2725 return (AArch64::GPR32RegClass.
contains(DstReg) ||
2726 AArch64::GPR64RegClass.
contains(DstReg));
2728 case AArch64::ORRXrs:
2729 if (
MI.getOperand(1).getReg() == AArch64::XZR) {
2730 assert(
MI.getDesc().getNumOperands() == 4 &&
2731 MI.getOperand(3).getImm() == 0 &&
"invalid ORRrs operands");
2735 case AArch64::ADDXri:
2736 if (
MI.getOperand(2).getImm() == 0) {
2737 assert(
MI.getDesc().getNumOperands() == 4 &&
2738 MI.getOperand(3).getImm() == 0 &&
"invalid ADDXri operands");
2749 switch (
MI.getOpcode()) {
2752 case TargetOpcode::COPY: {
2754 return AArch64::FPR128RegClass.contains(DstReg);
2756 case AArch64::ORRv16i8:
2757 if (
MI.getOperand(1).getReg() ==
MI.getOperand(2).getReg()) {
2758 assert(
MI.getDesc().getNumOperands() == 3 &&
MI.getOperand(0).isReg() &&
2759 "invalid ORRv16i8 operands");
2771 case AArch64::LDRWui:
2772 case AArch64::LDRXui:
2773 case AArch64::LDRBui:
2774 case AArch64::LDRHui:
2775 case AArch64::LDRSui:
2776 case AArch64::LDRDui:
2777 case AArch64::LDRQui:
2778 case AArch64::LDR_PXI:
2784 int &FrameIndex)
const {
2788 if (
MI.getOperand(0).getSubReg() == 0 &&
MI.getOperand(1).isFI() &&
2789 MI.getOperand(2).isImm() &&
MI.getOperand(2).getImm() == 0) {
2790 FrameIndex =
MI.getOperand(1).getIndex();
2791 return MI.getOperand(0).getReg();
2800 case AArch64::STRWui:
2801 case AArch64::STRXui:
2802 case AArch64::STRBui:
2803 case AArch64::STRHui:
2804 case AArch64::STRSui:
2805 case AArch64::STRDui:
2806 case AArch64::STRQui:
2807 case AArch64::STR_PXI:
2813 int &FrameIndex)
const {
2817 if (
MI.getOperand(0).getSubReg() == 0 &&
MI.getOperand(1).isFI() &&
2818 MI.getOperand(2).isImm() &&
MI.getOperand(2).getImm() == 0) {
2819 FrameIndex =
MI.getOperand(1).getIndex();
2820 return MI.getOperand(0).getReg();
2826 int &FrameIndex)
const {
2841 return MI.getOperand(0).getReg();
2847 int &FrameIndex)
const {
2862 return MI.getOperand(0).getReg();
2870 return MMO->getFlags() & MOSuppressPair;
2876 if (
MI.memoperands_empty())
2884 return MMO->getFlags() & MOStridedAccess;
2892 case AArch64::STURSi:
2893 case AArch64::STRSpre:
2894 case AArch64::STURDi:
2895 case AArch64::STRDpre:
2896 case AArch64::STURQi:
2897 case AArch64::STRQpre:
2898 case AArch64::STURBBi:
2899 case AArch64::STURHHi:
2900 case AArch64::STURWi:
2901 case AArch64::STRWpre:
2902 case AArch64::STURXi:
2903 case AArch64::STRXpre:
2904 case AArch64::LDURSi:
2905 case AArch64::LDRSpre:
2906 case AArch64::LDURDi:
2907 case AArch64::LDRDpre:
2908 case AArch64::LDURQi:
2909 case AArch64::LDRQpre:
2910 case AArch64::LDURWi:
2911 case AArch64::LDRWpre:
2912 case AArch64::LDURXi:
2913 case AArch64::LDRXpre:
2914 case AArch64::LDRSWpre:
2915 case AArch64::LDURSWi:
2916 case AArch64::LDURHHi:
2917 case AArch64::LDURBBi:
2918 case AArch64::LDURSBWi:
2919 case AArch64::LDURSHWi:
2927 case AArch64::PRFMui:
return AArch64::PRFUMi;
2928 case AArch64::LDRXui:
return AArch64::LDURXi;
2929 case AArch64::LDRWui:
return AArch64::LDURWi;
2930 case AArch64::LDRBui:
return AArch64::LDURBi;
2931 case AArch64::LDRHui:
return AArch64::LDURHi;
2932 case AArch64::LDRSui:
return AArch64::LDURSi;
2933 case AArch64::LDRDui:
return AArch64::LDURDi;
2934 case AArch64::LDRQui:
return AArch64::LDURQi;
2935 case AArch64::LDRBBui:
return AArch64::LDURBBi;
2936 case AArch64::LDRHHui:
return AArch64::LDURHHi;
2937 case AArch64::LDRSBXui:
return AArch64::LDURSBXi;
2938 case AArch64::LDRSBWui:
return AArch64::LDURSBWi;
2939 case AArch64::LDRSHXui:
return AArch64::LDURSHXi;
2940 case AArch64::LDRSHWui:
return AArch64::LDURSHWi;
2941 case AArch64::LDRSWui:
return AArch64::LDURSWi;
2942 case AArch64::STRXui:
return AArch64::STURXi;
2943 case AArch64::STRWui:
return AArch64::STURWi;
2944 case AArch64::STRBui:
return AArch64::STURBi;
2945 case AArch64::STRHui:
return AArch64::STURHi;
2946 case AArch64::STRSui:
return AArch64::STURSi;
2947 case AArch64::STRDui:
return AArch64::STURDi;
2948 case AArch64::STRQui:
return AArch64::STURQi;
2949 case AArch64::STRBBui:
return AArch64::STURBBi;
2950 case AArch64::STRHHui:
return AArch64::STURHHi;
2959 case AArch64::LDAPURBi:
2960 case AArch64::LDAPURHi:
2961 case AArch64::LDAPURi:
2962 case AArch64::LDAPURSBWi:
2963 case AArch64::LDAPURSBXi:
2964 case AArch64::LDAPURSHWi:
2965 case AArch64::LDAPURSHXi:
2966 case AArch64::LDAPURSWi:
2967 case AArch64::LDAPURXi:
2968 case AArch64::LDR_PPXI:
2969 case AArch64::LDR_PXI:
2970 case AArch64::LDR_ZXI:
2971 case AArch64::LDR_ZZXI:
2972 case AArch64::LDR_ZZXI_STRIDED_CONTIGUOUS:
2973 case AArch64::LDR_ZZZXI:
2974 case AArch64::LDR_ZZZZXI:
2975 case AArch64::LDR_ZZZZXI_STRIDED_CONTIGUOUS:
2976 case AArch64::LDRBBui:
2977 case AArch64::LDRBui:
2978 case AArch64::LDRDui:
2979 case AArch64::LDRHHui:
2980 case AArch64::LDRHui:
2981 case AArch64::LDRQui:
2982 case AArch64::LDRSBWui:
2983 case AArch64::LDRSBXui:
2984 case AArch64::LDRSHWui:
2985 case AArch64::LDRSHXui:
2986 case AArch64::LDRSui:
2987 case AArch64::LDRSWui:
2988 case AArch64::LDRWui:
2989 case AArch64::LDRXui:
2990 case AArch64::LDURBBi:
2991 case AArch64::LDURBi:
2992 case AArch64::LDURDi:
2993 case AArch64::LDURHHi:
2994 case AArch64::LDURHi:
2995 case AArch64::LDURQi:
2996 case AArch64::LDURSBWi:
2997 case AArch64::LDURSBXi:
2998 case AArch64::LDURSHWi:
2999 case AArch64::LDURSHXi:
3000 case AArch64::LDURSi:
3001 case AArch64::LDURSWi:
3002 case AArch64::LDURWi:
3003 case AArch64::LDURXi:
3004 case AArch64::PRFMui:
3005 case AArch64::PRFUMi:
3006 case AArch64::ST2Gi:
3008 case AArch64::STLURBi:
3009 case AArch64::STLURHi:
3010 case AArch64::STLURWi:
3011 case AArch64::STLURXi:
3012 case AArch64::StoreSwiftAsyncContext:
3013 case AArch64::STR_PPXI:
3014 case AArch64::STR_PXI:
3015 case AArch64::STR_ZXI:
3016 case AArch64::STR_ZZXI:
3017 case AArch64::STR_ZZXI_STRIDED_CONTIGUOUS:
3018 case AArch64::STR_ZZZXI:
3019 case AArch64::STR_ZZZZXI:
3020 case AArch64::STR_ZZZZXI_STRIDED_CONTIGUOUS:
3021 case AArch64::STRBBui:
3022 case AArch64::STRBui:
3023 case AArch64::STRDui:
3024 case AArch64::STRHHui:
3025 case AArch64::STRHui:
3026 case AArch64::STRQui:
3027 case AArch64::STRSui:
3028 case AArch64::STRWui:
3029 case AArch64::STRXui:
3030 case AArch64::STURBBi:
3031 case AArch64::STURBi:
3032 case AArch64::STURDi:
3033 case AArch64::STURHHi:
3034 case AArch64::STURHi:
3035 case AArch64::STURQi:
3036 case AArch64::STURSi:
3037 case AArch64::STURWi:
3038 case AArch64::STURXi:
3039 case AArch64::STZ2Gi:
3040 case AArch64::STZGi:
3041 case AArch64::TAGPstack:
3043 case AArch64::LD1B_D_IMM:
3044 case AArch64::LD1B_H_IMM:
3045 case AArch64::LD1B_IMM:
3046 case AArch64::LD1B_S_IMM:
3047 case AArch64::LD1D_IMM:
3048 case AArch64::LD1H_D_IMM:
3049 case AArch64::LD1H_IMM:
3050 case AArch64::LD1H_S_IMM:
3051 case AArch64::LD1RB_D_IMM:
3052 case AArch64::LD1RB_H_IMM:
3053 case AArch64::LD1RB_IMM:
3054 case AArch64::LD1RB_S_IMM:
3055 case AArch64::LD1RD_IMM:
3056 case AArch64::LD1RH_D_IMM:
3057 case AArch64::LD1RH_IMM:
3058 case AArch64::LD1RH_S_IMM:
3059 case AArch64::LD1RSB_D_IMM:
3060 case AArch64::LD1RSB_H_IMM:
3061 case AArch64::LD1RSB_S_IMM:
3062 case AArch64::LD1RSH_D_IMM:
3063 case AArch64::LD1RSH_S_IMM:
3064 case AArch64::LD1RSW_IMM:
3065 case AArch64::LD1RW_D_IMM:
3066 case AArch64::LD1RW_IMM:
3067 case AArch64::LD1SB_D_IMM:
3068 case AArch64::LD1SB_H_IMM:
3069 case AArch64::LD1SB_S_IMM:
3070 case AArch64::LD1SH_D_IMM:
3071 case AArch64::LD1SH_S_IMM:
3072 case AArch64::LD1SW_D_IMM:
3073 case AArch64::LD1W_D_IMM:
3074 case AArch64::LD1W_IMM:
3075 case AArch64::LD2B_IMM:
3076 case AArch64::LD2D_IMM:
3077 case AArch64::LD2H_IMM:
3078 case AArch64::LD2W_IMM:
3079 case AArch64::LD3B_IMM:
3080 case AArch64::LD3D_IMM:
3081 case AArch64::LD3H_IMM:
3082 case AArch64::LD3W_IMM:
3083 case AArch64::LD4B_IMM:
3084 case AArch64::LD4D_IMM:
3085 case AArch64::LD4H_IMM:
3086 case AArch64::LD4W_IMM:
3088 case AArch64::LDNF1B_D_IMM:
3089 case AArch64::LDNF1B_H_IMM:
3090 case AArch64::LDNF1B_IMM:
3091 case AArch64::LDNF1B_S_IMM:
3092 case AArch64::LDNF1D_IMM:
3093 case AArch64::LDNF1H_D_IMM:
3094 case AArch64::LDNF1H_IMM:
3095 case AArch64::LDNF1H_S_IMM:
3096 case AArch64::LDNF1SB_D_IMM:
3097 case AArch64::LDNF1SB_H_IMM:
3098 case AArch64::LDNF1SB_S_IMM:
3099 case AArch64::LDNF1SH_D_IMM:
3100 case AArch64::LDNF1SH_S_IMM:
3101 case AArch64::LDNF1SW_D_IMM:
3102 case AArch64::LDNF1W_D_IMM:
3103 case AArch64::LDNF1W_IMM:
3104 case AArch64::LDNPDi:
3105 case AArch64::LDNPQi:
3106 case AArch64::LDNPSi:
3107 case AArch64::LDNPWi:
3108 case AArch64::LDNPXi:
3109 case AArch64::LDNT1B_ZRI:
3110 case AArch64::LDNT1D_ZRI:
3111 case AArch64::LDNT1H_ZRI:
3112 case AArch64::LDNT1W_ZRI:
3113 case AArch64::LDPDi:
3114 case AArch64::LDPQi:
3115 case AArch64::LDPSi:
3116 case AArch64::LDPWi:
3117 case AArch64::LDPXi:
3118 case AArch64::LDRBBpost:
3119 case AArch64::LDRBBpre:
3120 case AArch64::LDRBpost:
3121 case AArch64::LDRBpre:
3122 case AArch64::LDRDpost:
3123 case AArch64::LDRDpre:
3124 case AArch64::LDRHHpost:
3125 case AArch64::LDRHHpre:
3126 case AArch64::LDRHpost:
3127 case AArch64::LDRHpre:
3128 case AArch64::LDRQpost:
3129 case AArch64::LDRQpre:
3130 case AArch64::LDRSpost:
3131 case AArch64::LDRSpre:
3132 case AArch64::LDRWpost:
3133 case AArch64::LDRWpre:
3134 case AArch64::LDRXpost:
3135 case AArch64::LDRXpre:
3136 case AArch64::ST1B_D_IMM:
3137 case AArch64::ST1B_H_IMM:
3138 case AArch64::ST1B_IMM:
3139 case AArch64::ST1B_S_IMM:
3140 case AArch64::ST1D_IMM:
3141 case AArch64::ST1H_D_IMM:
3142 case AArch64::ST1H_IMM:
3143 case AArch64::ST1H_S_IMM:
3144 case AArch64::ST1W_D_IMM:
3145 case AArch64::ST1W_IMM:
3146 case AArch64::ST2B_IMM:
3147 case AArch64::ST2D_IMM:
3148 case AArch64::ST2H_IMM:
3149 case AArch64::ST2W_IMM:
3150 case AArch64::ST3B_IMM:
3151 case AArch64::ST3D_IMM:
3152 case AArch64::ST3H_IMM:
3153 case AArch64::ST3W_IMM:
3154 case AArch64::ST4B_IMM:
3155 case AArch64::ST4D_IMM:
3156 case AArch64::ST4H_IMM:
3157 case AArch64::ST4W_IMM:
3158 case AArch64::STGPi:
3159 case AArch64::STGPreIndex:
3160 case AArch64::STZGPreIndex:
3161 case AArch64::ST2GPreIndex:
3162 case AArch64::STZ2GPreIndex:
3163 case AArch64::STGPostIndex:
3164 case AArch64::STZGPostIndex:
3165 case AArch64::ST2GPostIndex:
3166 case AArch64::STZ2GPostIndex:
3167 case AArch64::STNPDi:
3168 case AArch64::STNPQi:
3169 case AArch64::STNPSi:
3170 case AArch64::STNPWi:
3171 case AArch64::STNPXi:
3172 case AArch64::STNT1B_ZRI:
3173 case AArch64::STNT1D_ZRI:
3174 case AArch64::STNT1H_ZRI:
3175 case AArch64::STNT1W_ZRI:
3176 case AArch64::STPDi:
3177 case AArch64::STPQi:
3178 case AArch64::STPSi:
3179 case AArch64::STPWi:
3180 case AArch64::STPXi:
3181 case AArch64::STRBBpost:
3182 case AArch64::STRBBpre:
3183 case AArch64::STRBpost:
3184 case AArch64::STRBpre:
3185 case AArch64::STRDpost:
3186 case AArch64::STRDpre:
3187 case AArch64::STRHHpost:
3188 case AArch64::STRHHpre:
3189 case AArch64::STRHpost:
3190 case AArch64::STRHpre:
3191 case AArch64::STRQpost:
3192 case AArch64::STRQpre:
3193 case AArch64::STRSpost:
3194 case AArch64::STRSpre:
3195 case AArch64::STRWpost:
3196 case AArch64::STRWpre:
3197 case AArch64::STRXpost:
3198 case AArch64::STRXpre:
3199 case AArch64::LD1B_2Z_IMM:
3200 case AArch64::LD1B_2Z_STRIDED_IMM:
3201 case AArch64::LD1H_2Z_IMM:
3202 case AArch64::LD1H_2Z_STRIDED_IMM:
3203 case AArch64::LD1W_2Z_IMM:
3204 case AArch64::LD1W_2Z_STRIDED_IMM:
3205 case AArch64::LD1D_2Z_IMM:
3206 case AArch64::LD1D_2Z_STRIDED_IMM:
3207 case AArch64::LD1B_4Z_IMM:
3208 case AArch64::LD1B_4Z_STRIDED_IMM:
3209 case AArch64::LD1H_4Z_IMM:
3210 case AArch64::LD1H_4Z_STRIDED_IMM:
3211 case AArch64::LD1W_4Z_IMM:
3212 case AArch64::LD1W_4Z_STRIDED_IMM:
3213 case AArch64::LD1D_4Z_IMM:
3214 case AArch64::LD1D_4Z_STRIDED_IMM:
3215 case AArch64::LD1B_2Z_IMM_PSEUDO:
3216 case AArch64::LD1H_2Z_IMM_PSEUDO:
3217 case AArch64::LD1W_2Z_IMM_PSEUDO:
3218 case AArch64::LD1D_2Z_IMM_PSEUDO:
3219 case AArch64::LD1B_4Z_IMM_PSEUDO:
3220 case AArch64::LD1H_4Z_IMM_PSEUDO:
3221 case AArch64::LD1W_4Z_IMM_PSEUDO:
3222 case AArch64::LD1D_4Z_IMM_PSEUDO:
3223 case AArch64::ST1B_2Z_IMM:
3224 case AArch64::ST1B_2Z_STRIDED_IMM:
3225 case AArch64::ST1H_2Z_IMM:
3226 case AArch64::ST1H_2Z_STRIDED_IMM:
3227 case AArch64::ST1W_2Z_IMM:
3228 case AArch64::ST1W_2Z_STRIDED_IMM:
3229 case AArch64::ST1D_2Z_IMM:
3230 case AArch64::ST1D_2Z_STRIDED_IMM:
3231 case AArch64::LDNT1B_2Z_IMM_PSEUDO:
3232 case AArch64::LDNT1B_2Z_IMM:
3233 case AArch64::LDNT1B_2Z_STRIDED_IMM:
3234 case AArch64::LDNT1H_2Z_IMM_PSEUDO:
3235 case AArch64::LDNT1H_2Z_IMM:
3236 case AArch64::LDNT1H_2Z_STRIDED_IMM:
3237 case AArch64::LDNT1W_2Z_IMM_PSEUDO:
3238 case AArch64::LDNT1W_2Z_IMM:
3239 case AArch64::LDNT1W_2Z_STRIDED_IMM:
3240 case AArch64::LDNT1D_2Z_IMM_PSEUDO:
3241 case AArch64::LDNT1D_2Z_IMM:
3242 case AArch64::LDNT1D_2Z_STRIDED_IMM:
3243 case AArch64::STNT1B_2Z_IMM:
3244 case AArch64::STNT1B_2Z_STRIDED_IMM:
3245 case AArch64::STNT1H_2Z_IMM:
3246 case AArch64::STNT1H_2Z_STRIDED_IMM:
3247 case AArch64::STNT1W_2Z_IMM:
3248 case AArch64::STNT1W_2Z_STRIDED_IMM:
3249 case AArch64::STNT1D_2Z_IMM:
3250 case AArch64::STNT1D_2Z_STRIDED_IMM:
3251 case AArch64::ST1B_4Z_IMM:
3252 case AArch64::ST1B_4Z_STRIDED_IMM:
3253 case AArch64::ST1H_4Z_IMM:
3254 case AArch64::ST1H_4Z_STRIDED_IMM:
3255 case AArch64::ST1W_4Z_IMM:
3256 case AArch64::ST1W_4Z_STRIDED_IMM:
3257 case AArch64::ST1D_4Z_IMM:
3258 case AArch64::ST1D_4Z_STRIDED_IMM:
3259 case AArch64::LDNT1B_4Z_IMM_PSEUDO:
3260 case AArch64::LDNT1B_4Z_IMM:
3261 case AArch64::LDNT1B_4Z_STRIDED_IMM:
3262 case AArch64::LDNT1H_4Z_IMM_PSEUDO:
3263 case AArch64::LDNT1H_4Z_IMM:
3264 case AArch64::LDNT1H_4Z_STRIDED_IMM:
3265 case AArch64::LDNT1W_4Z_IMM_PSEUDO:
3266 case AArch64::LDNT1W_4Z_IMM:
3267 case AArch64::LDNT1W_4Z_STRIDED_IMM:
3268 case AArch64::LDNT1D_4Z_IMM_PSEUDO:
3269 case AArch64::LDNT1D_4Z_IMM:
3270 case AArch64::LDNT1D_4Z_STRIDED_IMM:
3271 case AArch64::STNT1B_4Z_IMM:
3272 case AArch64::STNT1B_4Z_STRIDED_IMM:
3273 case AArch64::STNT1H_4Z_IMM:
3274 case AArch64::STNT1H_4Z_STRIDED_IMM:
3275 case AArch64::STNT1W_4Z_IMM:
3276 case AArch64::STNT1W_4Z_STRIDED_IMM:
3277 case AArch64::STNT1D_4Z_IMM:
3278 case AArch64::STNT1D_4Z_STRIDED_IMM:
3280 case AArch64::LDPDpost:
3281 case AArch64::LDPDpre:
3282 case AArch64::LDPQpost:
3283 case AArch64::LDPQpre:
3284 case AArch64::LDPSpost:
3285 case AArch64::LDPSpre:
3286 case AArch64::LDPWpost:
3287 case AArch64::LDPWpre:
3288 case AArch64::LDPXpost:
3289 case AArch64::LDPXpre:
3290 case AArch64::STGPpre:
3291 case AArch64::STGPpost:
3292 case AArch64::STPDpost:
3293 case AArch64::STPDpre:
3294 case AArch64::STPQpost:
3295 case AArch64::STPQpre:
3296 case AArch64::STPSpost:
3297 case AArch64::STPSpre:
3298 case AArch64::STPWpost:
3299 case AArch64::STPWpre:
3300 case AArch64::STPXpost:
3301 case AArch64::STPXpre:
3307 switch (
MI.getOpcode()) {
3311 case AArch64::STRSui:
3312 case AArch64::STRDui:
3313 case AArch64::STRQui:
3314 case AArch64::STRXui:
3315 case AArch64::STRWui:
3316 case AArch64::LDRSui:
3317 case AArch64::LDRDui:
3318 case AArch64::LDRQui:
3319 case AArch64::LDRXui:
3320 case AArch64::LDRWui:
3321 case AArch64::LDRSWui:
3323 case AArch64::STURSi:
3324 case AArch64::STRSpre:
3325 case AArch64::STURDi:
3326 case AArch64::STRDpre:
3327 case AArch64::STURQi:
3328 case AArch64::STRQpre:
3329 case AArch64::STURWi:
3330 case AArch64::STRWpre:
3331 case AArch64::STURXi:
3332 case AArch64::STRXpre:
3333 case AArch64::LDURSi:
3334 case AArch64::LDRSpre:
3335 case AArch64::LDURDi:
3336 case AArch64::LDRDpre:
3337 case AArch64::LDURQi:
3338 case AArch64::LDRQpre:
3339 case AArch64::LDURWi:
3340 case AArch64::LDRWpre:
3341 case AArch64::LDURXi:
3342 case AArch64::LDRXpre:
3343 case AArch64::LDURSWi:
3344 case AArch64::LDRSWpre:
3346 case AArch64::LDR_ZXI:
3347 case AArch64::STR_ZXI:
3353 switch (
MI.getOpcode()) {
3356 "Unexpected instruction - was a new tail call opcode introduced?");
3358 case AArch64::TCRETURNdi:
3359 case AArch64::TCRETURNri:
3360 case AArch64::TCRETURNrix16x17:
3361 case AArch64::TCRETURNrix17:
3362 case AArch64::TCRETURNrinotx16:
3363 case AArch64::TCRETURNriALL:
3364 case AArch64::AUTH_TCRETURN:
3365 case AArch64::AUTH_TCRETURN_BTI:
3375 case AArch64::ADDWri:
3376 return AArch64::ADDSWri;
3377 case AArch64::ADDWrr:
3378 return AArch64::ADDSWrr;
3379 case AArch64::ADDWrs:
3380 return AArch64::ADDSWrs;
3381 case AArch64::ADDWrx:
3382 return AArch64::ADDSWrx;
3383 case AArch64::ANDWri:
3384 return AArch64::ANDSWri;
3385 case AArch64::ANDWrr:
3386 return AArch64::ANDSWrr;
3387 case AArch64::ANDWrs:
3388 return AArch64::ANDSWrs;
3389 case AArch64::BICWrr:
3390 return AArch64::BICSWrr;
3391 case AArch64::BICWrs:
3392 return AArch64::BICSWrs;
3393 case AArch64::SUBWri:
3394 return AArch64::SUBSWri;
3395 case AArch64::SUBWrr:
3396 return AArch64::SUBSWrr;
3397 case AArch64::SUBWrs:
3398 return AArch64::SUBSWrs;
3399 case AArch64::SUBWrx:
3400 return AArch64::SUBSWrx;
3402 case AArch64::ADDXri:
3403 return AArch64::ADDSXri;
3404 case AArch64::ADDXrr:
3405 return AArch64::ADDSXrr;
3406 case AArch64::ADDXrs:
3407 return AArch64::ADDSXrs;
3408 case AArch64::ADDXrx:
3409 return AArch64::ADDSXrx;
3410 case AArch64::ANDXri:
3411 return AArch64::ANDSXri;
3412 case AArch64::ANDXrr:
3413 return AArch64::ANDSXrr;
3414 case AArch64::ANDXrs:
3415 return AArch64::ANDSXrs;
3416 case AArch64::BICXrr:
3417 return AArch64::BICSXrr;
3418 case AArch64::BICXrs:
3419 return AArch64::BICSXrs;
3420 case AArch64::SUBXri:
3421 return AArch64::SUBSXri;
3422 case AArch64::SUBXrr:
3423 return AArch64::SUBSXrr;
3424 case AArch64::SUBXrs:
3425 return AArch64::SUBSXrs;
3426 case AArch64::SUBXrx:
3427 return AArch64::SUBSXrx;
3429 case AArch64::AND_PPzPP:
3430 return AArch64::ANDS_PPzPP;
3431 case AArch64::BIC_PPzPP:
3432 return AArch64::BICS_PPzPP;
3433 case AArch64::EOR_PPzPP:
3434 return AArch64::EORS_PPzPP;
3435 case AArch64::NAND_PPzPP:
3436 return AArch64::NANDS_PPzPP;
3437 case AArch64::NOR_PPzPP:
3438 return AArch64::NORS_PPzPP;
3439 case AArch64::ORN_PPzPP:
3440 return AArch64::ORNS_PPzPP;
3441 case AArch64::ORR_PPzPP:
3442 return AArch64::ORRS_PPzPP;
3443 case AArch64::BRKA_PPzP:
3444 return AArch64::BRKAS_PPzP;
3445 case AArch64::BRKPA_PPzPP:
3446 return AArch64::BRKPAS_PPzPP;
3447 case AArch64::BRKB_PPzP:
3448 return AArch64::BRKBS_PPzP;
3449 case AArch64::BRKPB_PPzPP:
3450 return AArch64::BRKPBS_PPzPP;
3451 case AArch64::BRKN_PPzP:
3452 return AArch64::BRKNS_PPzP;
3453 case AArch64::RDFFR_PPz:
3454 return AArch64::RDFFRS_PPz;
3455 case AArch64::PTRUE_B:
3456 return AArch64::PTRUES_B;
3467 if (
MI.hasOrderedMemoryRef())
3472 assert((
MI.getOperand(IsPreLdSt ? 2 : 1).isReg() ||
3473 MI.getOperand(IsPreLdSt ? 2 : 1).isFI()) &&
3474 "Expected a reg or frame index operand.");
3478 bool IsImmPreLdSt = IsPreLdSt &&
MI.getOperand(3).isImm();
3480 if (!
MI.getOperand(2).isImm() && !IsImmPreLdSt)
3493 if (
MI.getOperand(1).isReg() && !IsPreLdSt) {
3494 Register BaseReg =
MI.getOperand(1).getReg();
3496 if (
MI.modifiesRegister(BaseReg,
TRI))
3502 switch (
MI.getOpcode()) {
3505 case AArch64::LDR_ZXI:
3506 case AArch64::STR_ZXI:
3507 if (!Subtarget.isLittleEndian() ||
3508 Subtarget.getSVEVectorSizeInBits() != 128)
3521 const MCAsmInfo &MAI =
MI.getMF()->getTarget().getMCAsmInfo();
3529 if (Subtarget.isPaired128Slow()) {
3530 switch (
MI.getOpcode()) {
3533 case AArch64::LDURQi:
3534 case AArch64::STURQi:
3535 case AArch64::LDRQui:
3536 case AArch64::STRQui:
3563std::optional<ExtAddrMode>
3568 bool OffsetIsScalable;
3569 if (!getMemOperandWithOffset(MemI,
Base,
Offset, OffsetIsScalable,
TRI))
3570 return std::nullopt;
3573 return std::nullopt;
3588 int64_t OffsetScale = 1;
3593 case AArch64::LDURQi:
3594 case AArch64::STURQi:
3598 case AArch64::LDURDi:
3599 case AArch64::STURDi:
3600 case AArch64::LDURXi:
3601 case AArch64::STURXi:
3605 case AArch64::LDURWi:
3606 case AArch64::LDURSWi:
3607 case AArch64::STURWi:
3611 case AArch64::LDURHi:
3612 case AArch64::STURHi:
3613 case AArch64::LDURHHi:
3614 case AArch64::STURHHi:
3615 case AArch64::LDURSHXi:
3616 case AArch64::LDURSHWi:
3620 case AArch64::LDRBroX:
3621 case AArch64::LDRBBroX:
3622 case AArch64::LDRSBXroX:
3623 case AArch64::LDRSBWroX:
3624 case AArch64::STRBroX:
3625 case AArch64::STRBBroX:
3626 case AArch64::LDURBi:
3627 case AArch64::LDURBBi:
3628 case AArch64::LDURSBXi:
3629 case AArch64::LDURSBWi:
3630 case AArch64::STURBi:
3631 case AArch64::STURBBi:
3632 case AArch64::LDRBui:
3633 case AArch64::LDRBBui:
3634 case AArch64::LDRSBXui:
3635 case AArch64::LDRSBWui:
3636 case AArch64::STRBui:
3637 case AArch64::STRBBui:
3641 case AArch64::LDRQroX:
3642 case AArch64::STRQroX:
3643 case AArch64::LDRQui:
3644 case AArch64::STRQui:
3649 case AArch64::LDRDroX:
3650 case AArch64::STRDroX:
3651 case AArch64::LDRXroX:
3652 case AArch64::STRXroX:
3653 case AArch64::LDRDui:
3654 case AArch64::STRDui:
3655 case AArch64::LDRXui:
3656 case AArch64::STRXui:
3661 case AArch64::LDRWroX:
3662 case AArch64::LDRSWroX:
3663 case AArch64::STRWroX:
3664 case AArch64::LDRWui:
3665 case AArch64::LDRSWui:
3666 case AArch64::STRWui:
3671 case AArch64::LDRHroX:
3672 case AArch64::STRHroX:
3673 case AArch64::LDRHHroX:
3674 case AArch64::STRHHroX:
3675 case AArch64::LDRSHXroX:
3676 case AArch64::LDRSHWroX:
3677 case AArch64::LDRHui:
3678 case AArch64::STRHui:
3679 case AArch64::LDRHHui:
3680 case AArch64::STRHHui:
3681 case AArch64::LDRSHXui:
3682 case AArch64::LDRSHWui:
3690 if (BaseRegOp.
isReg() && BaseRegOp.
getReg() == Reg)
3714 case AArch64::SBFMXri:
3727 AM.
Scale = OffsetScale;
3732 case TargetOpcode::SUBREG_TO_REG: {
3748 if (
DefMI.getOpcode() != AArch64::ORRWrs ||
3749 DefMI.getOperand(1).getReg() != AArch64::WZR ||
3750 DefMI.getOperand(3).getImm() != 0)
3757 AM.
Scale = OffsetScale;
3768 auto validateOffsetForLDP = [](
unsigned NumBytes, int64_t OldOffset,
3769 int64_t NewOffset) ->
bool {
3770 int64_t MinOffset, MaxOffset;
3787 return OldOffset < MinOffset || OldOffset > MaxOffset ||
3788 (NewOffset >= MinOffset && NewOffset <= MaxOffset);
3790 auto canFoldAddSubImmIntoAddrMode = [&](int64_t Disp) ->
bool {
3792 int64_t NewOffset = OldOffset + Disp;
3793 if (!isLegalAddressingMode(NumBytes, NewOffset, 0))
3797 if (!validateOffsetForLDP(NumBytes, OldOffset, NewOffset))
3807 auto canFoldAddRegIntoAddrMode =
3812 if ((
unsigned)Scale != Scale)
3814 if (!isLegalAddressingMode(NumBytes, 0, Scale))
3826 return (Opcode == AArch64::STURQi || Opcode == AArch64::STRQui) &&
3827 Subtarget.isSTRQroSlow();
3836 case AArch64::ADDXri:
3842 return canFoldAddSubImmIntoAddrMode(Disp);
3844 case AArch64::SUBXri:
3850 return canFoldAddSubImmIntoAddrMode(-Disp);
3852 case AArch64::ADDXrs: {
3865 if (Shift != 2 && Shift != 3 && Subtarget.hasAddrLSLSlow14())
3867 if (avoidSlowSTRQ(MemI))
3870 return canFoldAddRegIntoAddrMode(1ULL << Shift);
3873 case AArch64::ADDXrr:
3881 if (!OptSize && avoidSlowSTRQ(MemI))
3883 return canFoldAddRegIntoAddrMode(1);
3885 case AArch64::ADDXrx:
3893 if (!OptSize && avoidSlowSTRQ(MemI))
3902 return canFoldAddRegIntoAddrMode(
3917 case AArch64::LDURQi:
3918 case AArch64::LDRQui:
3919 return AArch64::LDRQroX;
3920 case AArch64::STURQi:
3921 case AArch64::STRQui:
3922 return AArch64::STRQroX;
3923 case AArch64::LDURDi:
3924 case AArch64::LDRDui:
3925 return AArch64::LDRDroX;
3926 case AArch64::STURDi:
3927 case AArch64::STRDui:
3928 return AArch64::STRDroX;
3929 case AArch64::LDURXi:
3930 case AArch64::LDRXui:
3931 return AArch64::LDRXroX;
3932 case AArch64::STURXi:
3933 case AArch64::STRXui:
3934 return AArch64::STRXroX;
3935 case AArch64::LDURWi:
3936 case AArch64::LDRWui:
3937 return AArch64::LDRWroX;
3938 case AArch64::LDURSWi:
3939 case AArch64::LDRSWui:
3940 return AArch64::LDRSWroX;
3941 case AArch64::STURWi:
3942 case AArch64::STRWui:
3943 return AArch64::STRWroX;
3944 case AArch64::LDURHi:
3945 case AArch64::LDRHui:
3946 return AArch64::LDRHroX;
3947 case AArch64::STURHi:
3948 case AArch64::STRHui:
3949 return AArch64::STRHroX;
3950 case AArch64::LDURHHi:
3951 case AArch64::LDRHHui:
3952 return AArch64::LDRHHroX;
3953 case AArch64::STURHHi:
3954 case AArch64::STRHHui:
3955 return AArch64::STRHHroX;
3956 case AArch64::LDURSHXi:
3957 case AArch64::LDRSHXui:
3958 return AArch64::LDRSHXroX;
3959 case AArch64::LDURSHWi:
3960 case AArch64::LDRSHWui:
3961 return AArch64::LDRSHWroX;
3962 case AArch64::LDURBi:
3963 case AArch64::LDRBui:
3964 return AArch64::LDRBroX;
3965 case AArch64::LDURBBi:
3966 case AArch64::LDRBBui:
3967 return AArch64::LDRBBroX;
3968 case AArch64::LDURSBXi:
3969 case AArch64::LDRSBXui:
3970 return AArch64::LDRSBXroX;
3971 case AArch64::LDURSBWi:
3972 case AArch64::LDRSBWui:
3973 return AArch64::LDRSBWroX;
3974 case AArch64::STURBi:
3975 case AArch64::STRBui:
3976 return AArch64::STRBroX;
3977 case AArch64::STURBBi:
3978 case AArch64::STRBBui:
3979 return AArch64::STRBBroX;
3991 case AArch64::LDURQi:
3993 return AArch64::LDRQui;
3994 case AArch64::STURQi:
3996 return AArch64::STRQui;
3997 case AArch64::LDURDi:
3999 return AArch64::LDRDui;
4000 case AArch64::STURDi:
4002 return AArch64::STRDui;
4003 case AArch64::LDURXi:
4005 return AArch64::LDRXui;
4006 case AArch64::STURXi:
4008 return AArch64::STRXui;
4009 case AArch64::LDURWi:
4011 return AArch64::LDRWui;
4012 case AArch64::LDURSWi:
4014 return AArch64::LDRSWui;
4015 case AArch64::STURWi:
4017 return AArch64::STRWui;
4018 case AArch64::LDURHi:
4020 return AArch64::LDRHui;
4021 case AArch64::STURHi:
4023 return AArch64::STRHui;
4024 case AArch64::LDURHHi:
4026 return AArch64::LDRHHui;
4027 case AArch64::STURHHi:
4029 return AArch64::STRHHui;
4030 case AArch64::LDURSHXi:
4032 return AArch64::LDRSHXui;
4033 case AArch64::LDURSHWi:
4035 return AArch64::LDRSHWui;
4036 case AArch64::LDURBi:
4038 return AArch64::LDRBui;
4039 case AArch64::LDURBBi:
4041 return AArch64::LDRBBui;
4042 case AArch64::LDURSBXi:
4044 return AArch64::LDRSBXui;
4045 case AArch64::LDURSBWi:
4047 return AArch64::LDRSBWui;
4048 case AArch64::STURBi:
4050 return AArch64::STRBui;
4051 case AArch64::STURBBi:
4053 return AArch64::STRBBui;
4054 case AArch64::LDRQui:
4055 case AArch64::STRQui:
4058 case AArch64::LDRDui:
4059 case AArch64::STRDui:
4060 case AArch64::LDRXui:
4061 case AArch64::STRXui:
4064 case AArch64::LDRWui:
4065 case AArch64::LDRSWui:
4066 case AArch64::STRWui:
4069 case AArch64::LDRHui:
4070 case AArch64::STRHui:
4071 case AArch64::LDRHHui:
4072 case AArch64::STRHHui:
4073 case AArch64::LDRSHXui:
4074 case AArch64::LDRSHWui:
4077 case AArch64::LDRBui:
4078 case AArch64::LDRBBui:
4079 case AArch64::LDRSBXui:
4080 case AArch64::LDRSBWui:
4081 case AArch64::STRBui:
4082 case AArch64::STRBBui:
4096 case AArch64::LDURQi:
4097 case AArch64::STURQi:
4098 case AArch64::LDURDi:
4099 case AArch64::STURDi:
4100 case AArch64::LDURXi:
4101 case AArch64::STURXi:
4102 case AArch64::LDURWi:
4103 case AArch64::LDURSWi:
4104 case AArch64::STURWi:
4105 case AArch64::LDURHi:
4106 case AArch64::STURHi:
4107 case AArch64::LDURHHi:
4108 case AArch64::STURHHi:
4109 case AArch64::LDURSHXi:
4110 case AArch64::LDURSHWi:
4111 case AArch64::LDURBi:
4112 case AArch64::STURBi:
4113 case AArch64::LDURBBi:
4114 case AArch64::STURBBi:
4115 case AArch64::LDURSBWi:
4116 case AArch64::LDURSBXi:
4118 case AArch64::LDRQui:
4119 return AArch64::LDURQi;
4120 case AArch64::STRQui:
4121 return AArch64::STURQi;
4122 case AArch64::LDRDui:
4123 return AArch64::LDURDi;
4124 case AArch64::STRDui:
4125 return AArch64::STURDi;
4126 case AArch64::LDRXui:
4127 return AArch64::LDURXi;
4128 case AArch64::STRXui:
4129 return AArch64::STURXi;
4130 case AArch64::LDRWui:
4131 return AArch64::LDURWi;
4132 case AArch64::LDRSWui:
4133 return AArch64::LDURSWi;
4134 case AArch64::STRWui:
4135 return AArch64::STURWi;
4136 case AArch64::LDRHui:
4137 return AArch64::LDURHi;
4138 case AArch64::STRHui:
4139 return AArch64::STURHi;
4140 case AArch64::LDRHHui:
4141 return AArch64::LDURHHi;
4142 case AArch64::STRHHui:
4143 return AArch64::STURHHi;
4144 case AArch64::LDRSHXui:
4145 return AArch64::LDURSHXi;
4146 case AArch64::LDRSHWui:
4147 return AArch64::LDURSHWi;
4148 case AArch64::LDRBBui:
4149 return AArch64::LDURBBi;
4150 case AArch64::LDRBui:
4151 return AArch64::LDURBi;
4152 case AArch64::STRBBui:
4153 return AArch64::STURBBi;
4154 case AArch64::STRBui:
4155 return AArch64::STURBi;
4156 case AArch64::LDRSBWui:
4157 return AArch64::LDURSBWi;
4158 case AArch64::LDRSBXui:
4159 return AArch64::LDURSBXi;
4172 case AArch64::LDRQroX:
4173 case AArch64::LDURQi:
4174 case AArch64::LDRQui:
4175 return AArch64::LDRQroW;
4176 case AArch64::STRQroX:
4177 case AArch64::STURQi:
4178 case AArch64::STRQui:
4179 return AArch64::STRQroW;
4180 case AArch64::LDRDroX:
4181 case AArch64::LDURDi:
4182 case AArch64::LDRDui:
4183 return AArch64::LDRDroW;
4184 case AArch64::STRDroX:
4185 case AArch64::STURDi:
4186 case AArch64::STRDui:
4187 return AArch64::STRDroW;
4188 case AArch64::LDRXroX:
4189 case AArch64::LDURXi:
4190 case AArch64::LDRXui:
4191 return AArch64::LDRXroW;
4192 case AArch64::STRXroX:
4193 case AArch64::STURXi:
4194 case AArch64::STRXui:
4195 return AArch64::STRXroW;
4196 case AArch64::LDRWroX:
4197 case AArch64::LDURWi:
4198 case AArch64::LDRWui:
4199 return AArch64::LDRWroW;
4200 case AArch64::LDRSWroX:
4201 case AArch64::LDURSWi:
4202 case AArch64::LDRSWui:
4203 return AArch64::LDRSWroW;
4204 case AArch64::STRWroX:
4205 case AArch64::STURWi:
4206 case AArch64::STRWui:
4207 return AArch64::STRWroW;
4208 case AArch64::LDRHroX:
4209 case AArch64::LDURHi:
4210 case AArch64::LDRHui:
4211 return AArch64::LDRHroW;
4212 case AArch64::STRHroX:
4213 case AArch64::STURHi:
4214 case AArch64::STRHui:
4215 return AArch64::STRHroW;
4216 case AArch64::LDRHHroX:
4217 case AArch64::LDURHHi:
4218 case AArch64::LDRHHui:
4219 return AArch64::LDRHHroW;
4220 case AArch64::STRHHroX:
4221 case AArch64::STURHHi:
4222 case AArch64::STRHHui:
4223 return AArch64::STRHHroW;
4224 case AArch64::LDRSHXroX:
4225 case AArch64::LDURSHXi:
4226 case AArch64::LDRSHXui:
4227 return AArch64::LDRSHXroW;
4228 case AArch64::LDRSHWroX:
4229 case AArch64::LDURSHWi:
4230 case AArch64::LDRSHWui:
4231 return AArch64::LDRSHWroW;
4232 case AArch64::LDRBroX:
4233 case AArch64::LDURBi:
4234 case AArch64::LDRBui:
4235 return AArch64::LDRBroW;
4236 case AArch64::LDRBBroX:
4237 case AArch64::LDURBBi:
4238 case AArch64::LDRBBui:
4239 return AArch64::LDRBBroW;
4240 case AArch64::LDRSBXroX:
4241 case AArch64::LDURSBXi:
4242 case AArch64::LDRSBXui:
4243 return AArch64::LDRSBXroW;
4244 case AArch64::LDRSBWroX:
4245 case AArch64::LDURSBWi:
4246 case AArch64::LDRSBWui:
4247 return AArch64::LDRSBWroW;
4248 case AArch64::STRBroX:
4249 case AArch64::STURBi:
4250 case AArch64::STRBui:
4251 return AArch64::STRBroW;
4252 case AArch64::STRBBroX:
4253 case AArch64::STURBBi:
4254 case AArch64::STRBBui:
4255 return AArch64::STRBBroW;
4280 return B.getInstr();
4284 "Addressing mode not supported for folding");
4301 return B.getInstr();
4308 "Address offset can be a register or an immediate, but not both");
4329 return B.getInstr();
4333 "Function must not be called with an addressing mode it can't handle");
4342 case AArch64::LD1Fourv16b_POST:
4343 case AArch64::LD1Fourv1d_POST:
4344 case AArch64::LD1Fourv2d_POST:
4345 case AArch64::LD1Fourv2s_POST:
4346 case AArch64::LD1Fourv4h_POST:
4347 case AArch64::LD1Fourv4s_POST:
4348 case AArch64::LD1Fourv8b_POST:
4349 case AArch64::LD1Fourv8h_POST:
4350 case AArch64::LD1Onev16b_POST:
4351 case AArch64::LD1Onev1d_POST:
4352 case AArch64::LD1Onev2d_POST:
4353 case AArch64::LD1Onev2s_POST:
4354 case AArch64::LD1Onev4h_POST:
4355 case AArch64::LD1Onev4s_POST:
4356 case AArch64::LD1Onev8b_POST:
4357 case AArch64::LD1Onev8h_POST:
4358 case AArch64::LD1Rv16b_POST:
4359 case AArch64::LD1Rv1d_POST:
4360 case AArch64::LD1Rv2d_POST:
4361 case AArch64::LD1Rv2s_POST:
4362 case AArch64::LD1Rv4h_POST:
4363 case AArch64::LD1Rv4s_POST:
4364 case AArch64::LD1Rv8b_POST:
4365 case AArch64::LD1Rv8h_POST:
4366 case AArch64::LD1Threev16b_POST:
4367 case AArch64::LD1Threev1d_POST:
4368 case AArch64::LD1Threev2d_POST:
4369 case AArch64::LD1Threev2s_POST:
4370 case AArch64::LD1Threev4h_POST:
4371 case AArch64::LD1Threev4s_POST:
4372 case AArch64::LD1Threev8b_POST:
4373 case AArch64::LD1Threev8h_POST:
4374 case AArch64::LD1Twov16b_POST:
4375 case AArch64::LD1Twov1d_POST:
4376 case AArch64::LD1Twov2d_POST:
4377 case AArch64::LD1Twov2s_POST:
4378 case AArch64::LD1Twov4h_POST:
4379 case AArch64::LD1Twov4s_POST:
4380 case AArch64::LD1Twov8b_POST:
4381 case AArch64::LD1Twov8h_POST:
4382 case AArch64::LD1i16_POST:
4383 case AArch64::LD1i32_POST:
4384 case AArch64::LD1i64_POST:
4385 case AArch64::LD1i8_POST:
4386 case AArch64::LD2Rv16b_POST:
4387 case AArch64::LD2Rv1d_POST:
4388 case AArch64::LD2Rv2d_POST:
4389 case AArch64::LD2Rv2s_POST:
4390 case AArch64::LD2Rv4h_POST:
4391 case AArch64::LD2Rv4s_POST:
4392 case AArch64::LD2Rv8b_POST:
4393 case AArch64::LD2Rv8h_POST:
4394 case AArch64::LD2Twov16b_POST:
4395 case AArch64::LD2Twov2d_POST:
4396 case AArch64::LD2Twov2s_POST:
4397 case AArch64::LD2Twov4h_POST:
4398 case AArch64::LD2Twov4s_POST:
4399 case AArch64::LD2Twov8b_POST:
4400 case AArch64::LD2Twov8h_POST:
4401 case AArch64::LD2i16_POST:
4402 case AArch64::LD2i32_POST:
4403 case AArch64::LD2i64_POST:
4404 case AArch64::LD2i8_POST:
4405 case AArch64::LD3Rv16b_POST:
4406 case AArch64::LD3Rv1d_POST:
4407 case AArch64::LD3Rv2d_POST:
4408 case AArch64::LD3Rv2s_POST:
4409 case AArch64::LD3Rv4h_POST:
4410 case AArch64::LD3Rv4s_POST:
4411 case AArch64::LD3Rv8b_POST:
4412 case AArch64::LD3Rv8h_POST:
4413 case AArch64::LD3Threev16b_POST:
4414 case AArch64::LD3Threev2d_POST:
4415 case AArch64::LD3Threev2s_POST:
4416 case AArch64::LD3Threev4h_POST:
4417 case AArch64::LD3Threev4s_POST:
4418 case AArch64::LD3Threev8b_POST:
4419 case AArch64::LD3Threev8h_POST:
4420 case AArch64::LD3i16_POST:
4421 case AArch64::LD3i32_POST:
4422 case AArch64::LD3i64_POST:
4423 case AArch64::LD3i8_POST:
4424 case AArch64::LD4Fourv16b_POST:
4425 case AArch64::LD4Fourv2d_POST:
4426 case AArch64::LD4Fourv2s_POST:
4427 case AArch64::LD4Fourv4h_POST:
4428 case AArch64::LD4Fourv4s_POST:
4429 case AArch64::LD4Fourv8b_POST:
4430 case AArch64::LD4Fourv8h_POST:
4431 case AArch64::LD4Rv16b_POST:
4432 case AArch64::LD4Rv1d_POST:
4433 case AArch64::LD4Rv2d_POST:
4434 case AArch64::LD4Rv2s_POST:
4435 case AArch64::LD4Rv4h_POST:
4436 case AArch64::LD4Rv4s_POST:
4437 case AArch64::LD4Rv8b_POST:
4438 case AArch64::LD4Rv8h_POST:
4439 case AArch64::LD4i16_POST:
4440 case AArch64::LD4i32_POST:
4441 case AArch64::LD4i64_POST:
4442 case AArch64::LD4i8_POST:
4443 case AArch64::LDAPRWpost:
4444 case AArch64::LDAPRXpost:
4445 case AArch64::LDIAPPWpost:
4446 case AArch64::LDIAPPXpost:
4447 case AArch64::LDPDpost:
4448 case AArch64::LDPQpost:
4449 case AArch64::LDPSWpost:
4450 case AArch64::LDPSpost:
4451 case AArch64::LDPWpost:
4452 case AArch64::LDPXpost:
4453 case AArch64::LDRBBpost:
4454 case AArch64::LDRBpost:
4455 case AArch64::LDRDpost:
4456 case AArch64::LDRHHpost:
4457 case AArch64::LDRHpost:
4458 case AArch64::LDRQpost:
4459 case AArch64::LDRSBWpost:
4460 case AArch64::LDRSBXpost:
4461 case AArch64::LDRSHWpost:
4462 case AArch64::LDRSHXpost:
4463 case AArch64::LDRSWpost:
4464 case AArch64::LDRSpost:
4465 case AArch64::LDRWpost:
4466 case AArch64::LDRXpost:
4467 case AArch64::ST1Fourv16b_POST:
4468 case AArch64::ST1Fourv1d_POST:
4469 case AArch64::ST1Fourv2d_POST:
4470 case AArch64::ST1Fourv2s_POST:
4471 case AArch64::ST1Fourv4h_POST:
4472 case AArch64::ST1Fourv4s_POST:
4473 case AArch64::ST1Fourv8b_POST:
4474 case AArch64::ST1Fourv8h_POST:
4475 case AArch64::ST1Onev16b_POST:
4476 case AArch64::ST1Onev1d_POST:
4477 case AArch64::ST1Onev2d_POST:
4478 case AArch64::ST1Onev2s_POST:
4479 case AArch64::ST1Onev4h_POST:
4480 case AArch64::ST1Onev4s_POST:
4481 case AArch64::ST1Onev8b_POST:
4482 case AArch64::ST1Onev8h_POST:
4483 case AArch64::ST1Threev16b_POST:
4484 case AArch64::ST1Threev1d_POST:
4485 case AArch64::ST1Threev2d_POST:
4486 case AArch64::ST1Threev2s_POST:
4487 case AArch64::ST1Threev4h_POST:
4488 case AArch64::ST1Threev4s_POST:
4489 case AArch64::ST1Threev8b_POST:
4490 case AArch64::ST1Threev8h_POST:
4491 case AArch64::ST1Twov16b_POST:
4492 case AArch64::ST1Twov1d_POST:
4493 case AArch64::ST1Twov2d_POST:
4494 case AArch64::ST1Twov2s_POST:
4495 case AArch64::ST1Twov4h_POST:
4496 case AArch64::ST1Twov4s_POST:
4497 case AArch64::ST1Twov8b_POST:
4498 case AArch64::ST1Twov8h_POST:
4499 case AArch64::ST1i16_POST:
4500 case AArch64::ST1i32_POST:
4501 case AArch64::ST1i64_POST:
4502 case AArch64::ST1i8_POST:
4503 case AArch64::ST2GPostIndex:
4504 case AArch64::ST2Twov16b_POST:
4505 case AArch64::ST2Twov2d_POST:
4506 case AArch64::ST2Twov2s_POST:
4507 case AArch64::ST2Twov4h_POST:
4508 case AArch64::ST2Twov4s_POST:
4509 case AArch64::ST2Twov8b_POST:
4510 case AArch64::ST2Twov8h_POST:
4511 case AArch64::ST2i16_POST:
4512 case AArch64::ST2i32_POST:
4513 case AArch64::ST2i64_POST:
4514 case AArch64::ST2i8_POST:
4515 case AArch64::ST3Threev16b_POST:
4516 case AArch64::ST3Threev2d_POST:
4517 case AArch64::ST3Threev2s_POST:
4518 case AArch64::ST3Threev4h_POST:
4519 case AArch64::ST3Threev4s_POST:
4520 case AArch64::ST3Threev8b_POST:
4521 case AArch64::ST3Threev8h_POST:
4522 case AArch64::ST3i16_POST:
4523 case AArch64::ST3i32_POST:
4524 case AArch64::ST3i64_POST:
4525 case AArch64::ST3i8_POST:
4526 case AArch64::ST4Fourv16b_POST:
4527 case AArch64::ST4Fourv2d_POST:
4528 case AArch64::ST4Fourv2s_POST:
4529 case AArch64::ST4Fourv4h_POST:
4530 case AArch64::ST4Fourv4s_POST:
4531 case AArch64::ST4Fourv8b_POST:
4532 case AArch64::ST4Fourv8h_POST:
4533 case AArch64::ST4i16_POST:
4534 case AArch64::ST4i32_POST:
4535 case AArch64::ST4i64_POST:
4536 case AArch64::ST4i8_POST:
4537 case AArch64::STGPostIndex:
4538 case AArch64::STGPpost:
4539 case AArch64::STPDpost:
4540 case AArch64::STPQpost:
4541 case AArch64::STPSpost:
4542 case AArch64::STPWpost:
4543 case AArch64::STPXpost:
4544 case AArch64::STRBBpost:
4545 case AArch64::STRBpost:
4546 case AArch64::STRDpost:
4547 case AArch64::STRHHpost:
4548 case AArch64::STRHpost:
4549 case AArch64::STRQpost:
4550 case AArch64::STRSpost:
4551 case AArch64::STRWpost:
4552 case AArch64::STRXpost:
4553 case AArch64::STZ2GPostIndex:
4554 case AArch64::STZGPostIndex:
4561 bool &OffsetIsScalable,
TypeSize &Width,
4582 int64_t Dummy1, Dummy2;
4604 return BaseOp->
isReg() || BaseOp->
isFI();
4611 assert(OfsOp.
isImm() &&
"Offset operand wasn't immediate.");
4616 TypeSize &Width, int64_t &MinOffset,
4617 int64_t &MaxOffset) {
4622 MinOffset = MaxOffset = 0;
4625 case AArch64::LDRQui:
4626 case AArch64::STRQui:
4631 case AArch64::LDRXui:
4632 case AArch64::LDRDui:
4633 case AArch64::STRXui:
4634 case AArch64::STRDui:
4635 case AArch64::PRFMui:
4640 case AArch64::LDRWui:
4641 case AArch64::LDRSui:
4642 case AArch64::LDRSWui:
4643 case AArch64::STRWui:
4644 case AArch64::STRSui:
4649 case AArch64::LDRHui:
4650 case AArch64::LDRHHui:
4651 case AArch64::LDRSHWui:
4652 case AArch64::LDRSHXui:
4653 case AArch64::STRHui:
4654 case AArch64::STRHHui:
4659 case AArch64::LDRBui:
4660 case AArch64::LDRBBui:
4661 case AArch64::LDRSBWui:
4662 case AArch64::LDRSBXui:
4663 case AArch64::STRBui:
4664 case AArch64::STRBBui:
4670 case AArch64::STRQpre:
4671 case AArch64::LDRQpost:
4677 case AArch64::LDRDpost:
4678 case AArch64::LDRDpre:
4679 case AArch64::LDRXpost:
4680 case AArch64::LDRXpre:
4681 case AArch64::STRDpost:
4682 case AArch64::STRDpre:
4683 case AArch64::STRXpost:
4684 case AArch64::STRXpre:
4690 case AArch64::STRWpost:
4691 case AArch64::STRWpre:
4692 case AArch64::LDRWpost:
4693 case AArch64::LDRWpre:
4694 case AArch64::STRSpost:
4695 case AArch64::STRSpre:
4696 case AArch64::LDRSpost:
4697 case AArch64::LDRSpre:
4703 case AArch64::LDRHpost:
4704 case AArch64::LDRHpre:
4705 case AArch64::STRHpost:
4706 case AArch64::STRHpre:
4707 case AArch64::LDRHHpost:
4708 case AArch64::LDRHHpre:
4709 case AArch64::STRHHpost:
4710 case AArch64::STRHHpre:
4716 case AArch64::LDRBpost:
4717 case AArch64::LDRBpre:
4718 case AArch64::STRBpost:
4719 case AArch64::STRBpre:
4720 case AArch64::LDRBBpost:
4721 case AArch64::LDRBBpre:
4722 case AArch64::STRBBpost:
4723 case AArch64::STRBBpre:
4729 case AArch64::LDURQi:
4730 case AArch64::STURQi:
4736 case AArch64::LDURXi:
4737 case AArch64::LDURDi:
4738 case AArch64::LDAPURXi:
4739 case AArch64::STURXi:
4740 case AArch64::STURDi:
4741 case AArch64::STLURXi:
4742 case AArch64::PRFUMi:
4748 case AArch64::LDURWi:
4749 case AArch64::LDURSi:
4750 case AArch64::LDURSWi:
4751 case AArch64::LDAPURi:
4752 case AArch64::LDAPURSWi:
4753 case AArch64::STURWi:
4754 case AArch64::STURSi:
4755 case AArch64::STLURWi:
4761 case AArch64::LDURHi:
4762 case AArch64::LDURHHi:
4763 case AArch64::LDURSHXi:
4764 case AArch64::LDURSHWi:
4765 case AArch64::LDAPURHi:
4766 case AArch64::LDAPURSHWi:
4767 case AArch64::LDAPURSHXi:
4768 case AArch64::STURHi:
4769 case AArch64::STURHHi:
4770 case AArch64::STLURHi:
4776 case AArch64::LDURBi:
4777 case AArch64::LDURBBi:
4778 case AArch64::LDURSBXi:
4779 case AArch64::LDURSBWi:
4780 case AArch64::LDAPURBi:
4781 case AArch64::LDAPURSBWi:
4782 case AArch64::LDAPURSBXi:
4783 case AArch64::STURBi:
4784 case AArch64::STURBBi:
4785 case AArch64::STLURBi:
4791 case AArch64::LDPQi:
4792 case AArch64::LDNPQi:
4793 case AArch64::STPQi:
4794 case AArch64::STNPQi:
4795 case AArch64::LDPQpost:
4796 case AArch64::LDPQpre:
4797 case AArch64::STPQpost:
4798 case AArch64::STPQpre:
4804 case AArch64::LDPXi:
4805 case AArch64::LDPDi:
4806 case AArch64::LDNPXi:
4807 case AArch64::LDNPDi:
4808 case AArch64::STPXi:
4809 case AArch64::STPDi:
4810 case AArch64::STNPXi:
4811 case AArch64::STNPDi:
4812 case AArch64::LDPDpost:
4813 case AArch64::LDPDpre:
4814 case AArch64::LDPXpost:
4815 case AArch64::LDPXpre:
4816 case AArch64::STPDpost:
4817 case AArch64::STPDpre:
4818 case AArch64::STPXpost:
4819 case AArch64::STPXpre:
4825 case AArch64::LDPWi:
4826 case AArch64::LDPSi:
4827 case AArch64::LDNPWi:
4828 case AArch64::LDNPSi:
4829 case AArch64::STPWi:
4830 case AArch64::STPSi:
4831 case AArch64::STNPWi:
4832 case AArch64::STNPSi:
4833 case AArch64::LDPSpost:
4834 case AArch64::LDPSpre:
4835 case AArch64::LDPWpost:
4836 case AArch64::LDPWpre:
4837 case AArch64::STPSpost:
4838 case AArch64::STPSpre:
4839 case AArch64::STPWpost:
4840 case AArch64::STPWpre:
4846 case AArch64::StoreSwiftAsyncContext:
4859 case AArch64::TAGPstack:
4869 case AArch64::STGPreIndex:
4870 case AArch64::STGPostIndex:
4871 case AArch64::STZGi:
4872 case AArch64::STZGPreIndex:
4873 case AArch64::STZGPostIndex:
4879 case AArch64::STR_ZZZZXI:
4880 case AArch64::STR_ZZZZXI_STRIDED_CONTIGUOUS:
4881 case AArch64::LDR_ZZZZXI:
4882 case AArch64::LDR_ZZZZXI_STRIDED_CONTIGUOUS:
4888 case AArch64::STR_ZZZXI:
4889 case AArch64::LDR_ZZZXI:
4895 case AArch64::STR_ZZXI:
4896 case AArch64::STR_ZZXI_STRIDED_CONTIGUOUS:
4897 case AArch64::LDR_ZZXI:
4898 case AArch64::LDR_ZZXI_STRIDED_CONTIGUOUS:
4904 case AArch64::LDR_PXI:
4905 case AArch64::STR_PXI:
4910 case AArch64::LDR_PPXI:
4911 case AArch64::STR_PPXI:
4917 case AArch64::LDR_ZXI:
4918 case AArch64::STR_ZXI:
4923 case AArch64::LD1B_IMM:
4924 case AArch64::LD1H_IMM:
4925 case AArch64::LD1W_IMM:
4926 case AArch64::LD1D_IMM:
4927 case AArch64::LDNT1B_ZRI:
4928 case AArch64::LDNT1H_ZRI:
4929 case AArch64::LDNT1W_ZRI:
4930 case AArch64::LDNT1D_ZRI:
4931 case AArch64::ST1B_IMM:
4932 case AArch64::ST1H_IMM:
4933 case AArch64::ST1W_IMM:
4934 case AArch64::ST1D_IMM:
4935 case AArch64::STNT1B_ZRI:
4936 case AArch64::STNT1H_ZRI:
4937 case AArch64::STNT1W_ZRI:
4938 case AArch64::STNT1D_ZRI:
4939 case AArch64::LDNF1B_IMM:
4940 case AArch64::LDNF1H_IMM:
4941 case AArch64::LDNF1W_IMM:
4942 case AArch64::LDNF1D_IMM:
4949 case AArch64::LD2B_IMM:
4950 case AArch64::LD2H_IMM:
4951 case AArch64::LD2W_IMM:
4952 case AArch64::LD2D_IMM:
4953 case AArch64::ST2B_IMM:
4954 case AArch64::ST2H_IMM:
4955 case AArch64::ST2W_IMM:
4956 case AArch64::ST2D_IMM:
4957 case AArch64::LD1B_2Z_IMM:
4958 case AArch64::LD1B_2Z_STRIDED_IMM:
4959 case AArch64::LD1H_2Z_IMM:
4960 case AArch64::LD1H_2Z_STRIDED_IMM:
4961 case AArch64::LD1W_2Z_IMM:
4962 case AArch64::LD1W_2Z_STRIDED_IMM:
4963 case AArch64::LD1D_2Z_IMM:
4964 case AArch64::LD1D_2Z_STRIDED_IMM:
4965 case AArch64::LD1B_2Z_IMM_PSEUDO:
4966 case AArch64::LD1H_2Z_IMM_PSEUDO:
4967 case AArch64::LD1W_2Z_IMM_PSEUDO:
4968 case AArch64::LD1D_2Z_IMM_PSEUDO:
4969 case AArch64::ST1B_2Z_IMM:
4970 case AArch64::ST1B_2Z_STRIDED_IMM:
4971 case AArch64::ST1H_2Z_IMM:
4972 case AArch64::ST1H_2Z_STRIDED_IMM:
4973 case AArch64::ST1W_2Z_IMM:
4974 case AArch64::ST1W_2Z_STRIDED_IMM:
4975 case AArch64::ST1D_2Z_IMM:
4976 case AArch64::ST1D_2Z_STRIDED_IMM:
4977 case AArch64::LDNT1B_2Z_IMM_PSEUDO:
4978 case AArch64::LDNT1B_2Z_IMM:
4979 case AArch64::LDNT1B_2Z_STRIDED_IMM:
4980 case AArch64::LDNT1H_2Z_IMM_PSEUDO:
4981 case AArch64::LDNT1H_2Z_IMM:
4982 case AArch64::LDNT1H_2Z_STRIDED_IMM:
4983 case AArch64::LDNT1W_2Z_IMM_PSEUDO:
4984 case AArch64::LDNT1W_2Z_IMM:
4985 case AArch64::LDNT1W_2Z_STRIDED_IMM:
4986 case AArch64::LDNT1D_2Z_IMM_PSEUDO:
4987 case AArch64::LDNT1D_2Z_IMM:
4988 case AArch64::LDNT1D_2Z_STRIDED_IMM:
4989 case AArch64::STNT1B_2Z_IMM:
4990 case AArch64::STNT1B_2Z_STRIDED_IMM:
4991 case AArch64::STNT1H_2Z_IMM:
4992 case AArch64::STNT1H_2Z_STRIDED_IMM:
4993 case AArch64::STNT1W_2Z_IMM:
4994 case AArch64::STNT1W_2Z_STRIDED_IMM:
4995 case AArch64::STNT1D_2Z_IMM:
4996 case AArch64::STNT1D_2Z_STRIDED_IMM:
5001 case AArch64::LD3B_IMM:
5002 case AArch64::LD3H_IMM:
5003 case AArch64::LD3W_IMM:
5004 case AArch64::LD3D_IMM:
5005 case AArch64::ST3B_IMM:
5006 case AArch64::ST3H_IMM:
5007 case AArch64::ST3W_IMM:
5008 case AArch64::ST3D_IMM:
5013 case AArch64::LD4B_IMM:
5014 case AArch64::LD4H_IMM:
5015 case AArch64::LD4W_IMM:
5016 case AArch64::LD4D_IMM:
5017 case AArch64::ST4B_IMM:
5018 case AArch64::ST4H_IMM:
5019 case AArch64::ST4W_IMM:
5020 case AArch64::ST4D_IMM:
5021 case AArch64::LD1B_4Z_IMM:
5022 case AArch64::LD1B_4Z_STRIDED_IMM:
5023 case AArch64::LD1H_4Z_IMM:
5024 case AArch64::LD1H_4Z_STRIDED_IMM:
5025 case AArch64::LD1W_4Z_IMM:
5026 case AArch64::LD1W_4Z_STRIDED_IMM:
5027 case AArch64::LD1D_4Z_IMM:
5028 case AArch64::LD1D_4Z_STRIDED_IMM:
5029 case AArch64::LD1B_4Z_IMM_PSEUDO:
5030 case AArch64::LD1H_4Z_IMM_PSEUDO:
5031 case AArch64::LD1W_4Z_IMM_PSEUDO:
5032 case AArch64::LD1D_4Z_IMM_PSEUDO:
5033 case AArch64::ST1B_4Z_IMM:
5034 case AArch64::ST1B_4Z_STRIDED_IMM:
5035 case AArch64::ST1H_4Z_IMM:
5036 case AArch64::ST1H_4Z_STRIDED_IMM:
5037 case AArch64::ST1W_4Z_IMM:
5038 case AArch64::ST1W_4Z_STRIDED_IMM:
5039 case AArch64::ST1D_4Z_IMM:
5040 case AArch64::ST1D_4Z_STRIDED_IMM:
5041 case AArch64::LDNT1B_4Z_IMM_PSEUDO:
5042 case AArch64::LDNT1B_4Z_IMM:
5043 case AArch64::LDNT1B_4Z_STRIDED_IMM:
5044 case AArch64::LDNT1H_4Z_IMM_PSEUDO:
5045 case AArch64::LDNT1H_4Z_IMM:
5046 case AArch64::LDNT1H_4Z_STRIDED_IMM:
5047 case AArch64::LDNT1W_4Z_IMM_PSEUDO:
5048 case AArch64::LDNT1W_4Z_IMM:
5049 case AArch64::LDNT1W_4Z_STRIDED_IMM:
5050 case AArch64::LDNT1D_4Z_IMM_PSEUDO:
5051 case AArch64::LDNT1D_4Z_IMM:
5052 case AArch64::LDNT1D_4Z_STRIDED_IMM:
5053 case AArch64::STNT1B_4Z_IMM:
5054 case AArch64::STNT1B_4Z_STRIDED_IMM:
5055 case AArch64::STNT1H_4Z_IMM:
5056 case AArch64::STNT1H_4Z_STRIDED_IMM:
5057 case AArch64::STNT1W_4Z_IMM:
5058 case AArch64::STNT1W_4Z_STRIDED_IMM:
5059 case AArch64::STNT1D_4Z_IMM:
5060 case AArch64::STNT1D_4Z_STRIDED_IMM:
5065 case AArch64::LD1B_H_IMM:
5066 case AArch64::LD1SB_H_IMM:
5067 case AArch64::LD1H_S_IMM:
5068 case AArch64::LD1SH_S_IMM:
5069 case AArch64::LD1W_D_IMM:
5070 case AArch64::LD1SW_D_IMM:
5071 case AArch64::ST1B_H_IMM:
5072 case AArch64::ST1H_S_IMM:
5073 case AArch64::ST1W_D_IMM:
5074 case AArch64::LDNF1B_H_IMM:
5075 case AArch64::LDNF1SB_H_IMM:
5076 case AArch64::LDNF1H_S_IMM:
5077 case AArch64::LDNF1SH_S_IMM:
5078 case AArch64::LDNF1W_D_IMM:
5079 case AArch64::LDNF1SW_D_IMM:
5086 case AArch64::LD1B_S_IMM:
5087 case AArch64::LD1SB_S_IMM:
5088 case AArch64::LD1H_D_IMM:
5089 case AArch64::LD1SH_D_IMM:
5090 case AArch64::ST1B_S_IMM:
5091 case AArch64::ST1H_D_IMM:
5092 case AArch64::LDNF1B_S_IMM:
5093 case AArch64::LDNF1SB_S_IMM:
5094 case AArch64::LDNF1H_D_IMM:
5095 case AArch64::LDNF1SH_D_IMM:
5102 case AArch64::LD1B_D_IMM:
5103 case AArch64::LD1SB_D_IMM:
5104 case AArch64::ST1B_D_IMM:
5105 case AArch64::LDNF1B_D_IMM:
5106 case AArch64::LDNF1SB_D_IMM:
5113 case AArch64::ST2Gi:
5114 case AArch64::ST2GPreIndex:
5115 case AArch64::ST2GPostIndex:
5116 case AArch64::STZ2Gi:
5117 case AArch64::STZ2GPreIndex:
5118 case AArch64::STZ2GPostIndex:
5124 case AArch64::STGPi:
5125 case AArch64::STGPpost:
5126 case AArch64::STGPpre:
5131 case AArch64::LD1RB_IMM:
5132 case AArch64::LD1RB_H_IMM:
5133 case AArch64::LD1RB_S_IMM:
5134 case AArch64::LD1RB_D_IMM:
5135 case AArch64::LD1RSB_H_IMM:
5136 case AArch64::LD1RSB_S_IMM:
5137 case AArch64::LD1RSB_D_IMM:
5142 case AArch64::LD1RH_IMM:
5143 case AArch64::LD1RH_S_IMM:
5144 case AArch64::LD1RH_D_IMM:
5145 case AArch64::LD1RSH_S_IMM:
5146 case AArch64::LD1RSH_D_IMM:
5151 case AArch64::LD1RW_IMM:
5152 case AArch64::LD1RW_D_IMM:
5153 case AArch64::LD1RSW_IMM:
5158 case AArch64::LD1RD_IMM:
5173 case AArch64::LDRBui:
5174 case AArch64::LDRBBui:
5175 case AArch64::LDURBBi:
5176 case AArch64::LDRSBWui:
5177 case AArch64::LDURSBWi:
5178 case AArch64::STRBui:
5179 case AArch64::STRBBui:
5180 case AArch64::STURBBi:
5182 case AArch64::LDRHui:
5183 case AArch64::LDRHHui:
5184 case AArch64::LDURHHi:
5185 case AArch64::LDRSHWui:
5186 case AArch64::LDURSHWi:
5187 case AArch64::STRHui:
5188 case AArch64::STRHHui:
5189 case AArch64::STURHHi:
5191 case AArch64::LDRSui:
5192 case AArch64::LDURSi:
5193 case AArch64::LDRSpre:
5194 case AArch64::LDRSWui:
5195 case AArch64::LDURSWi:
5196 case AArch64::LDRSWpre:
5197 case AArch64::LDRWpre:
5198 case AArch64::LDRWui:
5199 case AArch64::LDURWi:
5200 case AArch64::STRSui:
5201 case AArch64::STURSi:
5202 case AArch64::STRSpre:
5203 case AArch64::STRWui:
5204 case AArch64::STURWi:
5205 case AArch64::STRWpre:
5206 case AArch64::LDPSi:
5207 case AArch64::LDPSWi:
5208 case AArch64::LDPWi:
5209 case AArch64::STPSi:
5210 case AArch64::STPWi:
5212 case AArch64::LDRDui:
5213 case AArch64::LDURDi:
5214 case AArch64::LDRDpre:
5215 case AArch64::LDRXui:
5216 case AArch64::LDURXi:
5217 case AArch64::LDRXpre:
5218 case AArch64::STRDui:
5219 case AArch64::STURDi:
5220 case AArch64::STRDpre:
5221 case AArch64::STRXui:
5222 case AArch64::STURXi:
5223 case AArch64::STRXpre:
5224 case AArch64::LDPDi:
5225 case AArch64::LDPXi:
5226 case AArch64::STPDi:
5227 case AArch64::STPXi:
5229 case AArch64::LDRQui:
5230 case AArch64::LDURQi:
5231 case AArch64::STRQui:
5232 case AArch64::STURQi:
5233 case AArch64::STRQpre:
5234 case AArch64::LDPQi:
5235 case AArch64::LDRQpre:
5236 case AArch64::STPQi:
5238 case AArch64::STZGi:
5239 case AArch64::ST2Gi:
5240 case AArch64::STZ2Gi:
5241 case AArch64::STGPi:
5247 switch (
MI.getOpcode()) {
5250 case AArch64::LDRWpre:
5251 case AArch64::LDRXpre:
5252 case AArch64::LDRSWpre:
5253 case AArch64::LDRSpre:
5254 case AArch64::LDRDpre:
5255 case AArch64::LDRQpre:
5261 switch (
MI.getOpcode()) {
5264 case AArch64::STRWpre:
5265 case AArch64::STRXpre:
5266 case AArch64::STRSpre:
5267 case AArch64::STRDpre:
5268 case AArch64::STRQpre:
5278 switch (
MI.getOpcode()) {
5281 case AArch64::LDURBBi:
5282 case AArch64::LDURHHi:
5283 case AArch64::LDURWi:
5284 case AArch64::LDRBBui:
5285 case AArch64::LDRHHui:
5286 case AArch64::LDRWui:
5287 case AArch64::LDRBBroX:
5288 case AArch64::LDRHHroX:
5289 case AArch64::LDRWroX:
5290 case AArch64::LDRBBroW:
5291 case AArch64::LDRHHroW:
5292 case AArch64::LDRWroW:
5298 switch (
MI.getOpcode()) {
5301 case AArch64::LDURSBWi:
5302 case AArch64::LDURSHWi:
5303 case AArch64::LDURSBXi:
5304 case AArch64::LDURSHXi:
5305 case AArch64::LDURSWi:
5306 case AArch64::LDRSBWui:
5307 case AArch64::LDRSHWui:
5308 case AArch64::LDRSBXui:
5309 case AArch64::LDRSHXui:
5310 case AArch64::LDRSWui:
5311 case AArch64::LDRSBWroX:
5312 case AArch64::LDRSHWroX:
5313 case AArch64::LDRSBXroX:
5314 case AArch64::LDRSHXroX:
5315 case AArch64::LDRSWroX:
5316 case AArch64::LDRSBWroW:
5317 case AArch64::LDRSHWroW:
5318 case AArch64::LDRSBXroW:
5319 case AArch64::LDRSHXroW:
5320 case AArch64::LDRSWroW:
5326 switch (
MI.getOpcode()) {
5329 case AArch64::LDPSi:
5330 case AArch64::LDPSWi:
5331 case AArch64::LDPDi:
5332 case AArch64::LDPQi:
5333 case AArch64::LDPWi:
5334 case AArch64::LDPXi:
5335 case AArch64::STPSi:
5336 case AArch64::STPDi:
5337 case AArch64::STPQi:
5338 case AArch64::STPWi:
5339 case AArch64::STPXi:
5340 case AArch64::STGPi:
5346 assert(
MI.mayLoadOrStore() &&
"Load or store instruction expected");
5350 return MI.getOperand(Idx);
5355 assert(
MI.mayLoadOrStore() &&
"Load or store instruction expected");
5359 return MI.getOperand(Idx);
5364 switch (
MI.getOpcode()) {
5367 case AArch64::LDRBroX:
5368 case AArch64::LDRBBroX:
5369 case AArch64::LDRSBXroX:
5370 case AArch64::LDRSBWroX:
5371 case AArch64::LDRHroX:
5372 case AArch64::LDRHHroX:
5373 case AArch64::LDRSHXroX:
5374 case AArch64::LDRSHWroX:
5375 case AArch64::LDRWroX:
5376 case AArch64::LDRSroX:
5377 case AArch64::LDRSWroX:
5378 case AArch64::LDRDroX:
5379 case AArch64::LDRXroX:
5380 case AArch64::LDRQroX:
5381 return MI.getOperand(4);
5387 if (
MI.getParent() ==
nullptr)
5397 auto Reg =
Op.getReg();
5398 if (Reg.isPhysical())
5399 return AArch64::FPR16RegClass.contains(Reg);
5401 return TRC == &AArch64::FPR16RegClass ||
5402 TRC == &AArch64::FPR16_loRegClass;
5411 auto Reg =
Op.getReg();
5412 if (Reg.isPhysical())
5413 return AArch64::FPR128RegClass.contains(Reg);
5415 return TRC == &AArch64::FPR128RegClass ||
5416 TRC == &AArch64::FPR128_loRegClass;
5422 switch (
MI.getOpcode()) {
5425 case AArch64::PACIASP:
5426 case AArch64::PACIBSP:
5429 case AArch64::PAUTH_PROLOGUE:
5432 case AArch64::HINT: {
5433 unsigned Imm =
MI.getOperand(0).getImm();
5435 if (Imm == 32 || Imm == 34 || Imm == 36 || Imm == 38)
5438 if (Imm == 25 || Imm == 27)
5450 assert(Reg.isPhysical() &&
"Expected physical register in isFpOrNEON");
5451 return AArch64::FPR128RegClass.contains(Reg) ||
5452 AArch64::FPR64RegClass.contains(Reg) ||
5453 AArch64::FPR32RegClass.contains(Reg) ||
5454 AArch64::FPR16RegClass.contains(Reg) ||
5455 AArch64::FPR8RegClass.contains(Reg);
5462 auto Reg =
Op.getReg();
5463 if (Reg.isPhysical())
5467 return TRC == &AArch64::FPR128RegClass ||
5468 TRC == &AArch64::FPR128_loRegClass ||
5469 TRC == &AArch64::FPR64RegClass ||
5470 TRC == &AArch64::FPR64_loRegClass ||
5471 TRC == &AArch64::FPR32RegClass || TRC == &AArch64::FPR16RegClass ||
5472 TRC == &AArch64::FPR8RegClass;
5494 if (FirstOpc == SecondOpc)
5500 case AArch64::STRSui:
5501 case AArch64::STURSi:
5502 return SecondOpc == AArch64::STRSui || SecondOpc == AArch64::STURSi;
5503 case AArch64::STRDui:
5504 case AArch64::STURDi:
5505 return SecondOpc == AArch64::STRDui || SecondOpc == AArch64::STURDi;
5506 case AArch64::STRQui:
5507 case AArch64::STURQi:
5508 return SecondOpc == AArch64::STRQui || SecondOpc == AArch64::STURQi;
5509 case AArch64::STRWui:
5510 case AArch64::STURWi:
5511 return SecondOpc == AArch64::STRWui || SecondOpc == AArch64::STURWi;
5512 case AArch64::STRXui:
5513 case AArch64::STURXi:
5514 return SecondOpc == AArch64::STRXui || SecondOpc == AArch64::STURXi;
5515 case AArch64::LDRSui:
5516 case AArch64::LDURSi:
5517 return SecondOpc == AArch64::LDRSui || SecondOpc == AArch64::LDURSi;
5518 case AArch64::LDRDui:
5519 case AArch64::LDURDi:
5520 return SecondOpc == AArch64::LDRDui || SecondOpc == AArch64::LDURDi;
5521 case AArch64::LDRQui:
5522 case AArch64::LDURQi:
5523 return SecondOpc == AArch64::LDRQui || SecondOpc == AArch64::LDURQi;
5524 case AArch64::LDRWui:
5525 case AArch64::LDURWi:
5526 return SecondOpc == AArch64::LDRSWui || SecondOpc == AArch64::LDURSWi;
5527 case AArch64::LDRSWui:
5528 case AArch64::LDURSWi:
5529 return SecondOpc == AArch64::LDRWui || SecondOpc == AArch64::LDURWi;
5530 case AArch64::LDRXui:
5531 case AArch64::LDURXi:
5532 return SecondOpc == AArch64::LDRXui || SecondOpc == AArch64::LDURXi;
5539 int64_t Offset1,
unsigned Opcode1,
int FI2,
5540 int64_t Offset2,
unsigned Opcode2) {
5546 assert(ObjectOffset1 <= ObjectOffset2 &&
"Object offsets are not ordered.");
5549 if (ObjectOffset1 % Scale1 != 0)
5551 ObjectOffset1 /= Scale1;
5553 if (ObjectOffset2 % Scale2 != 0)
5555 ObjectOffset2 /= Scale2;
5556 ObjectOffset1 += Offset1;
5557 ObjectOffset2 += Offset2;
5558 return ObjectOffset1 + 1 == ObjectOffset2;
5570 int64_t OpOffset2,
bool OffsetIsScalable2,
unsigned ClusterSize,
5571 unsigned NumBytes)
const {
5581 "Only base registers and frame indices are supported.");
5588 if (ClusterSize > 2)
5595 unsigned FirstOpc = FirstLdSt.
getOpcode();
5596 unsigned SecondOpc = SecondLdSt.
getOpcode();
5616 if (Offset1 > 63 || Offset1 < -64)
5621 if (BaseOp1.
isFI()) {
5623 "Caller should have ordered offsets.");
5628 BaseOp2.
getIndex(), Offset2, SecondOpc);
5631 assert(Offset1 <= Offset2 &&
"Caller should have ordered offsets.");
5633 return Offset1 + 1 == Offset2;
5643 if (
Reg.isPhysical())
5652 return ((DestReg - SrcReg) & 0x1f) < NumRegs;
5661 assert(Subtarget.hasNEON() &&
"Unexpected register copy without NEON");
5663 uint16_t DestEncoding =
TRI->getEncodingValue(DestReg);
5664 uint16_t SrcEncoding =
TRI->getEncodingValue(SrcReg);
5665 unsigned NumRegs = Indices.
size();
5667 int SubReg = 0, End = NumRegs, Incr = 1;
5669 SubReg = NumRegs - 1;
5674 for (; SubReg != End; SubReg += Incr) {
5686 unsigned Opcode,
unsigned ZeroReg,
5689 unsigned NumRegs = Indices.
size();
5692 uint16_t DestEncoding =
TRI->getEncodingValue(DestReg);
5693 uint16_t SrcEncoding =
TRI->getEncodingValue(SrcReg);
5694 assert(DestEncoding % NumRegs == 0 && SrcEncoding % NumRegs == 0 &&
5695 "GPR reg sequences should not be able to overlap");
5698 for (
unsigned SubReg = 0; SubReg != NumRegs; ++SubReg) {
5719 unsigned Opc =
MI.getOpcode();
5720 if (
Opc == AArch64::MSRpstatesvcrImm1 ||
Opc == AArch64::MSRpstatePseudo) {
5722 int64_t PState =
MI.getOperand(0).getImm();
5723 if (PState == AArch64SVCR::SVCRSM || PState == AArch64SVCR::SVCRSMZA) {
5725 return MI.getOperand(1).getImm() == 1;
5744 bool RenamableSrc)
const {
5746 if (AArch64::GPR32spRegClass.
contains(DestReg) &&
5747 AArch64::GPR32spRegClass.
contains(SrcReg)) {
5748 if (DestReg == AArch64::WSP || SrcReg == AArch64::WSP) {
5750 if (Subtarget.hasZeroCycleRegMoveGPR64() &&
5751 !Subtarget.hasZeroCycleRegMoveGPR32()) {
5753 MCRegister DestRegX = RI.getMatchingSuperReg(DestReg, AArch64::sub_32,
5754 &AArch64::GPR64spRegClass);
5755 MCRegister SrcRegX = RI.getMatchingSuperReg(SrcReg, AArch64::sub_32,
5756 &AArch64::GPR64spRegClass);
5766 ++NumZCRegMoveInstrsGPR;
5772 if (Subtarget.hasZeroCycleRegMoveGPR32())
5773 ++NumZCRegMoveInstrsGPR;
5775 }
else if (Subtarget.hasZeroCycleRegMoveGPR64() &&
5776 !Subtarget.hasZeroCycleRegMoveGPR32()) {
5778 MCRegister DestRegX = RI.getMatchingSuperReg(DestReg, AArch64::sub_32,
5779 &AArch64::GPR64spRegClass);
5780 assert(DestRegX.
isValid() &&
"Destination super-reg not valid");
5781 MCRegister SrcRegX = RI.getMatchingSuperReg(SrcReg, AArch64::sub_32,
5782 &AArch64::GPR64spRegClass);
5792 ++NumZCRegMoveInstrsGPR;
5798 if (Subtarget.hasZeroCycleRegMoveGPR32())
5799 ++NumZCRegMoveInstrsGPR;
5805 if (AArch64::GPR32spRegClass.
contains(DestReg) && SrcReg == AArch64::WZR) {
5806 if (Subtarget.hasZeroCycleZeroingGPR64() &&
5807 !Subtarget.hasZeroCycleZeroingGPR32()) {
5808 MCRegister DestRegX = RI.getMatchingSuperReg(DestReg, AArch64::sub_32,
5809 &AArch64::GPR64spRegClass);
5810 assert(DestRegX.
isValid() &&
"Destination super-reg not valid");
5814 ++NumZCZeroingInstrsGPR;
5815 }
else if (Subtarget.hasZeroCycleZeroingGPR32()) {
5819 ++NumZCZeroingInstrsGPR;
5828 if (AArch64::GPR64spRegClass.
contains(DestReg) &&
5829 AArch64::GPR64spRegClass.
contains(SrcReg)) {
5830 if (DestReg == AArch64::SP || SrcReg == AArch64::SP) {
5836 if (Subtarget.hasZeroCycleRegMoveGPR64())
5837 ++NumZCRegMoveInstrsGPR;
5843 if (Subtarget.hasZeroCycleRegMoveGPR64())
5844 ++NumZCRegMoveInstrsGPR;
5850 if (AArch64::GPR64spRegClass.
contains(DestReg) && SrcReg == AArch64::XZR) {
5851 if (Subtarget.hasZeroCycleZeroingGPR64()) {
5855 ++NumZCZeroingInstrsGPR;
5865 if (AArch64::PPRRegClass.
contains(DestReg) &&
5866 AArch64::PPRRegClass.
contains(SrcReg)) {
5867 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5868 "Unexpected SVE register.");
5878 bool DestIsPNR = AArch64::PNRRegClass.contains(DestReg);
5879 bool SrcIsPNR = AArch64::PNRRegClass.contains(SrcReg);
5880 if (DestIsPNR || SrcIsPNR) {
5882 return (R - AArch64::PN0) + AArch64::P0;
5887 if (PPRSrcReg != PPRDestReg) {
5899 if (AArch64::ZPRRegClass.
contains(DestReg) &&
5900 AArch64::ZPRRegClass.
contains(SrcReg)) {
5901 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5902 "Unexpected SVE register.");
5910 if ((AArch64::ZPR2RegClass.
contains(DestReg) ||
5911 AArch64::ZPR2StridedOrContiguousRegClass.
contains(DestReg)) &&
5912 (AArch64::ZPR2RegClass.
contains(SrcReg) ||
5913 AArch64::ZPR2StridedOrContiguousRegClass.
contains(SrcReg))) {
5914 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5915 "Unexpected SVE register.");
5916 static const unsigned Indices[] = {AArch64::zsub0, AArch64::zsub1};
5923 if (AArch64::ZPR3RegClass.
contains(DestReg) &&
5924 AArch64::ZPR3RegClass.
contains(SrcReg)) {
5925 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5926 "Unexpected SVE register.");
5927 static const unsigned Indices[] = {AArch64::zsub0, AArch64::zsub1,
5935 if ((AArch64::ZPR4RegClass.
contains(DestReg) ||
5936 AArch64::ZPR4StridedOrContiguousRegClass.
contains(DestReg)) &&
5937 (AArch64::ZPR4RegClass.
contains(SrcReg) ||
5938 AArch64::ZPR4StridedOrContiguousRegClass.
contains(SrcReg))) {
5939 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5940 "Unexpected SVE register.");
5941 static const unsigned Indices[] = {AArch64::zsub0, AArch64::zsub1,
5942 AArch64::zsub2, AArch64::zsub3};
5949 if (AArch64::DDDDRegClass.
contains(DestReg) &&
5950 AArch64::DDDDRegClass.
contains(SrcReg)) {
5951 static const unsigned Indices[] = {AArch64::dsub0, AArch64::dsub1,
5952 AArch64::dsub2, AArch64::dsub3};
5959 if (AArch64::DDDRegClass.
contains(DestReg) &&
5960 AArch64::DDDRegClass.
contains(SrcReg)) {
5961 static const unsigned Indices[] = {AArch64::dsub0, AArch64::dsub1,
5969 if (AArch64::DDRegClass.
contains(DestReg) &&
5970 AArch64::DDRegClass.
contains(SrcReg)) {
5971 static const unsigned Indices[] = {AArch64::dsub0, AArch64::dsub1};
5978 if (AArch64::QQQQRegClass.
contains(DestReg) &&
5979 AArch64::QQQQRegClass.
contains(SrcReg)) {
5980 static const unsigned Indices[] = {AArch64::qsub0, AArch64::qsub1,
5981 AArch64::qsub2, AArch64::qsub3};
5988 if (AArch64::QQQRegClass.
contains(DestReg) &&
5989 AArch64::QQQRegClass.
contains(SrcReg)) {
5990 static const unsigned Indices[] = {AArch64::qsub0, AArch64::qsub1,
5998 if (AArch64::QQRegClass.
contains(DestReg) &&
5999 AArch64::QQRegClass.
contains(SrcReg)) {
6000 static const unsigned Indices[] = {AArch64::qsub0, AArch64::qsub1};
6006 if (AArch64::XSeqPairsClassRegClass.
contains(DestReg) &&
6007 AArch64::XSeqPairsClassRegClass.
contains(SrcReg)) {
6008 static const unsigned Indices[] = {AArch64::sube64, AArch64::subo64};
6010 AArch64::XZR, Indices);
6014 if (AArch64::WSeqPairsClassRegClass.
contains(DestReg) &&
6015 AArch64::WSeqPairsClassRegClass.
contains(SrcReg)) {
6016 static const unsigned Indices[] = {AArch64::sube32, AArch64::subo32};
6018 AArch64::WZR, Indices);
6022 if (AArch64::FPR128RegClass.
contains(DestReg) &&
6023 AArch64::FPR128RegClass.
contains(SrcReg)) {
6027 if ((Subtarget.isSVEorStreamingSVEAvailable() &&
6028 !Subtarget.isNeonAvailable()) ||
6032 .
addReg(AArch64::Z0 + (SrcReg - AArch64::Q0))
6033 .
addReg(AArch64::Z0 + (SrcReg - AArch64::Q0));
6034 }
else if (Subtarget.isNeonAvailable()) {
6038 if (Subtarget.hasZeroCycleRegMoveFPR128())
6039 ++NumZCRegMoveInstrsFPR;
6055 if (AArch64::FPR64RegClass.
contains(DestReg) &&
6056 AArch64::FPR64RegClass.
contains(SrcReg)) {
6057 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6058 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6059 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6061 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::dsub,
6062 &AArch64::FPR128RegClass);
6063 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::dsub,
6064 &AArch64::FPR128RegClass);
6073 ++NumZCRegMoveInstrsFPR;
6077 if (Subtarget.hasZeroCycleRegMoveFPR64())
6078 ++NumZCRegMoveInstrsFPR;
6083 if (AArch64::FPR32RegClass.
contains(DestReg) &&
6084 AArch64::FPR32RegClass.
contains(SrcReg)) {
6085 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6086 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6087 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6089 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::ssub,
6090 &AArch64::FPR128RegClass);
6091 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::ssub,
6092 &AArch64::FPR128RegClass);
6101 ++NumZCRegMoveInstrsFPR;
6102 }
else if (Subtarget.hasZeroCycleRegMoveFPR64() &&
6103 !Subtarget.hasZeroCycleRegMoveFPR32()) {
6104 MCRegister DestRegD = RI.getMatchingSuperReg(DestReg, AArch64::ssub,
6105 &AArch64::FPR64RegClass);
6106 MCRegister SrcRegD = RI.getMatchingSuperReg(SrcReg, AArch64::ssub,
6107 &AArch64::FPR64RegClass);
6115 ++NumZCRegMoveInstrsFPR;
6119 if (Subtarget.hasZeroCycleRegMoveFPR32())
6120 ++NumZCRegMoveInstrsFPR;
6125 if (AArch64::FPR16RegClass.
contains(DestReg) &&
6126 AArch64::FPR16RegClass.
contains(SrcReg)) {
6127 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6128 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6129 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6131 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::hsub,
6132 &AArch64::FPR128RegClass);
6133 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::hsub,
6134 &AArch64::FPR128RegClass);
6143 }
else if (Subtarget.hasZeroCycleRegMoveFPR64() &&
6144 !Subtarget.hasZeroCycleRegMoveFPR32()) {
6145 MCRegister DestRegD = RI.getMatchingSuperReg(DestReg, AArch64::hsub,
6146 &AArch64::FPR64RegClass);
6147 MCRegister SrcRegD = RI.getMatchingSuperReg(SrcReg, AArch64::hsub,
6148 &AArch64::FPR64RegClass);
6157 DestReg = RI.getMatchingSuperReg(DestReg, AArch64::hsub,
6158 &AArch64::FPR32RegClass);
6159 SrcReg = RI.getMatchingSuperReg(SrcReg, AArch64::hsub,
6160 &AArch64::FPR32RegClass);
6167 if (AArch64::FPR8RegClass.
contains(DestReg) &&
6168 AArch64::FPR8RegClass.
contains(SrcReg)) {
6169 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6170 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6171 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6173 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::bsub,
6174 &AArch64::FPR128RegClass);
6175 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::bsub,
6176 &AArch64::FPR128RegClass);
6185 }
else if (Subtarget.hasZeroCycleRegMoveFPR64() &&
6186 !Subtarget.hasZeroCycleRegMoveFPR32()) {
6187 MCRegister DestRegD = RI.getMatchingSuperReg(DestReg, AArch64::bsub,
6188 &AArch64::FPR64RegClass);
6189 MCRegister SrcRegD = RI.getMatchingSuperReg(SrcReg, AArch64::bsub,
6190 &AArch64::FPR64RegClass);
6199 DestReg = RI.getMatchingSuperReg(DestReg, AArch64::bsub,
6200 &AArch64::FPR32RegClass);
6201 SrcReg = RI.getMatchingSuperReg(SrcReg, AArch64::bsub,
6202 &AArch64::FPR32RegClass);
6210 if (AArch64::FPR64RegClass.
contains(DestReg) &&
6211 AArch64::GPR64RegClass.
contains(SrcReg)) {
6212 if (AArch64::XZR == SrcReg) {
6220 if (AArch64::GPR64RegClass.
contains(DestReg) &&
6221 AArch64::FPR64RegClass.
contains(SrcReg)) {
6227 if (AArch64::FPR32RegClass.
contains(DestReg) &&
6228 AArch64::GPR32RegClass.
contains(SrcReg)) {
6229 if (AArch64::WZR == SrcReg) {
6237 if (AArch64::GPR32RegClass.
contains(DestReg) &&
6238 AArch64::FPR32RegClass.
contains(SrcReg)) {
6244 if (DestReg == AArch64::NZCV) {
6245 assert(AArch64::GPR64RegClass.
contains(SrcReg) &&
"Invalid NZCV copy");
6247 .
addImm(AArch64SysReg::NZCV)
6253 if (SrcReg == AArch64::NZCV) {
6254 assert(AArch64::GPR64RegClass.
contains(DestReg) &&
"Invalid NZCV copy");
6256 .
addImm(AArch64SysReg::NZCV)
6262 errs() << RI.getRegAsmName(DestReg) <<
" = COPY " << RI.getRegAsmName(SrcReg)
6273 unsigned SubIdx0,
unsigned SubIdx1,
int FI,
6278 SrcReg0 =
TRI.getSubReg(SrcReg, SubIdx0);
6280 SrcReg1 =
TRI.getSubReg(SrcReg, SubIdx1);
6293 Register SrcReg,
bool isKill,
int FI,
6308 switch (RI.getSpillSize(*RC)) {
6310 if (AArch64::FPR8RegClass.hasSubClassEq(RC))
6311 Opc = AArch64::STRBui;
6314 if (AArch64::FPR16RegClass.hasSubClassEq(RC))
6315 Opc = AArch64::STRHui;
6316 else if (AArch64::PNRRegClass.hasSubClassEq(RC) ||
6317 AArch64::PPRRegClass.hasSubClassEq(RC)) {
6318 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6319 "Unexpected register store without SVE store instructions");
6320 Opc = AArch64::STR_PXI;
6326 if (AArch64::GPR32allRegClass.hasSubClassEq(RC)) {
6327 Opc = AArch64::STRWui;
6331 assert(SrcReg != AArch64::WSP);
6332 }
else if (AArch64::FPR32RegClass.hasSubClassEq(RC))
6333 Opc = AArch64::STRSui;
6334 else if (AArch64::PPR2RegClass.hasSubClassEq(RC)) {
6335 Opc = AArch64::STR_PPXI;
6340 if (AArch64::GPR64allRegClass.hasSubClassEq(RC)) {
6341 Opc = AArch64::STRXui;
6345 assert(SrcReg != AArch64::SP);
6346 }
else if (AArch64::FPR64RegClass.hasSubClassEq(RC)) {
6347 Opc = AArch64::STRDui;
6348 }
else if (AArch64::WSeqPairsClassRegClass.hasSubClassEq(RC)) {
6350 get(AArch64::STPWi), SrcReg, isKill,
6351 AArch64::sube32, AArch64::subo32, FI, MMO);
6356 if (AArch64::FPR128RegClass.hasSubClassEq(RC))
6357 Opc = AArch64::STRQui;
6358 else if (AArch64::DDRegClass.hasSubClassEq(RC)) {
6359 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6360 Opc = AArch64::ST1Twov1d;
6362 }
else if (AArch64::XSeqPairsClassRegClass.hasSubClassEq(RC)) {
6364 get(AArch64::STPXi), SrcReg, isKill,
6365 AArch64::sube64, AArch64::subo64, FI, MMO);
6367 }
else if (AArch64::ZPRRegClass.hasSubClassEq(RC)) {
6368 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6369 "Unexpected register store without SVE store instructions");
6370 Opc = AArch64::STR_ZXI;
6375 if (AArch64::DDDRegClass.hasSubClassEq(RC)) {
6376 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6377 Opc = AArch64::ST1Threev1d;
6382 if (AArch64::DDDDRegClass.hasSubClassEq(RC)) {
6383 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6384 Opc = AArch64::ST1Fourv1d;
6386 }
else if (AArch64::QQRegClass.hasSubClassEq(RC)) {
6387 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6388 Opc = AArch64::ST1Twov2d;
6390 }
else if (AArch64::ZPR2StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6391 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6392 "Unexpected register store without SVE store instructions");
6393 Opc = AArch64::STR_ZZXI_STRIDED_CONTIGUOUS;
6395 }
else if (AArch64::ZPR2RegClass.hasSubClassEq(RC)) {
6396 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6397 "Unexpected register store without SVE store instructions");
6398 Opc = AArch64::STR_ZZXI;
6403 if (AArch64::QQQRegClass.hasSubClassEq(RC)) {
6404 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6405 Opc = AArch64::ST1Threev2d;
6407 }
else if (AArch64::ZPR3RegClass.hasSubClassEq(RC)) {
6408 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6409 "Unexpected register store without SVE store instructions");
6410 Opc = AArch64::STR_ZZZXI;
6415 if (AArch64::QQQQRegClass.hasSubClassEq(RC)) {
6416 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6417 Opc = AArch64::ST1Fourv2d;
6419 }
else if (AArch64::ZPR4StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6420 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6421 "Unexpected register store without SVE store instructions");
6422 Opc = AArch64::STR_ZZZZXI_STRIDED_CONTIGUOUS;
6424 }
else if (AArch64::ZPR4RegClass.hasSubClassEq(RC)) {
6425 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6426 "Unexpected register store without SVE store instructions");
6427 Opc = AArch64::STR_ZZZZXI;
6432 assert(
Opc &&
"Unknown register class");
6443 MI.addMemOperand(MMO);
6450 Register DestReg,
unsigned SubIdx0,
6451 unsigned SubIdx1,
int FI,
6455 bool IsUndef =
true;
6457 DestReg0 =
TRI.getSubReg(DestReg, SubIdx0);
6459 DestReg1 =
TRI.getSubReg(DestReg, SubIdx1);
6488 switch (
TRI.getSpillSize(*RC)) {
6490 if (AArch64::FPR8RegClass.hasSubClassEq(RC))
6491 Opc = AArch64::LDRBui;
6494 bool IsPNR = AArch64::PNRRegClass.hasSubClassEq(RC);
6495 if (AArch64::FPR16RegClass.hasSubClassEq(RC))
6496 Opc = AArch64::LDRHui;
6497 else if (IsPNR || AArch64::PPRRegClass.hasSubClassEq(RC)) {
6498 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6499 "Unexpected register load without SVE load instructions");
6502 Opc = AArch64::LDR_PXI;
6508 if (AArch64::GPR32allRegClass.hasSubClassEq(RC)) {
6509 Opc = AArch64::LDRWui;
6513 assert(DestReg != AArch64::WSP);
6514 }
else if (AArch64::FPR32RegClass.hasSubClassEq(RC))
6515 Opc = AArch64::LDRSui;
6516 else if (AArch64::PPR2RegClass.hasSubClassEq(RC)) {
6517 Opc = AArch64::LDR_PPXI;
6522 if (AArch64::GPR64allRegClass.hasSubClassEq(RC)) {
6523 Opc = AArch64::LDRXui;
6527 assert(DestReg != AArch64::SP);
6528 }
else if (AArch64::FPR64RegClass.hasSubClassEq(RC)) {
6529 Opc = AArch64::LDRDui;
6530 }
else if (AArch64::WSeqPairsClassRegClass.hasSubClassEq(RC)) {
6532 get(AArch64::LDPWi), DestReg, AArch64::sube32,
6533 AArch64::subo32, FI, MMO);
6538 if (AArch64::FPR128RegClass.hasSubClassEq(RC))
6539 Opc = AArch64::LDRQui;
6540 else if (AArch64::DDRegClass.hasSubClassEq(RC)) {
6541 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6542 Opc = AArch64::LD1Twov1d;
6544 }
else if (AArch64::XSeqPairsClassRegClass.hasSubClassEq(RC)) {
6546 get(AArch64::LDPXi), DestReg, AArch64::sube64,
6547 AArch64::subo64, FI, MMO);
6549 }
else if (AArch64::ZPRRegClass.hasSubClassEq(RC)) {
6550 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6551 "Unexpected register load without SVE load instructions");
6552 Opc = AArch64::LDR_ZXI;
6557 if (AArch64::DDDRegClass.hasSubClassEq(RC)) {
6558 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6559 Opc = AArch64::LD1Threev1d;
6564 if (AArch64::DDDDRegClass.hasSubClassEq(RC)) {
6565 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6566 Opc = AArch64::LD1Fourv1d;
6568 }
else if (AArch64::QQRegClass.hasSubClassEq(RC)) {
6569 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6570 Opc = AArch64::LD1Twov2d;
6572 }
else if (AArch64::ZPR2StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6573 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6574 "Unexpected register load without SVE load instructions");
6575 Opc = AArch64::LDR_ZZXI_STRIDED_CONTIGUOUS;
6577 }
else if (AArch64::ZPR2RegClass.hasSubClassEq(RC)) {
6578 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6579 "Unexpected register load without SVE load instructions");
6580 Opc = AArch64::LDR_ZZXI;
6585 if (AArch64::QQQRegClass.hasSubClassEq(RC)) {
6586 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6587 Opc = AArch64::LD1Threev2d;
6589 }
else if (AArch64::ZPR3RegClass.hasSubClassEq(RC)) {
6590 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6591 "Unexpected register load without SVE load instructions");
6592 Opc = AArch64::LDR_ZZZXI;
6597 if (AArch64::QQQQRegClass.hasSubClassEq(RC)) {
6598 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6599 Opc = AArch64::LD1Fourv2d;
6601 }
else if (AArch64::ZPR4StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6602 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6603 "Unexpected register load without SVE load instructions");
6604 Opc = AArch64::LDR_ZZZZXI_STRIDED_CONTIGUOUS;
6606 }
else if (AArch64::ZPR4RegClass.hasSubClassEq(RC)) {
6607 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6608 "Unexpected register load without SVE load instructions");
6609 Opc = AArch64::LDR_ZZZZXI;
6615 assert(
Opc &&
"Unknown register class");
6625 MI.addMemOperand(MMO);
6632 UseMI.getIterator()),
6634 return I.modifiesRegister(AArch64::NZCV, TRI) ||
6635 I.readsRegister(AArch64::NZCV, TRI);
6639void AArch64InstrInfo::decomposeStackOffsetForDwarfOffsets(
6644 assert(
Offset.getScalable() % 2 == 0 &&
"Invalid frame offset");
6651 ByteSized =
Offset.getFixed();
6652 VGSized =
Offset.getScalable() / 2;
6658void AArch64InstrInfo::decomposeStackOffsetForFrameOffsets(
6660 int64_t &NumDataVectors) {
6664 assert(
Offset.getScalable() % 2 == 0 &&
"Invalid frame offset");
6666 NumBytes =
Offset.getFixed();
6668 NumPredicateVectors =
Offset.getScalable() / 2;
6673 if (NumPredicateVectors % 8 == 0 || NumPredicateVectors < -64 ||
6674 NumPredicateVectors > 62) {
6675 NumDataVectors = NumPredicateVectors / 8;
6676 NumPredicateVectors -= NumDataVectors * 8;
6702 Expr.
push_back((
char)dwarf::DW_OP_bregx);
6710 int64_t OffsetFromDefCFA) {
6724 Comment << (NumBytes < 0 ?
" - " :
" + ") << std::abs(NumBytes);
6725 if (!RegScale.empty())
6735 int64_t NumBytes, NumVGScaledBytes;
6736 AArch64InstrInfo::decomposeStackOffsetForDwarfOffsets(
Offset, NumBytes,
6738 std::string CommentBuffer;
6741 if (
Reg == AArch64::SP)
6743 else if (
Reg == AArch64::FP)
6750 unsigned DwarfReg =
TRI.getDwarfRegNum(
Reg,
true);
6751 assert(DwarfReg <= 31 &&
"DwarfReg out of bounds (0..31)");
6753 Expr.
push_back(dwarf::DW_OP_breg0 + DwarfReg);
6756 if (NumVGScaledBytes) {
6766 DefCfaExpr.
push_back(dwarf::DW_CFA_def_cfa_expression);
6774 unsigned FrameReg,
unsigned Reg,
6776 bool LastAdjustmentWasScalable) {
6777 if (
Offset.getScalable())
6780 if (FrameReg == Reg && !LastAdjustmentWasScalable)
6783 unsigned DwarfReg =
TRI.getDwarfRegNum(Reg,
true);
6790 std::optional<int64_t> IncomingVGOffsetFromDefCFA) {
6791 int64_t NumBytes, NumVGScaledBytes;
6792 AArch64InstrInfo::decomposeStackOffsetForDwarfOffsets(
6793 OffsetFromDefCFA, NumBytes, NumVGScaledBytes);
6795 unsigned DwarfReg =
TRI.getDwarfRegNum(Reg,
true);
6798 if (!NumVGScaledBytes)
6801 std::string CommentBuffer;
6806 assert(NumVGScaledBytes &&
"Expected scalable offset");
6810 if (IncomingVGOffsetFromDefCFA) {
6812 VGRegScale =
"* IncomingVG";
6815 VGRegScale =
"* VG";
6819 OffsetExpr.
push_back(dwarf::DW_OP_plus);
6828 CfaExpr.
push_back(dwarf::DW_CFA_expression);
6843 unsigned SrcReg, int64_t
Offset,
unsigned Opc,
6846 bool *HasWinCFI,
bool EmitCFAOffset,
6849 unsigned MaxEncoding, ShiftSize;
6851 case AArch64::ADDXri:
6852 case AArch64::ADDSXri:
6853 case AArch64::SUBXri:
6854 case AArch64::SUBSXri:
6855 MaxEncoding = 0xfff;
6858 case AArch64::ADDVL_XXI:
6859 case AArch64::ADDPL_XXI:
6860 case AArch64::ADDSVL_XXI:
6861 case AArch64::ADDSPL_XXI:
6876 if (
Opc == AArch64::ADDVL_XXI ||
Opc == AArch64::ADDSVL_XXI)
6878 else if (
Opc == AArch64::ADDPL_XXI ||
Opc == AArch64::ADDSPL_XXI)
6892 const unsigned MaxEncodableValue = MaxEncoding << ShiftSize;
6894 if (TmpReg == AArch64::XZR)
6895 TmpReg =
MBB.getParent()->getRegInfo().createVirtualRegister(
6896 &AArch64::GPR64RegClass);
6898 uint64_t ThisVal = std::min<uint64_t>(
Offset, MaxEncodableValue);
6899 unsigned LocalShiftSize = 0;
6900 if (ThisVal > MaxEncoding) {
6901 ThisVal = ThisVal >> ShiftSize;
6902 LocalShiftSize = ShiftSize;
6904 assert((ThisVal >> ShiftSize) <= MaxEncoding &&
6905 "Encoding cannot handle value that big");
6907 Offset -= ThisVal << LocalShiftSize;
6912 .
addImm(Sign * (
int)ThisVal);
6922 if (Sign == -1 ||
Opc == AArch64::SUBXri ||
Opc == AArch64::SUBSXri)
6923 CFAOffset += Change;
6925 CFAOffset -= Change;
6926 if (EmitCFAOffset && DestReg == TmpReg) {
6939 int Imm = (int)(ThisVal << LocalShiftSize);
6940 if (VScale != 1 && DestReg == AArch64::SP) {
6946 }
else if ((DestReg == AArch64::FP && SrcReg == AArch64::SP) ||
6947 (SrcReg == AArch64::FP && DestReg == AArch64::SP)) {
6948 assert(VScale == 1 &&
"Expected non-scalable operation");
6957 assert(
Offset == 0 &&
"Expected remaining offset to be zero to "
6958 "emit a single SEH directive");
6959 }
else if (DestReg == AArch64::SP) {
6960 assert(VScale == 1 &&
"Expected non-scalable operation");
6963 assert(SrcReg == AArch64::SP &&
"Unexpected SrcReg for SEH_StackAlloc");
6976 unsigned DestReg,
unsigned SrcReg,
6979 bool NeedsWinCFI,
bool *HasWinCFI,
6981 unsigned FrameReg) {
6988 bool UseSVL =
F.hasFnAttribute(
"aarch64_pstate_sm_body");
6990 int64_t Bytes, NumPredicateVectors, NumDataVectors;
6991 AArch64InstrInfo::decomposeStackOffsetForFrameOffsets(
6992 Offset, Bytes, NumPredicateVectors, NumDataVectors);
6995 bool NeedsFinalDefNZCV = SetNZCV && (NumPredicateVectors || NumDataVectors);
6996 if (NeedsFinalDefNZCV)
7000 if (Bytes || (!
Offset && SrcReg != DestReg)) {
7001 assert((DestReg != AArch64::SP || Bytes % 8 == 0) &&
7002 "SP increment/decrement not 8-byte aligned");
7003 unsigned Opc = SetNZCV ? AArch64::ADDSXri : AArch64::ADDXri;
7006 Opc = SetNZCV ? AArch64::SUBSXri : AArch64::SUBXri;
7009 NeedsWinCFI, HasWinCFI, EmitCFAOffset, CFAOffset,
7011 CFAOffset += (
Opc == AArch64::ADDXri ||
Opc == AArch64::ADDSXri)
7018 assert(!(NeedsWinCFI && NumPredicateVectors) &&
7019 "WinCFI can't allocate fractions of an SVE data vector");
7021 if (NumDataVectors) {
7023 UseSVL ? AArch64::ADDSVL_XXI : AArch64::ADDVL_XXI,
TII,
7024 Flag, NeedsWinCFI, HasWinCFI, EmitCFAOffset, CFAOffset,
7030 if (NumPredicateVectors) {
7031 assert(DestReg != AArch64::SP &&
"Unaligned access to SP");
7033 UseSVL ? AArch64::ADDSPL_XXI : AArch64::ADDPL_XXI,
TII,
7034 Flag, NeedsWinCFI, HasWinCFI, EmitCFAOffset, CFAOffset,
7038 if (NeedsFinalDefNZCV)
7060 if (
MI.isFullCopy()) {
7063 if (SrcReg == AArch64::SP && DstReg.
isVirtual()) {
7067 if (DstReg == AArch64::SP && SrcReg.
isVirtual()) {
7072 if (SrcReg == AArch64::NZCV || DstReg == AArch64::NZCV)
7100 if (
MI.isCopy() &&
Ops.size() == 1 &&
7102 (
Ops[0] == 0 ||
Ops[0] == 1)) {
7103 bool IsSpill =
Ops[0] == 0;
7104 bool IsFill = !IsSpill;
7116 :
TRI.getMinimalPhysRegClass(Reg);
7122 "Mismatched register size in non subreg COPY");
7129 return &*--InsertPt;
7141 if (IsSpill && DstMO.
isUndef() && SrcReg == AArch64::WZR &&
7144 "Unexpected subreg on physical register");
7146 FrameIndex, &AArch64::GPR64RegClass,
Register());
7147 return &*--InsertPt;
7164 case AArch64::sub_32:
7165 if (AArch64::GPR64RegClass.hasSubClassEq(
getRegClass(DstReg)))
7166 FillRC = &AArch64::GPR32RegClass;
7169 FillRC = &AArch64::FPR32RegClass;
7172 FillRC = &AArch64::FPR64RegClass;
7178 TRI.getRegSizeInBits(*FillRC) &&
7179 "Mismatched regclass size on folded subreg COPY");
7198 bool *OutUseUnscaledOp,
7199 unsigned *OutUnscaledOp,
7200 int64_t *EmittableOffset) {
7202 if (EmittableOffset)
7203 *EmittableOffset = 0;
7204 if (OutUseUnscaledOp)
7205 *OutUseUnscaledOp =
false;
7211 switch (
MI.getOpcode()) {
7214 case AArch64::LD1Rv1d:
7215 case AArch64::LD1Rv2s:
7216 case AArch64::LD1Rv2d:
7217 case AArch64::LD1Rv4h:
7218 case AArch64::LD1Rv4s:
7219 case AArch64::LD1Rv8b:
7220 case AArch64::LD1Rv8h:
7221 case AArch64::LD1Rv16b:
7222 case AArch64::LD1Twov2d:
7223 case AArch64::LD1Threev2d:
7224 case AArch64::LD1Fourv2d:
7225 case AArch64::LD1Twov1d:
7226 case AArch64::LD1Threev1d:
7227 case AArch64::LD1Fourv1d:
7228 case AArch64::ST1Twov2d:
7229 case AArch64::ST1Threev2d:
7230 case AArch64::ST1Fourv2d:
7231 case AArch64::ST1Twov1d:
7232 case AArch64::ST1Threev1d:
7233 case AArch64::ST1Fourv1d:
7234 case AArch64::ST1i8:
7235 case AArch64::ST1i16:
7236 case AArch64::ST1i32:
7237 case AArch64::ST1i64:
7239 case AArch64::IRGstack:
7240 case AArch64::STGloop:
7241 case AArch64::STZGloop:
7246 TypeSize ScaleValue(0U,
false), Width(0U,
false);
7247 int64_t MinOff, MaxOff;
7253 bool IsMulVL = ScaleValue.isScalable();
7254 unsigned Scale = ScaleValue.getKnownMinValue();
7264 std::optional<unsigned> UnscaledOp =
7266 bool useUnscaledOp = UnscaledOp && (
Offset % Scale ||
Offset < 0);
7267 if (useUnscaledOp &&
7272 Scale = ScaleValue.getKnownMinValue();
7273 assert(IsMulVL == ScaleValue.isScalable() &&
7274 "Unscaled opcode has different value for scalable");
7276 int64_t Remainder =
Offset % Scale;
7277 assert(!(Remainder && useUnscaledOp) &&
7278 "Cannot have remainder when using unscaled op");
7280 assert(MinOff < MaxOff &&
"Unexpected Min/Max offsets");
7281 int64_t NewOffset =
Offset / Scale;
7282 if (MinOff <= NewOffset && NewOffset <= MaxOff)
7285 NewOffset = NewOffset < 0 ? MinOff : MaxOff;
7289 if (EmittableOffset)
7290 *EmittableOffset = NewOffset;
7291 if (OutUseUnscaledOp)
7292 *OutUseUnscaledOp = useUnscaledOp;
7293 if (OutUnscaledOp && UnscaledOp)
7294 *OutUnscaledOp = *UnscaledOp;
7307 unsigned Opcode =
MI.getOpcode();
7308 unsigned ImmIdx = FrameRegIdx + 1;
7310 if (Opcode == AArch64::ADDSXri || Opcode == AArch64::ADDXri) {
7315 MI.eraseFromParent();
7321 unsigned UnscaledOp;
7324 &UnscaledOp, &NewOffset);
7328 MI.getOperand(FrameRegIdx).ChangeToRegister(FrameReg,
false);
7330 MI.setDesc(
TII->get(UnscaledOp));
7332 MI.getOperand(ImmIdx).ChangeToImmediate(NewOffset);
7348bool AArch64InstrInfo::useMachineCombiner()
const {
return true; }
7353 case AArch64::ADDSWrr:
7354 case AArch64::ADDSWri:
7355 case AArch64::ADDSXrr:
7356 case AArch64::ADDSXri:
7357 case AArch64::SUBSWrr:
7358 case AArch64::SUBSXrr:
7360 case AArch64::SUBSWri:
7361 case AArch64::SUBSXri:
7372 case AArch64::ADDWrr:
7373 case AArch64::ADDWri:
7374 case AArch64::SUBWrr:
7375 case AArch64::ADDSWrr:
7376 case AArch64::ADDSWri:
7377 case AArch64::SUBSWrr:
7379 case AArch64::SUBWri:
7380 case AArch64::SUBSWri:
7391 case AArch64::ADDXrr:
7392 case AArch64::ADDXri:
7393 case AArch64::SUBXrr:
7394 case AArch64::ADDSXrr:
7395 case AArch64::ADDSXri:
7396 case AArch64::SUBSXrr:
7398 case AArch64::SUBXri:
7399 case AArch64::SUBSXri:
7400 case AArch64::ADDv8i8:
7401 case AArch64::ADDv16i8:
7402 case AArch64::ADDv4i16:
7403 case AArch64::ADDv8i16:
7404 case AArch64::ADDv2i32:
7405 case AArch64::ADDv4i32:
7406 case AArch64::SUBv8i8:
7407 case AArch64::SUBv16i8:
7408 case AArch64::SUBv4i16:
7409 case AArch64::SUBv8i16:
7410 case AArch64::SUBv2i32:
7411 case AArch64::SUBv4i32:
7424 case AArch64::FADDHrr:
7425 case AArch64::FADDSrr:
7426 case AArch64::FADDDrr:
7427 case AArch64::FADDv4f16:
7428 case AArch64::FADDv8f16:
7429 case AArch64::FADDv2f32:
7430 case AArch64::FADDv2f64:
7431 case AArch64::FADDv4f32:
7432 case AArch64::FSUBHrr:
7433 case AArch64::FSUBSrr:
7434 case AArch64::FSUBDrr:
7435 case AArch64::FSUBv4f16:
7436 case AArch64::FSUBv8f16:
7437 case AArch64::FSUBv2f32:
7438 case AArch64::FSUBv2f64:
7439 case AArch64::FSUBv4f32:
7458 unsigned CombineOpc,
unsigned ZeroReg = 0,
7459 bool CheckZeroReg =
false) {
7466 if (!
MI ||
MI->getParent() != &
MBB ||
MI->getOpcode() != CombineOpc)
7473 assert(
MI->getNumOperands() >= 4 &&
MI->getOperand(0).isReg() &&
7474 MI->getOperand(1).isReg() &&
MI->getOperand(2).isReg() &&
7475 MI->getOperand(3).isReg() &&
"MAdd/MSub must have a least 4 regs");
7477 if (
MI->getOperand(3).getReg() != ZeroReg)
7482 MI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
true) == -1)
7491 unsigned MulOpc,
unsigned ZeroReg) {
7506bool AArch64InstrInfo::isAssociativeAndCommutative(
const MachineInstr &Inst,
7507 bool Invert)
const {
7513 case AArch64::FADDHrr:
7514 case AArch64::FADDSrr:
7515 case AArch64::FADDDrr:
7516 case AArch64::FMULHrr:
7517 case AArch64::FMULSrr:
7518 case AArch64::FMULDrr:
7519 case AArch64::FMULX16:
7520 case AArch64::FMULX32:
7521 case AArch64::FMULX64:
7523 case AArch64::FADDv4f16:
7524 case AArch64::FADDv8f16:
7525 case AArch64::FADDv2f32:
7526 case AArch64::FADDv4f32:
7527 case AArch64::FADDv2f64:
7528 case AArch64::FMULv4f16:
7529 case AArch64::FMULv8f16:
7530 case AArch64::FMULv2f32:
7531 case AArch64::FMULv4f32:
7532 case AArch64::FMULv2f64:
7533 case AArch64::FMULXv4f16:
7534 case AArch64::FMULXv8f16:
7535 case AArch64::FMULXv2f32:
7536 case AArch64::FMULXv4f32:
7537 case AArch64::FMULXv2f64:
7541 case AArch64::FADD_ZZZ_H:
7542 case AArch64::FADD_ZZZ_S:
7543 case AArch64::FADD_ZZZ_D:
7544 case AArch64::FMUL_ZZZ_H:
7545 case AArch64::FMUL_ZZZ_S:
7546 case AArch64::FMUL_ZZZ_D:
7557 case AArch64::ADDWrr:
7558 case AArch64::ADDXrr:
7559 case AArch64::ANDWrr:
7560 case AArch64::ANDXrr:
7561 case AArch64::ORRWrr:
7562 case AArch64::ORRXrr:
7563 case AArch64::EORWrr:
7564 case AArch64::EORXrr:
7565 case AArch64::EONWrr:
7566 case AArch64::EONXrr:
7570 case AArch64::ADDv8i8:
7571 case AArch64::ADDv16i8:
7572 case AArch64::ADDv4i16:
7573 case AArch64::ADDv8i16:
7574 case AArch64::ADDv2i32:
7575 case AArch64::ADDv4i32:
7576 case AArch64::ADDv1i64:
7577 case AArch64::ADDv2i64:
7578 case AArch64::MULv8i8:
7579 case AArch64::MULv16i8:
7580 case AArch64::MULv4i16:
7581 case AArch64::MULv8i16:
7582 case AArch64::MULv2i32:
7583 case AArch64::MULv4i32:
7584 case AArch64::ANDv8i8:
7585 case AArch64::ANDv16i8:
7586 case AArch64::ORRv8i8:
7587 case AArch64::ORRv16i8:
7588 case AArch64::EORv8i8:
7589 case AArch64::EORv16i8:
7591 case AArch64::ADD_ZZZ_B:
7592 case AArch64::ADD_ZZZ_H:
7593 case AArch64::ADD_ZZZ_S:
7594 case AArch64::ADD_ZZZ_D:
7595 case AArch64::MUL_ZZZ_B:
7596 case AArch64::MUL_ZZZ_H:
7597 case AArch64::MUL_ZZZ_S:
7598 case AArch64::MUL_ZZZ_D:
7599 case AArch64::AND_ZZZ:
7600 case AArch64::ORR_ZZZ:
7601 case AArch64::EOR_ZZZ:
7632 auto setFound = [&](
int Opcode,
int Operand,
unsigned ZeroReg,
7640 auto setVFound = [&](
int Opcode,
int Operand,
unsigned Pattern) {
7652 case AArch64::ADDWrr:
7654 "ADDWrr does not have register operands");
7655 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULADDW_OP1);
7656 setFound(AArch64::MADDWrrr, 2, AArch64::WZR, MCP::MULADDW_OP2);
7658 case AArch64::ADDXrr:
7659 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULADDX_OP1);
7660 setFound(AArch64::MADDXrrr, 2, AArch64::XZR, MCP::MULADDX_OP2);
7662 case AArch64::SUBWrr:
7663 setFound(AArch64::MADDWrrr, 2, AArch64::WZR, MCP::MULSUBW_OP2);
7664 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULSUBW_OP1);
7666 case AArch64::SUBXrr:
7667 setFound(AArch64::MADDXrrr, 2, AArch64::XZR, MCP::MULSUBX_OP2);
7668 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULSUBX_OP1);
7670 case AArch64::ADDWri:
7671 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULADDWI_OP1);
7673 case AArch64::ADDXri:
7674 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULADDXI_OP1);
7676 case AArch64::SUBWri:
7677 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULSUBWI_OP1);
7679 case AArch64::SUBXri:
7680 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULSUBXI_OP1);
7682 case AArch64::ADDv8i8:
7683 setVFound(AArch64::MULv8i8, 1, MCP::MULADDv8i8_OP1);
7684 setVFound(AArch64::MULv8i8, 2, MCP::MULADDv8i8_OP2);
7686 case AArch64::ADDv16i8:
7687 setVFound(AArch64::MULv16i8, 1, MCP::MULADDv16i8_OP1);
7688 setVFound(AArch64::MULv16i8, 2, MCP::MULADDv16i8_OP2);
7690 case AArch64::ADDv4i16:
7691 setVFound(AArch64::MULv4i16, 1, MCP::MULADDv4i16_OP1);
7692 setVFound(AArch64::MULv4i16, 2, MCP::MULADDv4i16_OP2);
7693 setVFound(AArch64::MULv4i16_indexed, 1, MCP::MULADDv4i16_indexed_OP1);
7694 setVFound(AArch64::MULv4i16_indexed, 2, MCP::MULADDv4i16_indexed_OP2);
7696 case AArch64::ADDv8i16:
7697 setVFound(AArch64::MULv8i16, 1, MCP::MULADDv8i16_OP1);
7698 setVFound(AArch64::MULv8i16, 2, MCP::MULADDv8i16_OP2);
7699 setVFound(AArch64::MULv8i16_indexed, 1, MCP::MULADDv8i16_indexed_OP1);
7700 setVFound(AArch64::MULv8i16_indexed, 2, MCP::MULADDv8i16_indexed_OP2);
7702 case AArch64::ADDv2i32:
7703 setVFound(AArch64::MULv2i32, 1, MCP::MULADDv2i32_OP1);
7704 setVFound(AArch64::MULv2i32, 2, MCP::MULADDv2i32_OP2);
7705 setVFound(AArch64::MULv2i32_indexed, 1, MCP::MULADDv2i32_indexed_OP1);
7706 setVFound(AArch64::MULv2i32_indexed, 2, MCP::MULADDv2i32_indexed_OP2);
7708 case AArch64::ADDv4i32:
7709 setVFound(AArch64::MULv4i32, 1, MCP::MULADDv4i32_OP1);
7710 setVFound(AArch64::MULv4i32, 2, MCP::MULADDv4i32_OP2);
7711 setVFound(AArch64::MULv4i32_indexed, 1, MCP::MULADDv4i32_indexed_OP1);
7712 setVFound(AArch64::MULv4i32_indexed, 2, MCP::MULADDv4i32_indexed_OP2);
7714 case AArch64::SUBv8i8:
7715 setVFound(AArch64::MULv8i8, 1, MCP::MULSUBv8i8_OP1);
7716 setVFound(AArch64::MULv8i8, 2, MCP::MULSUBv8i8_OP2);
7718 case AArch64::SUBv16i8:
7719 setVFound(AArch64::MULv16i8, 1, MCP::MULSUBv16i8_OP1);
7720 setVFound(AArch64::MULv16i8, 2, MCP::MULSUBv16i8_OP2);
7722 case AArch64::SUBv4i16:
7723 setVFound(AArch64::MULv4i16, 1, MCP::MULSUBv4i16_OP1);
7724 setVFound(AArch64::MULv4i16, 2, MCP::MULSUBv4i16_OP2);
7725 setVFound(AArch64::MULv4i16_indexed, 1, MCP::MULSUBv4i16_indexed_OP1);
7726 setVFound(AArch64::MULv4i16_indexed, 2, MCP::MULSUBv4i16_indexed_OP2);
7728 case AArch64::SUBv8i16:
7729 setVFound(AArch64::MULv8i16, 1, MCP::MULSUBv8i16_OP1);
7730 setVFound(AArch64::MULv8i16, 2, MCP::MULSUBv8i16_OP2);
7731 setVFound(AArch64::MULv8i16_indexed, 1, MCP::MULSUBv8i16_indexed_OP1);
7732 setVFound(AArch64::MULv8i16_indexed, 2, MCP::MULSUBv8i16_indexed_OP2);
7734 case AArch64::SUBv2i32:
7735 setVFound(AArch64::MULv2i32, 1, MCP::MULSUBv2i32_OP1);
7736 setVFound(AArch64::MULv2i32, 2, MCP::MULSUBv2i32_OP2);
7737 setVFound(AArch64::MULv2i32_indexed, 1, MCP::MULSUBv2i32_indexed_OP1);
7738 setVFound(AArch64::MULv2i32_indexed, 2, MCP::MULSUBv2i32_indexed_OP2);
7740 case AArch64::SUBv4i32:
7741 setVFound(AArch64::MULv4i32, 1, MCP::MULSUBv4i32_OP1);
7742 setVFound(AArch64::MULv4i32, 2, MCP::MULSUBv4i32_OP2);
7743 setVFound(AArch64::MULv4i32_indexed, 1, MCP::MULSUBv4i32_indexed_OP1);
7744 setVFound(AArch64::MULv4i32_indexed, 2, MCP::MULSUBv4i32_indexed_OP2);
7750bool AArch64InstrInfo::isAccumulationOpcode(
unsigned Opcode)
const {
7754 case AArch64::UABALB_ZZZ_D:
7755 case AArch64::UABALB_ZZZ_H:
7756 case AArch64::UABALB_ZZZ_S:
7757 case AArch64::UABALT_ZZZ_D:
7758 case AArch64::UABALT_ZZZ_H:
7759 case AArch64::UABALT_ZZZ_S:
7760 case AArch64::SABALB_ZZZ_D:
7761 case AArch64::SABALB_ZZZ_S:
7762 case AArch64::SABALB_ZZZ_H:
7763 case AArch64::SABALT_ZZZ_D:
7764 case AArch64::SABALT_ZZZ_S:
7765 case AArch64::SABALT_ZZZ_H:
7766 case AArch64::UABALv16i8_v8i16:
7767 case AArch64::UABALv2i32_v2i64:
7768 case AArch64::UABALv4i16_v4i32:
7769 case AArch64::UABALv4i32_v2i64:
7770 case AArch64::UABALv8i16_v4i32:
7771 case AArch64::UABALv8i8_v8i16:
7772 case AArch64::UABAv16i8:
7773 case AArch64::UABAv2i32:
7774 case AArch64::UABAv4i16:
7775 case AArch64::UABAv4i32:
7776 case AArch64::UABAv8i16:
7777 case AArch64::UABAv8i8:
7778 case AArch64::SABALv16i8_v8i16:
7779 case AArch64::SABALv2i32_v2i64:
7780 case AArch64::SABALv4i16_v4i32:
7781 case AArch64::SABALv4i32_v2i64:
7782 case AArch64::SABALv8i16_v4i32:
7783 case AArch64::SABALv8i8_v8i16:
7784 case AArch64::SABAv16i8:
7785 case AArch64::SABAv2i32:
7786 case AArch64::SABAv4i16:
7787 case AArch64::SABAv4i32:
7788 case AArch64::SABAv8i16:
7789 case AArch64::SABAv8i8:
7796unsigned AArch64InstrInfo::getAccumulationStartOpcode(
7797 unsigned AccumulationOpcode)
const {
7798 switch (AccumulationOpcode) {
7801 case AArch64::UABALB_ZZZ_D:
7802 return AArch64::UABDLB_ZZZ_D;
7803 case AArch64::UABALB_ZZZ_H:
7804 return AArch64::UABDLB_ZZZ_H;
7805 case AArch64::UABALB_ZZZ_S:
7806 return AArch64::UABDLB_ZZZ_S;
7807 case AArch64::UABALT_ZZZ_D:
7808 return AArch64::UABDLT_ZZZ_D;
7809 case AArch64::UABALT_ZZZ_H:
7810 return AArch64::UABDLT_ZZZ_H;
7811 case AArch64::UABALT_ZZZ_S:
7812 return AArch64::UABDLT_ZZZ_S;
7813 case AArch64::UABALv16i8_v8i16:
7814 return AArch64::UABDLv16i8_v8i16;
7815 case AArch64::UABALv2i32_v2i64:
7816 return AArch64::UABDLv2i32_v2i64;
7817 case AArch64::UABALv4i16_v4i32:
7818 return AArch64::UABDLv4i16_v4i32;
7819 case AArch64::UABALv4i32_v2i64:
7820 return AArch64::UABDLv4i32_v2i64;
7821 case AArch64::UABALv8i16_v4i32:
7822 return AArch64::UABDLv8i16_v4i32;
7823 case AArch64::UABALv8i8_v8i16:
7824 return AArch64::UABDLv8i8_v8i16;
7825 case AArch64::UABAv16i8:
7826 return AArch64::UABDv16i8;
7827 case AArch64::UABAv2i32:
7828 return AArch64::UABDv2i32;
7829 case AArch64::UABAv4i16:
7830 return AArch64::UABDv4i16;
7831 case AArch64::UABAv4i32:
7832 return AArch64::UABDv4i32;
7833 case AArch64::UABAv8i16:
7834 return AArch64::UABDv8i16;
7835 case AArch64::UABAv8i8:
7836 return AArch64::UABDv8i8;
7837 case AArch64::SABALB_ZZZ_D:
7838 return AArch64::SABDLB_ZZZ_D;
7839 case AArch64::SABALB_ZZZ_S:
7840 return AArch64::SABDLB_ZZZ_S;
7841 case AArch64::SABALB_ZZZ_H:
7842 return AArch64::SABDLB_ZZZ_H;
7843 case AArch64::SABALT_ZZZ_D:
7844 return AArch64::SABDLT_ZZZ_D;
7845 case AArch64::SABALT_ZZZ_S:
7846 return AArch64::SABDLT_ZZZ_S;
7847 case AArch64::SABALT_ZZZ_H:
7848 return AArch64::SABDLT_ZZZ_H;
7849 case AArch64::SABALv16i8_v8i16:
7850 return AArch64::SABDLv16i8_v8i16;
7851 case AArch64::SABALv2i32_v2i64:
7852 return AArch64::SABDLv2i32_v2i64;
7853 case AArch64::SABALv4i16_v4i32:
7854 return AArch64::SABDLv4i16_v4i32;
7855 case AArch64::SABALv4i32_v2i64:
7856 return AArch64::SABDLv4i32_v2i64;
7857 case AArch64::SABALv8i16_v4i32:
7858 return AArch64::SABDLv8i16_v4i32;
7859 case AArch64::SABALv8i8_v8i16:
7860 return AArch64::SABDLv8i8_v8i16;
7861 case AArch64::SABAv16i8:
7862 return AArch64::SABDv16i8;
7863 case AArch64::SABAv2i32:
7864 return AArch64::SABAv2i32;
7865 case AArch64::SABAv4i16:
7866 return AArch64::SABDv4i16;
7867 case AArch64::SABAv4i32:
7868 return AArch64::SABDv4i32;
7869 case AArch64::SABAv8i16:
7870 return AArch64::SABDv8i16;
7871 case AArch64::SABAv8i8:
7872 return AArch64::SABDv8i8;
7888 auto Match = [&](
int Opcode,
int Operand,
unsigned Pattern) ->
bool {
7900 assert(
false &&
"Unsupported FP instruction in combiner\n");
7902 case AArch64::FADDHrr:
7904 "FADDHrr does not have register operands");
7906 Found = Match(AArch64::FMULHrr, 1, MCP::FMULADDH_OP1);
7907 Found |= Match(AArch64::FMULHrr, 2, MCP::FMULADDH_OP2);
7909 case AArch64::FADDSrr:
7911 "FADDSrr does not have register operands");
7913 Found |= Match(AArch64::FMULSrr, 1, MCP::FMULADDS_OP1) ||
7914 Match(AArch64::FMULv1i32_indexed, 1, MCP::FMLAv1i32_indexed_OP1);
7916 Found |= Match(AArch64::FMULSrr, 2, MCP::FMULADDS_OP2) ||
7917 Match(AArch64::FMULv1i32_indexed, 2, MCP::FMLAv1i32_indexed_OP2);
7919 case AArch64::FADDDrr:
7920 Found |= Match(AArch64::FMULDrr, 1, MCP::FMULADDD_OP1) ||
7921 Match(AArch64::FMULv1i64_indexed, 1, MCP::FMLAv1i64_indexed_OP1);
7923 Found |= Match(AArch64::FMULDrr, 2, MCP::FMULADDD_OP2) ||
7924 Match(AArch64::FMULv1i64_indexed, 2, MCP::FMLAv1i64_indexed_OP2);
7926 case AArch64::FADDv4f16:
7927 Found |= Match(AArch64::FMULv4i16_indexed, 1, MCP::FMLAv4i16_indexed_OP1) ||
7928 Match(AArch64::FMULv4f16, 1, MCP::FMLAv4f16_OP1);
7930 Found |= Match(AArch64::FMULv4i16_indexed, 2, MCP::FMLAv4i16_indexed_OP2) ||
7931 Match(AArch64::FMULv4f16, 2, MCP::FMLAv4f16_OP2);
7933 case AArch64::FADDv8f16:
7934 Found |= Match(AArch64::FMULv8i16_indexed, 1, MCP::FMLAv8i16_indexed_OP1) ||
7935 Match(AArch64::FMULv8f16, 1, MCP::FMLAv8f16_OP1);
7937 Found |= Match(AArch64::FMULv8i16_indexed, 2, MCP::FMLAv8i16_indexed_OP2) ||
7938 Match(AArch64::FMULv8f16, 2, MCP::FMLAv8f16_OP2);
7940 case AArch64::FADDv2f32:
7941 Found |= Match(AArch64::FMULv2i32_indexed, 1, MCP::FMLAv2i32_indexed_OP1) ||
7942 Match(AArch64::FMULv2f32, 1, MCP::FMLAv2f32_OP1);
7944 Found |= Match(AArch64::FMULv2i32_indexed, 2, MCP::FMLAv2i32_indexed_OP2) ||
7945 Match(AArch64::FMULv2f32, 2, MCP::FMLAv2f32_OP2);
7947 case AArch64::FADDv2f64:
7948 Found |= Match(AArch64::FMULv2i64_indexed, 1, MCP::FMLAv2i64_indexed_OP1) ||
7949 Match(AArch64::FMULv2f64, 1, MCP::FMLAv2f64_OP1);
7951 Found |= Match(AArch64::FMULv2i64_indexed, 2, MCP::FMLAv2i64_indexed_OP2) ||
7952 Match(AArch64::FMULv2f64, 2, MCP::FMLAv2f64_OP2);
7954 case AArch64::FADDv4f32:
7955 Found |= Match(AArch64::FMULv4i32_indexed, 1, MCP::FMLAv4i32_indexed_OP1) ||
7956 Match(AArch64::FMULv4f32, 1, MCP::FMLAv4f32_OP1);
7958 Found |= Match(AArch64::FMULv4i32_indexed, 2, MCP::FMLAv4i32_indexed_OP2) ||
7959 Match(AArch64::FMULv4f32, 2, MCP::FMLAv4f32_OP2);
7961 case AArch64::FSUBHrr:
7962 Found = Match(AArch64::FMULHrr, 1, MCP::FMULSUBH_OP1);
7963 Found |= Match(AArch64::FMULHrr, 2, MCP::FMULSUBH_OP2);
7964 Found |= Match(AArch64::FNMULHrr, 1, MCP::FNMULSUBH_OP1);
7966 case AArch64::FSUBSrr:
7967 Found = Match(AArch64::FMULSrr, 1, MCP::FMULSUBS_OP1);
7969 Found |= Match(AArch64::FMULSrr, 2, MCP::FMULSUBS_OP2) ||
7970 Match(AArch64::FMULv1i32_indexed, 2, MCP::FMLSv1i32_indexed_OP2);
7972 Found |= Match(AArch64::FNMULSrr, 1, MCP::FNMULSUBS_OP1);
7974 case AArch64::FSUBDrr:
7975 Found = Match(AArch64::FMULDrr, 1, MCP::FMULSUBD_OP1);
7977 Found |= Match(AArch64::FMULDrr, 2, MCP::FMULSUBD_OP2) ||
7978 Match(AArch64::FMULv1i64_indexed, 2, MCP::FMLSv1i64_indexed_OP2);
7980 Found |= Match(AArch64::FNMULDrr, 1, MCP::FNMULSUBD_OP1);
7982 case AArch64::FSUBv4f16:
7983 Found |= Match(AArch64::FMULv4i16_indexed, 2, MCP::FMLSv4i16_indexed_OP2) ||
7984 Match(AArch64::FMULv4f16, 2, MCP::FMLSv4f16_OP2);
7986 Found |= Match(AArch64::FMULv4i16_indexed, 1, MCP::FMLSv4i16_indexed_OP1) ||
7987 Match(AArch64::FMULv4f16, 1, MCP::FMLSv4f16_OP1);
7989 case AArch64::FSUBv8f16:
7990 Found |= Match(AArch64::FMULv8i16_indexed, 2, MCP::FMLSv8i16_indexed_OP2) ||
7991 Match(AArch64::FMULv8f16, 2, MCP::FMLSv8f16_OP2);
7993 Found |= Match(AArch64::FMULv8i16_indexed, 1, MCP::FMLSv8i16_indexed_OP1) ||
7994 Match(AArch64::FMULv8f16, 1, MCP::FMLSv8f16_OP1);
7996 case AArch64::FSUBv2f32:
7997 Found |= Match(AArch64::FMULv2i32_indexed, 2, MCP::FMLSv2i32_indexed_OP2) ||
7998 Match(AArch64::FMULv2f32, 2, MCP::FMLSv2f32_OP2);
8000 Found |= Match(AArch64::FMULv2i32_indexed, 1, MCP::FMLSv2i32_indexed_OP1) ||
8001 Match(AArch64::FMULv2f32, 1, MCP::FMLSv2f32_OP1);
8003 case AArch64::FSUBv2f64:
8004 Found |= Match(AArch64::FMULv2i64_indexed, 2, MCP::FMLSv2i64_indexed_OP2) ||
8005 Match(AArch64::FMULv2f64, 2, MCP::FMLSv2f64_OP2);
8007 Found |= Match(AArch64::FMULv2i64_indexed, 1, MCP::FMLSv2i64_indexed_OP1) ||
8008 Match(AArch64::FMULv2f64, 1, MCP::FMLSv2f64_OP1);
8010 case AArch64::FSUBv4f32:
8011 Found |= Match(AArch64::FMULv4i32_indexed, 2, MCP::FMLSv4i32_indexed_OP2) ||
8012 Match(AArch64::FMULv4f32, 2, MCP::FMLSv4f32_OP2);
8014 Found |= Match(AArch64::FMULv4i32_indexed, 1, MCP::FMLSv4i32_indexed_OP1) ||
8015 Match(AArch64::FMULv4f32, 1, MCP::FMLSv4f32_OP1);
8026 auto Match = [&](
unsigned Opcode,
int Operand,
unsigned Pattern) ->
bool {
8033 if (
MI &&
MI->getOpcode() == TargetOpcode::COPY &&
8034 MI->getOperand(1).getReg().isVirtual())
8036 if (
MI &&
MI->getOpcode() == Opcode) {
8048 case AArch64::FMULv2f32:
8049 Found = Match(AArch64::DUPv2i32lane, 1, MCP::FMULv2i32_indexed_OP1);
8050 Found |= Match(AArch64::DUPv2i32lane, 2, MCP::FMULv2i32_indexed_OP2);
8052 case AArch64::FMULv2f64:
8053 Found = Match(AArch64::DUPv2i64lane, 1, MCP::FMULv2i64_indexed_OP1);
8054 Found |= Match(AArch64::DUPv2i64lane, 2, MCP::FMULv2i64_indexed_OP2);
8056 case AArch64::FMULv4f16:
8057 Found = Match(AArch64::DUPv4i16lane, 1, MCP::FMULv4i16_indexed_OP1);
8058 Found |= Match(AArch64::DUPv4i16lane, 2, MCP::FMULv4i16_indexed_OP2);
8060 case AArch64::FMULv4f32:
8061 Found = Match(AArch64::DUPv4i32lane, 1, MCP::FMULv4i32_indexed_OP1);
8062 Found |= Match(AArch64::DUPv4i32lane, 2, MCP::FMULv4i32_indexed_OP2);
8064 case AArch64::FMULv8f16:
8065 Found = Match(AArch64::DUPv8i16lane, 1, MCP::FMULv8i16_indexed_OP1);
8066 Found |= Match(AArch64::DUPv8i16lane, 2, MCP::FMULv8i16_indexed_OP2);
8079 auto Match = [&](
unsigned Opcode,
unsigned Pattern) ->
bool {
8082 if (
MI !=
nullptr && (
MI->getOpcode() == Opcode) &&
8097 case AArch64::FNEGDr:
8099 case AArch64::FNEGSr:
8231 case AArch64::SUBWrr:
8232 case AArch64::SUBSWrr:
8233 case AArch64::SUBXrr:
8234 case AArch64::SUBSXrr:
8279 unsigned LoadLaneOpCode,
unsigned NumLanes) {
8302 while (!RemainingLanes.
empty() && CurrInstr &&
8303 CurrInstr->getOpcode() == LoadLaneOpCode &&
8305 CurrInstr->getNumOperands() == 4) {
8306 RemainingLanes.
erase(CurrInstr->getOperand(2).getImm());
8312 if (!RemainingLanes.
empty())
8316 if (CurrInstr->getOpcode() != TargetOpcode::SUBREG_TO_REG)
8320 auto Lane0LoadReg = CurrInstr->getOperand(1).getReg();
8321 unsigned SingleLaneSizeInBits = 128 / NumLanes;
8322 if (
TRI->getRegSizeInBits(Lane0LoadReg, MRI) != SingleLaneSizeInBits)
8338 RemainingLoadInstrs.
insert(LoadInstrs.
begin(), LoadInstrs.
end());
8341 for (; MBBItr !=
MBB->begin() && RemainingSteps > 0 &&
8342 !RemainingLoadInstrs.
empty();
8343 --MBBItr, --RemainingSteps) {
8347 RemainingLoadInstrs.
erase(&CurrInstr);
8357 if (RemainingSteps == 0 && !RemainingLoadInstrs.
empty())
8383 case AArch64::LD1i32:
8385 case AArch64::LD1i16:
8387 case AArch64::LD1i8:
8403 unsigned Pattern,
unsigned NumLanes) {
8411 for (
unsigned i = 0; i < NumLanes - 1; ++i) {
8419 return A->getOperand(2).getImm() >
B->getOperand(2).getImm();
8425 auto LoadToLaneInstrsAscending =
llvm::reverse(LoadToLaneInstrs);
8431 auto CreateLD1Instruction = [&](
MachineInstr *OriginalInstr,
8432 Register SrcRegister,
unsigned Lane,
8434 bool OffsetRegisterKillState) {
8443 InstrIdxForVirtReg.
insert(std::make_pair(NewRegister, InsInstrs.
size()));
8444 InsInstrs.
push_back(LoadIndexIntoRegister);
8450 auto CreateLDRInstruction =
8456 Opcode = AArch64::LDRSui;
8459 Opcode = AArch64::LDRHui;
8462 Opcode = AArch64::LDRBui;
8466 "Got unsupported number of lanes in machine-combiner gather pattern");
8476 auto LanesToLoadToReg0 =
8478 LoadToLaneInstrsAscending.begin() + NumLanes / 2);
8479 Register PrevReg = SubregToReg->getOperand(0).getReg();
8481 const MachineOperand &OffsetRegOperand = LoadInstr->getOperand(3);
8482 PrevReg = CreateLD1Instruction(LoadInstr, PrevReg, Index + 1,
8483 OffsetRegOperand.
getReg(),
8484 OffsetRegOperand.
isKill());
8491 MachineInstr *Lane0Load = *LoadToLaneInstrsAscending.begin();
8493 *std::next(LoadToLaneInstrsAscending.begin(), NumLanes / 2);
8500 CreateLDRInstruction(NumLanes, DestRegForMiddleIndex,
8501 OriginalSplitToLoadOffsetOperand.
getReg(),
8504 InstrIdxForVirtReg.
insert(
8505 std::make_pair(DestRegForMiddleIndex, InsInstrs.
size()));
8506 InsInstrs.
push_back(MiddleIndexLoadInstr);
8511 unsigned SubregType;
8514 SubregType = AArch64::ssub;
8517 SubregType = AArch64::hsub;
8520 SubregType = AArch64::bsub;
8524 "Got invalid NumLanes for machine-combiner gather pattern");
8527 auto SubRegToRegInstr =
8529 DestRegForSubregToReg)
8532 InstrIdxForVirtReg.
insert(
8533 std::make_pair(DestRegForSubregToReg, InsInstrs.
size()));
8537 auto LanesToLoadToReg1 =
8539 LoadToLaneInstrsAscending.end());
8540 PrevReg = SubRegToRegInstr->getOperand(0).getReg();
8542 const MachineOperand &OffsetRegOperand = LoadInstr->getOperand(3);
8543 PrevReg = CreateLD1Instruction(LoadInstr, PrevReg, Index + 1,
8544 OffsetRegOperand.
getReg(),
8545 OffsetRegOperand.
isKill());
8548 if (Index == NumLanes / 2 - 2) {
8583bool AArch64InstrInfo::getMachineCombinerPatterns(
8585 bool DoRegPressureReduce)
const {
8606 DoRegPressureReduce);
8635 const Register *ReplacedAddend =
nullptr) {
8636 assert(IdxMulOpd == 1 || IdxMulOpd == 2);
8638 unsigned IdxOtherOpd = IdxMulOpd == 1 ? 2 : 1;
8641 Register SrcReg0 = MUL->getOperand(1).getReg();
8642 bool Src0IsKill = MUL->getOperand(1).isKill();
8643 Register SrcReg1 = MUL->getOperand(2).getReg();
8644 bool Src1IsKill = MUL->getOperand(2).isKill();
8648 if (ReplacedAddend) {
8650 SrcReg2 = *ReplacedAddend;
8677 .
addImm(MUL->getOperand(3).getImm());
8684 assert(
false &&
"Invalid FMA instruction kind \n");
8698 if (AArch64::FPR32RegClass.hasSubClassEq(RC))
8699 Opc = AArch64::FNMADDSrrr;
8700 else if (AArch64::FPR64RegClass.hasSubClassEq(RC))
8701 Opc = AArch64::FNMADDDrrr;
8735 unsigned IdxDupOp,
unsigned MulOpc,
8737 assert(((IdxDupOp == 1) || (IdxDupOp == 2)) &&
8738 "Invalid index of FMUL operand");
8746 if (Dup->
getOpcode() == TargetOpcode::COPY)
8755 unsigned IdxMulOp = IdxDupOp == 1 ? 2 : 1;
8796 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
8811 genNeg(MF, MRI,
TII, Root, InsInstrs, InstrIdxForVirtReg, MnegOpc, RC);
8838 genNeg(MF, MRI,
TII, Root, InsInstrs, InstrIdxForVirtReg, MnegOpc, RC);
8866 unsigned IdxMulOpd,
unsigned MaddOpc,
unsigned VR,
8868 assert(IdxMulOpd == 1 || IdxMulOpd == 2);
8872 Register SrcReg0 = MUL->getOperand(1).getReg();
8873 bool Src0IsKill = MUL->getOperand(1).isKill();
8874 Register SrcReg1 = MUL->getOperand(2).getReg();
8875 bool Src1IsKill = MUL->getOperand(2).isKill();
8905 assert(IdxOpd1 == 1 || IdxOpd1 == 2);
8906 unsigned IdxOtherOpd = IdxOpd1 == 1 ? 2 : 1;
8920 if (Opcode == AArch64::SUBSWrr)
8921 Opcode = AArch64::SUBWrr;
8922 else if (Opcode == AArch64::SUBSXrr)
8923 Opcode = AArch64::SUBXrr;
8925 assert((Opcode == AArch64::SUBWrr || Opcode == AArch64::SUBXrr) &&
8926 "Unexpected instruction opcode.");
8943 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
8950unsigned AArch64InstrInfo::getReduceOpcodeForAccumulator(
8951 unsigned int AccumulatorOpCode)
const {
8952 switch (AccumulatorOpCode) {
8953 case AArch64::UABALB_ZZZ_D:
8954 case AArch64::SABALB_ZZZ_D:
8955 case AArch64::UABALT_ZZZ_D:
8956 case AArch64::SABALT_ZZZ_D:
8957 return AArch64::ADD_ZZZ_D;
8958 case AArch64::UABALB_ZZZ_H:
8959 case AArch64::SABALB_ZZZ_H:
8960 case AArch64::UABALT_ZZZ_H:
8961 case AArch64::SABALT_ZZZ_H:
8962 return AArch64::ADD_ZZZ_H;
8963 case AArch64::UABALB_ZZZ_S:
8964 case AArch64::SABALB_ZZZ_S:
8965 case AArch64::UABALT_ZZZ_S:
8966 case AArch64::SABALT_ZZZ_S:
8967 return AArch64::ADD_ZZZ_S;
8968 case AArch64::UABALv16i8_v8i16:
8969 case AArch64::SABALv8i8_v8i16:
8970 case AArch64::SABAv8i16:
8971 case AArch64::UABAv8i16:
8972 return AArch64::ADDv8i16;
8973 case AArch64::SABALv2i32_v2i64:
8974 case AArch64::UABALv2i32_v2i64:
8975 case AArch64::SABALv4i32_v2i64:
8976 return AArch64::ADDv2i64;
8977 case AArch64::UABALv4i16_v4i32:
8978 case AArch64::SABALv4i16_v4i32:
8979 case AArch64::SABALv8i16_v4i32:
8980 case AArch64::SABAv4i32:
8981 case AArch64::UABAv4i32:
8982 return AArch64::ADDv4i32;
8983 case AArch64::UABALv4i32_v2i64:
8984 return AArch64::ADDv2i64;
8985 case AArch64::UABALv8i16_v4i32:
8986 return AArch64::ADDv4i32;
8987 case AArch64::UABALv8i8_v8i16:
8988 case AArch64::SABALv16i8_v8i16:
8989 return AArch64::ADDv8i16;
8990 case AArch64::UABAv16i8:
8991 case AArch64::SABAv16i8:
8992 return AArch64::ADDv16i8;
8993 case AArch64::UABAv4i16:
8994 case AArch64::SABAv4i16:
8995 return AArch64::ADDv4i16;
8996 case AArch64::UABAv2i32:
8997 case AArch64::SABAv2i32:
8998 return AArch64::ADDv2i32;
8999 case AArch64::UABAv8i8:
9000 case AArch64::SABAv8i8:
9001 return AArch64::ADDv8i8;
9010void AArch64InstrInfo::genAlternativeCodeSequence(
9020 MachineInstr *
MUL =
nullptr;
9021 const TargetRegisterClass *RC;
9027 DelInstrs, InstrIdxForVirtReg);
9033 InstrIdxForVirtReg);
9039 InstrIdxForVirtReg);
9048 Opc = AArch64::MADDWrrr;
9049 RC = &AArch64::GPR32RegClass;
9051 Opc = AArch64::MADDXrrr;
9052 RC = &AArch64::GPR64RegClass;
9063 Opc = AArch64::MADDWrrr;
9064 RC = &AArch64::GPR32RegClass;
9066 Opc = AArch64::MADDXrrr;
9067 RC = &AArch64::GPR64RegClass;
9080 const TargetRegisterClass *RC;
9081 unsigned BitSize, MovImm;
9084 MovImm = AArch64::MOVi32imm;
9085 RC = &AArch64::GPR32spRegClass;
9087 Opc = AArch64::MADDWrrr;
9088 RC = &AArch64::GPR32RegClass;
9090 MovImm = AArch64::MOVi64imm;
9091 RC = &AArch64::GPR64spRegClass;
9093 Opc = AArch64::MADDXrrr;
9094 RC = &AArch64::GPR64RegClass;
9105 uint64_t UImm =
SignExtend64(IsSub ? -Imm : Imm, BitSize);
9109 if (Insn.
size() != 1)
9111 MachineInstrBuilder MIB1 =
9112 BuildMI(MF, MIMetadata(Root),
TII->get(MovImm), NewVR)
9113 .
addImm(IsSub ? -Imm : Imm);
9115 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9126 const TargetRegisterClass *SubRC;
9127 unsigned SubOpc, ZeroReg;
9129 SubOpc = AArch64::SUBWrr;
9130 SubRC = &AArch64::GPR32spRegClass;
9131 ZeroReg = AArch64::WZR;
9132 Opc = AArch64::MADDWrrr;
9133 RC = &AArch64::GPR32RegClass;
9135 SubOpc = AArch64::SUBXrr;
9136 SubRC = &AArch64::GPR64spRegClass;
9137 ZeroReg = AArch64::XZR;
9138 Opc = AArch64::MADDXrrr;
9139 RC = &AArch64::GPR64RegClass;
9143 MachineInstrBuilder MIB1 =
9144 BuildMI(MF, MIMetadata(Root),
TII->get(SubOpc), NewVR)
9148 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9159 Opc = AArch64::MSUBWrrr;
9160 RC = &AArch64::GPR32RegClass;
9162 Opc = AArch64::MSUBXrrr;
9163 RC = &AArch64::GPR64RegClass;
9168 Opc = AArch64::MLAv8i8;
9169 RC = &AArch64::FPR64RegClass;
9173 Opc = AArch64::MLAv8i8;
9174 RC = &AArch64::FPR64RegClass;
9178 Opc = AArch64::MLAv16i8;
9179 RC = &AArch64::FPR128RegClass;
9183 Opc = AArch64::MLAv16i8;
9184 RC = &AArch64::FPR128RegClass;
9188 Opc = AArch64::MLAv4i16;
9189 RC = &AArch64::FPR64RegClass;
9193 Opc = AArch64::MLAv4i16;
9194 RC = &AArch64::FPR64RegClass;
9198 Opc = AArch64::MLAv8i16;
9199 RC = &AArch64::FPR128RegClass;
9203 Opc = AArch64::MLAv8i16;
9204 RC = &AArch64::FPR128RegClass;
9208 Opc = AArch64::MLAv2i32;
9209 RC = &AArch64::FPR64RegClass;
9213 Opc = AArch64::MLAv2i32;
9214 RC = &AArch64::FPR64RegClass;
9218 Opc = AArch64::MLAv4i32;
9219 RC = &AArch64::FPR128RegClass;
9223 Opc = AArch64::MLAv4i32;
9224 RC = &AArch64::FPR128RegClass;
9229 Opc = AArch64::MLAv8i8;
9230 RC = &AArch64::FPR64RegClass;
9232 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv8i8,
9236 Opc = AArch64::MLSv8i8;
9237 RC = &AArch64::FPR64RegClass;
9241 Opc = AArch64::MLAv16i8;
9242 RC = &AArch64::FPR128RegClass;
9244 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv16i8,
9248 Opc = AArch64::MLSv16i8;
9249 RC = &AArch64::FPR128RegClass;
9253 Opc = AArch64::MLAv4i16;
9254 RC = &AArch64::FPR64RegClass;
9256 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i16,
9260 Opc = AArch64::MLSv4i16;
9261 RC = &AArch64::FPR64RegClass;
9265 Opc = AArch64::MLAv8i16;
9266 RC = &AArch64::FPR128RegClass;
9268 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv8i16,
9272 Opc = AArch64::MLSv8i16;
9273 RC = &AArch64::FPR128RegClass;
9277 Opc = AArch64::MLAv2i32;
9278 RC = &AArch64::FPR64RegClass;
9280 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv2i32,
9284 Opc = AArch64::MLSv2i32;
9285 RC = &AArch64::FPR64RegClass;
9289 Opc = AArch64::MLAv4i32;
9290 RC = &AArch64::FPR128RegClass;
9292 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i32,
9296 Opc = AArch64::MLSv4i32;
9297 RC = &AArch64::FPR128RegClass;
9302 Opc = AArch64::MLAv4i16_indexed;
9303 RC = &AArch64::FPR64RegClass;
9307 Opc = AArch64::MLAv4i16_indexed;
9308 RC = &AArch64::FPR64RegClass;
9312 Opc = AArch64::MLAv8i16_indexed;
9313 RC = &AArch64::FPR128RegClass;
9317 Opc = AArch64::MLAv8i16_indexed;
9318 RC = &AArch64::FPR128RegClass;
9322 Opc = AArch64::MLAv2i32_indexed;
9323 RC = &AArch64::FPR64RegClass;
9327 Opc = AArch64::MLAv2i32_indexed;
9328 RC = &AArch64::FPR64RegClass;
9332 Opc = AArch64::MLAv4i32_indexed;
9333 RC = &AArch64::FPR128RegClass;
9337 Opc = AArch64::MLAv4i32_indexed;
9338 RC = &AArch64::FPR128RegClass;
9343 Opc = AArch64::MLAv4i16_indexed;
9344 RC = &AArch64::FPR64RegClass;
9346 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i16,
9350 Opc = AArch64::MLSv4i16_indexed;
9351 RC = &AArch64::FPR64RegClass;
9355 Opc = AArch64::MLAv8i16_indexed;
9356 RC = &AArch64::FPR128RegClass;
9358 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv8i16,
9362 Opc = AArch64::MLSv8i16_indexed;
9363 RC = &AArch64::FPR128RegClass;
9367 Opc = AArch64::MLAv2i32_indexed;
9368 RC = &AArch64::FPR64RegClass;
9370 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv2i32,
9374 Opc = AArch64::MLSv2i32_indexed;
9375 RC = &AArch64::FPR64RegClass;
9379 Opc = AArch64::MLAv4i32_indexed;
9380 RC = &AArch64::FPR128RegClass;
9382 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i32,
9386 Opc = AArch64::MLSv4i32_indexed;
9387 RC = &AArch64::FPR128RegClass;
9393 Opc = AArch64::FMADDHrrr;
9394 RC = &AArch64::FPR16RegClass;
9398 Opc = AArch64::FMADDSrrr;
9399 RC = &AArch64::FPR32RegClass;
9403 Opc = AArch64::FMADDDrrr;
9404 RC = &AArch64::FPR64RegClass;
9409 Opc = AArch64::FMADDHrrr;
9410 RC = &AArch64::FPR16RegClass;
9414 Opc = AArch64::FMADDSrrr;
9415 RC = &AArch64::FPR32RegClass;
9419 Opc = AArch64::FMADDDrrr;
9420 RC = &AArch64::FPR64RegClass;
9425 Opc = AArch64::FMLAv1i32_indexed;
9426 RC = &AArch64::FPR32RegClass;
9431 Opc = AArch64::FMLAv1i32_indexed;
9432 RC = &AArch64::FPR32RegClass;
9438 Opc = AArch64::FMLAv1i64_indexed;
9439 RC = &AArch64::FPR64RegClass;
9444 Opc = AArch64::FMLAv1i64_indexed;
9445 RC = &AArch64::FPR64RegClass;
9451 RC = &AArch64::FPR64RegClass;
9452 Opc = AArch64::FMLAv4i16_indexed;
9457 RC = &AArch64::FPR64RegClass;
9458 Opc = AArch64::FMLAv4f16;
9463 RC = &AArch64::FPR64RegClass;
9464 Opc = AArch64::FMLAv4i16_indexed;
9469 RC = &AArch64::FPR64RegClass;
9470 Opc = AArch64::FMLAv4f16;
9477 RC = &AArch64::FPR64RegClass;
9479 Opc = AArch64::FMLAv2i32_indexed;
9483 Opc = AArch64::FMLAv2f32;
9490 RC = &AArch64::FPR64RegClass;
9492 Opc = AArch64::FMLAv2i32_indexed;
9496 Opc = AArch64::FMLAv2f32;
9503 RC = &AArch64::FPR128RegClass;
9504 Opc = AArch64::FMLAv8i16_indexed;
9509 RC = &AArch64::FPR128RegClass;
9510 Opc = AArch64::FMLAv8f16;
9515 RC = &AArch64::FPR128RegClass;
9516 Opc = AArch64::FMLAv8i16_indexed;
9521 RC = &AArch64::FPR128RegClass;
9522 Opc = AArch64::FMLAv8f16;
9529 RC = &AArch64::FPR128RegClass;
9531 Opc = AArch64::FMLAv2i64_indexed;
9535 Opc = AArch64::FMLAv2f64;
9542 RC = &AArch64::FPR128RegClass;
9544 Opc = AArch64::FMLAv2i64_indexed;
9548 Opc = AArch64::FMLAv2f64;
9556 RC = &AArch64::FPR128RegClass;
9558 Opc = AArch64::FMLAv4i32_indexed;
9562 Opc = AArch64::FMLAv4f32;
9570 RC = &AArch64::FPR128RegClass;
9572 Opc = AArch64::FMLAv4i32_indexed;
9576 Opc = AArch64::FMLAv4f32;
9583 Opc = AArch64::FNMSUBHrrr;
9584 RC = &AArch64::FPR16RegClass;
9588 Opc = AArch64::FNMSUBSrrr;
9589 RC = &AArch64::FPR32RegClass;
9593 Opc = AArch64::FNMSUBDrrr;
9594 RC = &AArch64::FPR64RegClass;
9599 Opc = AArch64::FNMADDHrrr;
9600 RC = &AArch64::FPR16RegClass;
9604 Opc = AArch64::FNMADDSrrr;
9605 RC = &AArch64::FPR32RegClass;
9609 Opc = AArch64::FNMADDDrrr;
9610 RC = &AArch64::FPR64RegClass;
9615 Opc = AArch64::FMSUBHrrr;
9616 RC = &AArch64::FPR16RegClass;
9620 Opc = AArch64::FMSUBSrrr;
9621 RC = &AArch64::FPR32RegClass;
9625 Opc = AArch64::FMSUBDrrr;
9626 RC = &AArch64::FPR64RegClass;
9631 Opc = AArch64::FMLSv1i32_indexed;
9632 RC = &AArch64::FPR32RegClass;
9638 Opc = AArch64::FMLSv1i64_indexed;
9639 RC = &AArch64::FPR64RegClass;
9646 RC = &AArch64::FPR64RegClass;
9648 MachineInstrBuilder MIB1 =
9649 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv4f16), NewVR)
9652 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9654 Opc = AArch64::FMLAv4f16;
9658 Opc = AArch64::FMLAv4i16_indexed;
9665 RC = &AArch64::FPR64RegClass;
9666 Opc = AArch64::FMLSv4f16;
9671 RC = &AArch64::FPR64RegClass;
9672 Opc = AArch64::FMLSv4i16_indexed;
9679 RC = &AArch64::FPR64RegClass;
9681 Opc = AArch64::FMLSv2i32_indexed;
9685 Opc = AArch64::FMLSv2f32;
9693 RC = &AArch64::FPR128RegClass;
9695 MachineInstrBuilder MIB1 =
9696 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv8f16), NewVR)
9699 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9701 Opc = AArch64::FMLAv8f16;
9705 Opc = AArch64::FMLAv8i16_indexed;
9712 RC = &AArch64::FPR128RegClass;
9713 Opc = AArch64::FMLSv8f16;
9718 RC = &AArch64::FPR128RegClass;
9719 Opc = AArch64::FMLSv8i16_indexed;
9726 RC = &AArch64::FPR128RegClass;
9728 Opc = AArch64::FMLSv2i64_indexed;
9732 Opc = AArch64::FMLSv2f64;
9740 RC = &AArch64::FPR128RegClass;
9742 Opc = AArch64::FMLSv4i32_indexed;
9746 Opc = AArch64::FMLSv4f32;
9753 RC = &AArch64::FPR64RegClass;
9755 MachineInstrBuilder MIB1 =
9756 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv2f32), NewVR)
9759 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9761 Opc = AArch64::FMLAv2i32_indexed;
9765 Opc = AArch64::FMLAv2f32;
9773 RC = &AArch64::FPR128RegClass;
9775 MachineInstrBuilder MIB1 =
9776 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv4f32), NewVR)
9779 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9781 Opc = AArch64::FMLAv4i32_indexed;
9785 Opc = AArch64::FMLAv4f32;
9793 RC = &AArch64::FPR128RegClass;
9795 MachineInstrBuilder MIB1 =
9796 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv2f64), NewVR)
9799 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9801 Opc = AArch64::FMLAv2i64_indexed;
9805 Opc = AArch64::FMLAv2f64;
9817 &AArch64::FPR128RegClass, MRI);
9826 &AArch64::FPR128RegClass, MRI);
9835 &AArch64::FPR128_loRegClass, MRI);
9844 &AArch64::FPR128RegClass, MRI);
9853 &AArch64::FPR128_loRegClass, MRI);
9887 for (
auto *
MI : InsInstrs)
9888 MI->setFlags(Flags);
9929 bool IsNegativeBranch =
false;
9930 bool IsTestAndBranch =
false;
9931 unsigned TargetBBInMI = 0;
9932 switch (
MI.getOpcode()) {
9936 case AArch64::CBWPri:
9937 case AArch64::CBXPri:
9938 case AArch64::CBBAssertExt:
9939 case AArch64::CBHAssertExt:
9940 case AArch64::CBWPrr:
9941 case AArch64::CBXPrr:
9947 case AArch64::CBNZW:
9948 case AArch64::CBNZX:
9950 IsNegativeBranch =
true;
9955 IsTestAndBranch =
true;
9957 case AArch64::TBNZW:
9958 case AArch64::TBNZX:
9960 IsNegativeBranch =
true;
9961 IsTestAndBranch =
true;
9967 if (IsTestAndBranch &&
MI.getOperand(1).getImm())
9971 assert(
MI.getParent() &&
"Incomplete machine instruction\n");
9982 while (
DefMI->isCopy()) {
9991 switch (
DefMI->getOpcode()) {
9995 case AArch64::ANDWri:
9996 case AArch64::ANDXri: {
9997 if (IsTestAndBranch)
10004 bool Is32Bit = (
DefMI->getOpcode() == AArch64::ANDWri);
10006 DefMI->getOperand(2).getImm(), Is32Bit ? 32 : 64);
10020 unsigned Imm =
Log2_64(Mask);
10021 unsigned Opc = (Imm < 32)
10022 ? (IsNegativeBranch ? AArch64::TBNZW : AArch64::TBZW)
10023 : (IsNegativeBranch ? AArch64::TBNZX : AArch64::TBZX);
10036 if (!Is32Bit && Imm < 32)
10038 MI.eraseFromParent();
10042 case AArch64::CSINCWr:
10043 case AArch64::CSINCXr: {
10044 if (!(
DefMI->getOperand(1).getReg() == AArch64::WZR &&
10045 DefMI->getOperand(2).getReg() == AArch64::WZR) &&
10046 !(
DefMI->getOperand(1).getReg() == AArch64::XZR &&
10047 DefMI->getOperand(2).getReg() == AArch64::XZR))
10050 if (
DefMI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
10063 if (IsNegativeBranch)
10066 MI.eraseFromParent();
10072std::pair<unsigned, unsigned>
10073AArch64InstrInfo::decomposeMachineOperandsTargetFlags(
unsigned TF)
const {
10075 return std::make_pair(TF & Mask, TF & ~Mask);
10079AArch64InstrInfo::getSerializableDirectMachineOperandTargetFlags()
const {
10082 static const std::pair<unsigned, const char *> TargetFlags[] = {
10083 {MO_PAGE,
"aarch64-page"}, {
MO_PAGEOFF,
"aarch64-pageoff"},
10084 {
MO_G3,
"aarch64-g3"}, {
MO_G2,
"aarch64-g2"},
10085 {
MO_G1,
"aarch64-g1"}, {
MO_G0,
"aarch64-g0"},
10091AArch64InstrInfo::getSerializableBitmaskMachineOperandTargetFlags()
const {
10092 using namespace AArch64II;
10094 static const std::pair<unsigned, const char *> TargetFlags[] = {
10096 {
MO_GOT,
"aarch64-got"},
10097 {
MO_NC,
"aarch64-nc"},
10098 {
MO_S,
"aarch64-s"},
10099 {
MO_TLS,
"aarch64-tls"},
10109AArch64InstrInfo::getSerializableMachineMemOperandTargetFlags()
const {
10110 static const std::pair<MachineMemOperand::Flags, const char *> TargetFlags[] =
10212 MachineFunction *MF =
C.getMF();
10214 const AArch64RegisterInfo *ARI =
10215 static_cast<const AArch64RegisterInfo *
>(&
TRI);
10218 for (
unsigned Reg : AArch64::GPR64RegClass) {
10220 Reg != AArch64::LR &&
10221 Reg != AArch64::X16 &&
10222 Reg != AArch64::X17 &&
10223 C.isAvailableAcrossAndOutOfSeq(
Reg,
TRI) &&
10224 C.isAvailableInsideSeq(
Reg,
TRI))
10255 return SubtargetA.hasV8_3aOps() == SubtargetB.hasV8_3aOps();
10258std::optional<std::unique_ptr<outliner::OutlinedFunction>>
10259AArch64InstrInfo::getOutliningCandidateInfo(
10261 std::vector<outliner::Candidate> &RepeatedSequenceLocs,
10262 unsigned MinRepeats)
const {
10263 unsigned SequenceSize = 0;
10264 for (
auto &
MI : RepeatedSequenceLocs[0])
10267 unsigned NumBytesToCreateFrame = 0;
10273 MachineInstr &LastMI = RepeatedSequenceLocs[0].back();
10274 MachineInstr &FirstMI = RepeatedSequenceLocs[0].front();
10275 if (LastMI.
getOpcode() == AArch64::ADRP &&
10278 return std::nullopt;
10283 if ((FirstMI.
getOpcode() == AArch64::ADDXri ||
10284 FirstMI.
getOpcode() == AArch64::LDRXui) &&
10287 return std::nullopt;
10298 if (std::adjacent_find(
10299 RepeatedSequenceLocs.begin(), RepeatedSequenceLocs.end(),
10300 [](
const outliner::Candidate &a,
const outliner::Candidate &b) {
10303 if (outliningCandidatesSigningScopeConsensus(a, b) &&
10304 outliningCandidatesSigningKeyConsensus(a, b) &&
10305 outliningCandidatesV8_3OpsConsensus(a, b)) {
10309 }) != RepeatedSequenceLocs.end()) {
10310 return std::nullopt;
10327 unsigned NumBytesToCheckLRInTCEpilogue = 0;
10328 const auto RASignCondition = RepeatedSequenceLocs[0]
10331 ->getSignReturnAddressCondition();
10334 NumBytesToCreateFrame += 8;
10337 auto LRCheckMethod = Subtarget.getAuthenticatedLRCheckMethod(
10338 *RepeatedSequenceLocs[0].getMF());
10339 NumBytesToCheckLRInTCEpilogue =
10343 if (isTailCallReturnInst(RepeatedSequenceLocs[0].
back()))
10344 SequenceSize += NumBytesToCheckLRInTCEpilogue;
10352 for (
auto &
MI :
C) {
10353 if (
MI.modifiesRegister(AArch64::SP, &
TRI)) {
10354 switch (
MI.getOpcode()) {
10355 case AArch64::ADDXri:
10356 case AArch64::ADDWri:
10357 assert(
MI.getNumOperands() == 4 &&
"Wrong number of operands");
10358 assert(
MI.getOperand(2).isImm() &&
10359 "Expected operand to be immediate");
10360 assert(
MI.getOperand(1).isReg() &&
10361 "Expected operand to be a register");
10365 if (
MI.getOperand(1).getReg() == AArch64::SP)
10366 SPValue +=
MI.getOperand(2).getImm();
10370 case AArch64::SUBXri:
10371 case AArch64::SUBWri:
10372 assert(
MI.getNumOperands() == 4 &&
"Wrong number of operands");
10373 assert(
MI.getOperand(2).isImm() &&
10374 "Expected operand to be immediate");
10375 assert(
MI.getOperand(1).isReg() &&
10376 "Expected operand to be a register");
10380 if (
MI.getOperand(1).getReg() == AArch64::SP)
10381 SPValue -=
MI.getOperand(2).getImm();
10398 if (RepeatedSequenceLocs.size() < MinRepeats)
10399 return std::nullopt;
10403 unsigned FlagsSetInAll = 0xF;
10407 FlagsSetInAll &=
C.Flags;
10409 unsigned LastInstrOpcode = RepeatedSequenceLocs[0].back().getOpcode();
10412 auto SetCandidateCallInfo =
10413 [&RepeatedSequenceLocs](
unsigned CallID,
unsigned NumBytesForCall) {
10415 C.setCallInfo(CallID, NumBytesForCall);
10419 NumBytesToCreateFrame += 4;
10427 unsigned CFICount = 0;
10428 for (
auto &
I : RepeatedSequenceLocs[0]) {
10429 if (
I.isCFIInstruction())
10439 std::vector<MCCFIInstruction> CFIInstructions =
10440 C.getMF()->getFrameInstructions();
10442 if (CFICount > 0 && CFICount != CFIInstructions.size())
10443 return std::nullopt;
10451 if (!
MI.modifiesRegister(AArch64::SP, &
TRI) &&
10452 !
MI.readsRegister(AArch64::SP, &
TRI))
10458 if (
MI.modifiesRegister(AArch64::SP, &
TRI))
10463 if (
MI.mayLoadOrStore()) {
10466 bool OffsetIsScalable;
10470 if (!getMemOperandWithOffset(
MI,
Base,
Offset, OffsetIsScalable, &
TRI) ||
10471 !
Base->isReg() ||
Base->getReg() != AArch64::SP)
10475 if (OffsetIsScalable)
10483 TypeSize Scale(0U,
false), DummyWidth(0U,
false);
10484 getMemOpInfo(
MI.getOpcode(), Scale, DummyWidth, MinOffset, MaxOffset);
10487 if (
Offset < MinOffset * (int64_t)Scale.getFixedValue() ||
10488 Offset > MaxOffset * (int64_t)Scale.getFixedValue())
10503 bool AllStackInstrsSafe =
10508 if (RepeatedSequenceLocs[0].
back().isTerminator()) {
10510 NumBytesToCreateFrame = 0;
10511 unsigned NumBytesForCall = 4 + NumBytesToCheckLRInTCEpilogue;
10515 else if (LastInstrOpcode == AArch64::BL ||
10516 ((LastInstrOpcode == AArch64::BLR ||
10517 LastInstrOpcode == AArch64::BLRNoIP) &&
10521 NumBytesToCreateFrame = NumBytesToCheckLRInTCEpilogue;
10529 unsigned NumBytesNoStackCalls = 0;
10530 std::vector<outliner::Candidate> CandidatesWithoutStackFixups;
10536 ?
C.isAvailableAcrossAndOutOfSeq(AArch64::LR,
TRI)
10545 C.getMF()->getFunction().hasFnAttribute(Attribute::NoReturn);
10548 if (LRAvailable && !IsNoReturn) {
10549 NumBytesNoStackCalls += 4;
10551 CandidatesWithoutStackFixups.push_back(
C);
10556 else if (findRegisterToSaveLRTo(
C)) {
10557 NumBytesNoStackCalls += 12;
10559 CandidatesWithoutStackFixups.push_back(
C);
10564 else if (
C.isAvailableInsideSeq(AArch64::SP,
TRI)) {
10565 NumBytesNoStackCalls += 12;
10567 CandidatesWithoutStackFixups.push_back(
C);
10573 NumBytesNoStackCalls += SequenceSize;
10580 if (!AllStackInstrsSafe ||
10581 NumBytesNoStackCalls <= RepeatedSequenceLocs.size() * 12) {
10582 RepeatedSequenceLocs = CandidatesWithoutStackFixups;
10584 if (RepeatedSequenceLocs.size() < MinRepeats)
10585 return std::nullopt;
10638 (!
C.isAvailableAcrossAndOutOfSeq(AArch64::LR,
TRI) ||
10639 !findRegisterToSaveLRTo(
C));
10645 if (RepeatedSequenceLocs.size() < MinRepeats)
10646 return std::nullopt;
10655 bool ModStackToSaveLR =
false;
10658 ModStackToSaveLR =
true;
10667 ModStackToSaveLR =
true;
10669 if (ModStackToSaveLR) {
10671 if (!AllStackInstrsSafe)
10672 return std::nullopt;
10675 NumBytesToCreateFrame += 8;
10682 return std::nullopt;
10684 return std::make_unique<outliner::OutlinedFunction>(
10685 RepeatedSequenceLocs, SequenceSize, NumBytesToCreateFrame, FrameID);
10688void AArch64InstrInfo::mergeOutliningCandidateAttributes(
10689 Function &
F, std::vector<outliner::Candidate> &Candidates)
const {
10693 const auto &CFn = Candidates.front().getMF()->getFunction();
10695 if (CFn.hasFnAttribute(
"ptrauth-returns"))
10696 F.addFnAttr(CFn.getFnAttribute(
"ptrauth-returns"));
10697 if (CFn.hasFnAttribute(
"ptrauth-auth-traps"))
10698 F.addFnAttr(CFn.getFnAttribute(
"ptrauth-auth-traps"));
10701 if (CFn.hasFnAttribute(
"sign-return-address"))
10702 F.addFnAttr(CFn.getFnAttribute(
"sign-return-address"));
10703 if (CFn.hasFnAttribute(
"sign-return-address-key"))
10704 F.addFnAttr(CFn.getFnAttribute(
"sign-return-address-key"));
10706 AArch64GenInstrInfo::mergeOutliningCandidateAttributes(
F, Candidates);
10709bool AArch64InstrInfo::isFunctionSafeToOutlineFrom(
10714 if (!OutlineFromLinkOnceODRs &&
F.hasLinkOnceODRLinkage())
10721 if (
F.hasSection())
10727 AArch64FunctionInfo *AFI = MF.
getInfo<AArch64FunctionInfo>();
10728 if (!AFI || AFI->
hasRedZone().value_or(
true))
10748 unsigned &Flags)
const {
10750 "Must track liveness!");
10752 std::pair<MachineBasicBlock::iterator, MachineBasicBlock::iterator>>
10767 auto AreAllUnsafeRegsDead = [&LRU]() {
10768 return LRU.available(AArch64::W16) && LRU.available(AArch64::W17) &&
10769 LRU.available(AArch64::NZCV);
10784 bool LRAvailableEverywhere =
true;
10786 LRU.addLiveOuts(
MBB);
10788 auto UpdateWholeMBBFlags = [&
Flags](
const MachineInstr &
MI) {
10789 if (
MI.isCall() && !
MI.isTerminator())
10795 auto CreateNewRangeStartingAt =
10796 [&RangeBegin, &RangeEnd,
10798 RangeBegin = NewBegin;
10799 RangeEnd = std::next(RangeBegin);
10802 auto SaveRangeIfNonEmpty = [&RangeLen, &
Ranges, &RangeBegin, &RangeEnd]() {
10808 if (!RangeBegin.isEnd() && RangeBegin->isBundledWithPred())
10810 if (!RangeEnd.isEnd() && RangeEnd->isBundledWithPred())
10812 Ranges.emplace_back(RangeBegin, RangeEnd);
10820 for (; FirstPossibleEndPt !=
MBB.
instr_rend(); ++FirstPossibleEndPt) {
10821 if (!FirstPossibleEndPt->isDebugInstr())
10822 LRU.stepBackward(*FirstPossibleEndPt);
10825 UpdateWholeMBBFlags(*FirstPossibleEndPt);
10826 if (AreAllUnsafeRegsDead())
10833 CreateNewRangeStartingAt(FirstPossibleEndPt->getIterator());
10838 if (!
MI.isDebugInstr())
10839 LRU.stepBackward(
MI);
10840 UpdateWholeMBBFlags(
MI);
10841 if (!AreAllUnsafeRegsDead()) {
10842 SaveRangeIfNonEmpty();
10843 CreateNewRangeStartingAt(
MI.getIterator());
10846 LRAvailableEverywhere &= LRU.available(AArch64::LR);
10847 RangeBegin =
MI.getIterator();
10852 if (AreAllUnsafeRegsDead())
10853 SaveRangeIfNonEmpty();
10861 if (!LRAvailableEverywhere)
10869 unsigned Flags)
const {
10870 MachineInstr &
MI = *MIT;
10874 switch (
MI.getOpcode()) {
10875 case AArch64::PACM:
10876 case AArch64::PACIASP:
10877 case AArch64::PACIBSP:
10878 case AArch64::PACIASPPC:
10879 case AArch64::PACIBSPPC:
10880 case AArch64::AUTIASP:
10881 case AArch64::AUTIBSP:
10882 case AArch64::AUTIASPPCi:
10883 case AArch64::AUTIASPPCr:
10884 case AArch64::AUTIBSPPCi:
10885 case AArch64::AUTIBSPPCr:
10886 case AArch64::RETAA:
10887 case AArch64::RETAB:
10888 case AArch64::RETAASPPCi:
10889 case AArch64::RETAASPPCr:
10890 case AArch64::RETABSPPCi:
10891 case AArch64::RETABSPPCr:
10892 case AArch64::EMITBKEY:
10893 case AArch64::PAUTH_PROLOGUE:
10894 case AArch64::PAUTH_EPILOGUE:
10904 if (
MI.isCFIInstruction())
10908 if (
MI.isTerminator())
10914 for (
const MachineOperand &MOP :
MI.operands()) {
10917 assert(!MOP.isCFIIndex());
10920 if (MOP.isReg() && !MOP.isImplicit() &&
10921 (MOP.getReg() == AArch64::LR || MOP.getReg() == AArch64::W30))
10928 if (
MI.getOpcode() == AArch64::ADRP)
10948 for (
const MachineOperand &MOP :
MI.operands()) {
10949 if (MOP.isGlobal()) {
10957 if (Callee &&
Callee->getName() ==
"\01_mcount")
10965 if (
MI.getOpcode() == AArch64::BLR ||
10966 MI.getOpcode() == AArch64::BLRNoIP ||
MI.getOpcode() == AArch64::BL)
10970 return UnknownCallOutlineType;
10978 return UnknownCallOutlineType;
10986 return UnknownCallOutlineType;
11007 for (MachineInstr &
MI :
MBB) {
11008 const MachineOperand *
Base;
11009 TypeSize Width(0,
false);
11011 bool OffsetIsScalable;
11014 if (!
MI.mayLoadOrStore() ||
11017 (
Base->isReg() &&
Base->getReg() != AArch64::SP))
11021 TypeSize Scale(0U,
false);
11022 int64_t Dummy1, Dummy2;
11025 assert(StackOffsetOperand.
isImm() &&
"Stack offset wasn't immediate!");
11027 assert(Scale != 0 &&
"Unexpected opcode!");
11028 assert(!OffsetIsScalable &&
"Expected offset to be a byte offset");
11033 int64_t NewImm = (
Offset + 16) / (int64_t)Scale.getFixedValue();
11034 StackOffsetOperand.
setImm(NewImm);
11040 bool ShouldSignReturnAddr) {
11041 if (!ShouldSignReturnAddr)
11049void AArch64InstrInfo::buildOutlinedFrame(
11053 AArch64FunctionInfo *FI = MF.
getInfo<AArch64FunctionInfo>();
11061 unsigned TailOpcode;
11063 TailOpcode = AArch64::TCRETURNdi;
11067 TailOpcode = AArch64::TCRETURNriALL;
11078 bool IsLeafFunction =
true;
11081 auto IsNonTailCall = [](
const MachineInstr &
MI) {
11082 return MI.isCall() && !
MI.isReturn();
11092 "Can only fix up stack references once");
11093 fixupPostOutline(
MBB);
11095 IsLeafFunction =
false;
11106 Et = std::prev(
MBB.
end());
11116 if (MF.
getInfo<AArch64FunctionInfo>()->needsDwarfUnwindInfo(MF)) {
11120 CFIBuilder.buildDefCFAOffset(16);
11124 CFIBuilder.buildOffset(AArch64::LR, -16);
11138 RASignCondition, !IsLeafFunction);
11167 fixupPostOutline(
MBB);
11178 .addGlobalAddress(
M.getNamedValue(MF.
getName()))
11188 .addGlobalAddress(
M.getNamedValue(MF.
getName())));
11197 MachineInstr *Save;
11198 MachineInstr *Restore;
11204 assert(
Reg &&
"No callee-saved register available?");
11238 .addGlobalAddress(
M.getNamedValue(MF.
getName())));
11246bool AArch64InstrInfo::shouldOutlineFromFunctionByDefault(
11254 bool AllowSideEffects)
const {
11256 const AArch64Subtarget &STI = MF.
getSubtarget<AArch64Subtarget>();
11259 if (
TRI.isGeneralPurposeRegister(MF,
Reg)) {
11272 assert(STI.hasNEON() &&
"Expected to have NEON.");
11278std::optional<DestSourcePair>
11283 if (((
MI.getOpcode() == AArch64::ORRWrs &&
11284 MI.getOperand(1).getReg() == AArch64::WZR &&
11285 MI.getOperand(3).getImm() == 0x0) ||
11286 (
MI.getOpcode() == AArch64::ORRWrr &&
11287 MI.getOperand(1).getReg() == AArch64::WZR)) &&
11289 (!
MI.getOperand(0).getReg().isVirtual() ||
11290 MI.getOperand(0).getSubReg() == 0) &&
11291 (!
MI.getOperand(0).getReg().isPhysical() ||
11296 if (
MI.getOpcode() == AArch64::ORRXrs &&
11297 MI.getOperand(1).getReg() == AArch64::XZR &&
11298 MI.getOperand(3).getImm() == 0x0)
11301 return std::nullopt;
11304std::optional<DestSourcePair>
11306 if ((
MI.getOpcode() == AArch64::ORRWrs &&
11307 MI.getOperand(1).getReg() == AArch64::WZR &&
11308 MI.getOperand(3).getImm() == 0x0) ||
11309 (
MI.getOpcode() == AArch64::ORRWrr &&
11310 MI.getOperand(1).getReg() == AArch64::WZR))
11312 return std::nullopt;
11315std::optional<RegImmPair>
11324 return std::nullopt;
11326 switch (
MI.getOpcode()) {
11328 return std::nullopt;
11329 case AArch64::SUBWri:
11330 case AArch64::SUBXri:
11331 case AArch64::SUBSWri:
11332 case AArch64::SUBSXri:
11335 case AArch64::ADDSWri:
11336 case AArch64::ADDSXri:
11337 case AArch64::ADDWri:
11338 case AArch64::ADDXri: {
11340 if (!
MI.getOperand(0).isReg() || !
MI.getOperand(1).isReg() ||
11341 !
MI.getOperand(2).isImm())
11342 return std::nullopt;
11343 int Shift =
MI.getOperand(3).getImm();
11344 assert((Shift == 0 || Shift == 12) &&
"Shift can be either 0 or 12");
11348 return RegImmPair{
MI.getOperand(1).getReg(),
Offset};
11354static std::optional<ParamLoadedValue>
11358 auto DestSrc =
TII->isCopyLikeInstr(
MI);
11360 return std::nullopt;
11362 Register DestReg = DestSrc->Destination->getReg();
11363 Register SrcReg = DestSrc->Source->getReg();
11366 return std::nullopt;
11371 if (DestReg == DescribedReg)
11375 if (
MI.getOpcode() == AArch64::ORRWrs &&
11376 TRI->isSuperRegister(DestReg, DescribedReg))
11380 if (
MI.getOpcode() == AArch64::ORRXrs &&
11381 TRI->isSubRegister(DestReg, DescribedReg)) {
11382 Register SrcSubReg =
TRI->getSubReg(SrcReg, AArch64::sub_32);
11386 assert(!
TRI->isSuperOrSubRegisterEq(DestReg, DescribedReg) &&
11387 "Unhandled ORR[XW]rs copy case");
11389 return std::nullopt;
11392bool AArch64InstrInfo::isFunctionSafeToSplit(
const MachineFunction &MF)
const {
11397 if (MF.
getInfo<AArch64FunctionInfo>()->hasRedZone().value_or(
true))
11403bool AArch64InstrInfo::isMBBSafeToSplitToCold(
11407 auto isAsmGoto = [](
const MachineInstr &
MI) {
11408 return MI.getOpcode() == AArch64::INLINEASM_BR;
11418 auto containsMBB = [&
MBB](
const MachineJumpTableEntry &JTE) {
11425 for (
const MachineInstr &
MI :
MBB) {
11426 switch (
MI.getOpcode()) {
11427 case TargetOpcode::G_BRJT:
11428 case AArch64::JumpTableDest32:
11429 case AArch64::JumpTableDest16:
11430 case AArch64::JumpTableDest8:
11441std::optional<ParamLoadedValue>
11444 const MachineFunction *MF =
MI.getMF();
11446 switch (
MI.getOpcode()) {
11447 case AArch64::MOVZWi:
11448 case AArch64::MOVZXi: {
11451 if (!
TRI->isSuperRegisterEq(
MI.getOperand(0).getReg(),
Reg))
11452 return std::nullopt;
11454 if (!
MI.getOperand(1).isImm())
11455 return std::nullopt;
11456 int64_t Immediate =
MI.getOperand(1).getImm();
11457 int Shift =
MI.getOperand(2).getImm();
11461 case AArch64::ORRWrs:
11462 case AArch64::ORRXrs:
11469bool AArch64InstrInfo::isExtendLikelyToBeFolded(
11472 ExtMI.
getOpcode() == TargetOpcode::G_ZEXT ||
11473 ExtMI.
getOpcode() == TargetOpcode::G_ANYEXT);
11476 if (ExtMI.
getOpcode() == TargetOpcode::G_ANYEXT)
11486 return UserMI->
getOpcode() == TargetOpcode::G_PTR_ADD;
11489uint64_t AArch64InstrInfo::getElementSizeForOpcode(
unsigned Opc)
const {
11493bool AArch64InstrInfo::isPTestLikeOpcode(
unsigned Opc)
const {
11497bool AArch64InstrInfo::isWhileOpcode(
unsigned Opc)
const {
11502AArch64InstrInfo::getTailDuplicateSize(
CodeGenOptLevel OptLevel)
const {
11506bool AArch64InstrInfo::isLegalAddressingMode(
unsigned NumBytes, int64_t
Offset,
11507 unsigned Scale)
const {
11518 unsigned Shift =
Log2_64(NumBytes);
11519 if (NumBytes &&
Offset > 0 && (
Offset / NumBytes) <= (1LL << 12) - 1 &&
11527 return Scale == 1 || (Scale > 0 && Scale == NumBytes);
11532 return AArch64::BLRNoIP;
11534 return AArch64::BLR;
11540 auto Builder =
BuildMI(
MBB, InsertPt,
DL,
get(AArch64::PAUTH_EPILOGUE))
11550 if (Subtarget.hasPAuthLR())
11561 Register TargetReg,
bool FrameSetup)
const {
11562 assert(TargetReg != AArch64::SP &&
"New top of stack cannot already be in SP");
11574 MF.
insert(MBBInsertPoint, LoopTestMBB);
11577 MF.
insert(MBBInsertPoint, LoopBodyMBB);
11579 MF.
insert(MBBInsertPoint, ExitMBB);
11589 BuildMI(*LoopTestMBB, LoopTestMBB->
end(),
DL,
TII->get(AArch64::SUBSXrx64),
11597 BuildMI(*LoopTestMBB, LoopTestMBB->
end(),
DL,
TII->get(AArch64::Bcc))
11603 BuildMI(*LoopBodyMBB, LoopBodyMBB->
end(),
DL,
TII->get(AArch64::LDRXui))
11620 BuildMI(*ExitMBB, ExitMBB->
end(),
DL,
TII->get(AArch64::ADDXri), AArch64::SP)
11639 MBB.addSuccessor(LoopTestMBB);
11645 return ExitMBB->
begin();
11650 MachineFunction *MF;
11651 const TargetInstrInfo *
TII;
11652 const TargetRegisterInfo *
TRI;
11653 MachineRegisterInfo &MRI;
11656 MachineBasicBlock *LoopBB;
11658 MachineInstr *CondBranch;
11660 MachineInstr *Comp;
11662 unsigned CompCounterOprNum;
11664 MachineInstr *Update;
11666 unsigned UpdateCounterOprNum;
11670 bool IsUpdatePriorComp;
11676 AArch64PipelinerLoopInfo(MachineBasicBlock *LoopBB, MachineInstr *CondBranch,
11677 MachineInstr *Comp,
unsigned CompCounterOprNum,
11678 MachineInstr *Update,
unsigned UpdateCounterOprNum,
11679 Register Init,
bool IsUpdatePriorComp,
11680 const SmallVectorImpl<MachineOperand> &
Cond)
11682 TII(MF->getSubtarget().getInstrInfo()),
11683 TRI(MF->getSubtarget().getRegisterInfo()), MRI(MF->getRegInfo()),
11684 LoopBB(LoopBB), CondBranch(CondBranch), Comp(Comp),
11685 CompCounterOprNum(CompCounterOprNum), Update(Update),
11686 UpdateCounterOprNum(UpdateCounterOprNum), Init(Init),
11689 bool shouldIgnoreForPipelining(
const MachineInstr *
MI)
const override {
11695 std::optional<bool> createTripCountGreaterCondition(
11696 int TC, MachineBasicBlock &
MBB,
11697 SmallVectorImpl<MachineOperand> &CondParam)
override {
11705 void createRemainingIterationsGreaterCondition(
11706 int TC, MachineBasicBlock &
MBB, SmallVectorImpl<MachineOperand> &
Cond,
11707 DenseMap<MachineInstr *, MachineInstr *> &LastStage0Insts)
override;
11709 void setPreheader(MachineBasicBlock *NewPreheader)
override {}
11711 void adjustTripCount(
int TripCountAdjust)
override {}
11713 bool isMVEExpanderSupported()
override {
return true; }
11732 }
else if (
I == ReplaceOprNum) {
11737 MBB.insert(InsertTo, NewMI);
11741void AArch64PipelinerLoopInfo::createRemainingIterationsGreaterCondition(
11757 assert(CondBranch->getOpcode() == AArch64::Bcc);
11761 if (CondBranch->getOperand(1).getMBB() == LoopBB)
11768 auto AccumulateCond = [&](
Register CurCond,
11779 if (!LastStage0Insts.
empty() && LastStage0Insts[Comp]->getParent() == &
MBB) {
11783 for (
int I = 0;
I <= TC; ++
I) {
11789 AccCond = AccumulateCond(AccCond, CC);
11793 if (Update != Comp && IsUpdatePriorComp) {
11795 LastStage0Insts[Comp]->getOperand(CompCounterOprNum).getReg();
11796 NextCounter =
cloneInstr(Update, UpdateCounterOprNum, Counter,
MBB,
11800 NextCounter = LastStage0Insts[Update]->getOperand(0).getReg();
11802 }
else if (Update != Comp) {
11807 Counter = NextCounter;
11811 if (LastStage0Insts.
empty()) {
11815 if (IsUpdatePriorComp)
11820 Counter = LastStage0Insts[Comp]->getOperand(CompCounterOprNum).getReg();
11823 for (
int I = 0;
I <= TC; ++
I) {
11827 AccCond = AccumulateCond(AccCond, CC);
11828 if (
I != TC && Update != Comp)
11831 Counter = NextCounter;
11847 assert(Phi.getNumOperands() == 5);
11848 if (Phi.getOperand(2).getMBB() ==
MBB) {
11849 RegMBB = Phi.getOperand(1).getReg();
11850 RegOther = Phi.getOperand(3).getReg();
11852 assert(Phi.getOperand(4).getMBB() ==
MBB);
11853 RegMBB = Phi.getOperand(3).getReg();
11854 RegOther = Phi.getOperand(1).getReg();
11859 if (!
Reg.isVirtual())
11868 unsigned &UpdateCounterOprNum,
Register &InitReg,
11869 bool &IsUpdatePriorComp) {
11883 if (!
Reg.isVirtual())
11886 UpdateInst =
nullptr;
11887 UpdateCounterOprNum = 0;
11889 IsUpdatePriorComp =
true;
11893 if (Def->getParent() != LoopBB)
11895 if (Def->isCopy()) {
11897 if (Def->getOperand(0).getSubReg() || Def->getOperand(1).getSubReg())
11899 CurReg = Def->getOperand(1).getReg();
11900 }
else if (Def->isPHI()) {
11904 IsUpdatePriorComp =
false;
11909 switch (Def->getOpcode()) {
11910 case AArch64::ADDSXri:
11911 case AArch64::ADDSWri:
11912 case AArch64::SUBSXri:
11913 case AArch64::SUBSWri:
11914 case AArch64::ADDXri:
11915 case AArch64::ADDWri:
11916 case AArch64::SUBXri:
11917 case AArch64::SUBWri:
11919 UpdateCounterOprNum = 1;
11921 case AArch64::ADDSXrr:
11922 case AArch64::ADDSWrr:
11923 case AArch64::SUBSXrr:
11924 case AArch64::SUBSWrr:
11925 case AArch64::ADDXrr:
11926 case AArch64::ADDWrr:
11927 case AArch64::SUBXrr:
11928 case AArch64::SUBWrr:
11931 UpdateCounterOprNum = 1;
11933 UpdateCounterOprNum = 2;
11940 CurReg = Def->getOperand(UpdateCounterOprNum).getReg();
11955std::unique_ptr<TargetInstrInfo::PipelinerLoopInfo>
11966 if (
MI.isCall() ||
MI.hasUnmodeledSideEffects())
11977 if (
TBB == LoopBB && FBB == LoopBB)
11981 if (
TBB != LoopBB && FBB ==
nullptr)
11984 assert((
TBB == LoopBB || FBB == LoopBB) &&
11985 "The Loop must be a single-basic-block loop");
11990 if (CondBranch->
getOpcode() != AArch64::Bcc)
11998 unsigned CompCounterOprNum = 0;
12000 if (
MI.modifiesRegister(AArch64::NZCV, &
TRI)) {
12004 switch (
MI.getOpcode()) {
12005 case AArch64::SUBSXri:
12006 case AArch64::SUBSWri:
12007 case AArch64::ADDSXri:
12008 case AArch64::ADDSWri:
12010 CompCounterOprNum = 1;
12012 case AArch64::ADDSWrr:
12013 case AArch64::ADDSXrr:
12014 case AArch64::SUBSWrr:
12015 case AArch64::SUBSXrr:
12019 if (isWhileOpcode(
MI.getOpcode())) {
12026 if (CompCounterOprNum == 0) {
12028 CompCounterOprNum = 2;
12030 CompCounterOprNum = 1;
12042 bool IsUpdatePriorComp;
12043 unsigned UpdateCounterOprNum;
12045 Update, UpdateCounterOprNum,
Init, IsUpdatePriorComp))
12048 return std::make_unique<AArch64PipelinerLoopInfo>(
12049 LoopBB, CondBranch, Comp, CompCounterOprNum, Update, UpdateCounterOprNum,
12059 TypeSize Scale(0U,
false), Width(0U,
false);
12060 int64_t MinOffset, MaxOffset;
12061 if (
getMemOpInfo(
MI.getOpcode(), Scale, Width, MinOffset, MaxOffset)) {
12063 if (
MI.getOperand(ImmIdx).isImm() && !
MI.getOperand(ImmIdx - 1).isFI()) {
12064 int64_t Imm =
MI.getOperand(ImmIdx).getImm();
12065 if (Imm < MinOffset || Imm > MaxOffset) {
12066 ErrInfo =
"Unexpected immediate on load/store instruction";
12072 const MCInstrDesc &MCID =
MI.getDesc();
12074 const MachineOperand &MO =
MI.getOperand(
Op);
12078 ErrInfo =
"OPERAND_IMPLICIT_IMM_0 should be 0";
12087 ErrInfo =
"OPERAND_SHIFT_MSL should be msl shift of 8 or 16";
12098#define GET_INSTRINFO_HELPERS
12099#define GET_INSTRMAP_INFO
12100#include "AArch64GenInstrInfo.inc"
MachineInstrBuilder & UseMI
MachineInstrBuilder MachineInstrBuilder & DefMI
static bool forwardCopyWillClobberTuple(unsigned DestReg, unsigned SrcReg, unsigned NumRegs)
static cl::opt< unsigned > BCCDisplacementBits("aarch64-bcc-offset-bits", cl::Hidden, cl::init(19), cl::desc("Restrict range of Bcc instructions (DEBUG)"))
static Register genNeg(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned MnegOpc, const TargetRegisterClass *RC)
genNeg - Helper to generate an intermediate negation of the second operand of Root
static bool isFrameStoreOpcode(int Opcode)
static cl::opt< unsigned > GatherOptSearchLimit("aarch64-search-limit", cl::Hidden, cl::init(2048), cl::desc("Restrict range of instructions to search for the " "machine-combiner gather pattern optimization"))
static bool getMaddPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Find instructions that can be turned into madd.
static AArch64CC::CondCode findCondCodeUsedByInstr(const MachineInstr &Instr)
Find a condition code used by the instruction.
static MachineInstr * genFusedMultiplyAcc(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, const TargetRegisterClass *RC)
genFusedMultiplyAcc - Helper to generate fused multiply accumulate instructions.
static MachineInstr * genFusedMultiplyAccNeg(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned IdxMulOpd, unsigned MaddOpc, unsigned MnegOpc, const TargetRegisterClass *RC)
genFusedMultiplyAccNeg - Helper to generate fused multiply accumulate instructions with an additional...
static bool isCombineInstrCandidate64(unsigned Opc)
static bool isFrameLoadOpcode(int Opcode)
static unsigned removeCopies(const MachineRegisterInfo &MRI, unsigned VReg)
static bool areCFlagsAccessedBetweenInstrs(MachineBasicBlock::iterator From, MachineBasicBlock::iterator To, const TargetRegisterInfo *TRI, const AccessKind AccessToCheck=AK_All)
True when condition flags are accessed (either by writing or reading) on the instruction trace starti...
static bool getFMAPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Floating-Point Support.
static bool isADDSRegImm(unsigned Opcode)
static bool isCheapCopy(const MachineInstr &MI, const AArch64RegisterInfo &RI)
static bool isANDOpcode(MachineInstr &MI)
static void appendOffsetComment(int NumBytes, llvm::raw_string_ostream &Comment, StringRef RegScale={})
static unsigned sForm(MachineInstr &Instr)
Get opcode of S version of Instr.
static bool isCombineInstrSettingFlag(unsigned Opc)
static bool getFNEGPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
static bool getIndVarInfo(Register Reg, const MachineBasicBlock *LoopBB, MachineInstr *&UpdateInst, unsigned &UpdateCounterOprNum, Register &InitReg, bool &IsUpdatePriorComp)
If Reg is an induction variable, return true and set some parameters.
static bool canPairLdStOpc(unsigned FirstOpc, unsigned SecondOpc)
static bool mustAvoidNeonAtMBBI(const AArch64Subtarget &Subtarget, MachineBasicBlock &MBB, MachineBasicBlock::iterator I)
Returns true if in a streaming call site region without SME-FA64.
static bool isPostIndexLdStOpcode(unsigned Opcode)
Return true if the opcode is a post-index ld/st instruction, which really loads from base+0.
static std::optional< unsigned > getLFIInstSizeInBytes(const MachineInstr &MI)
Return the maximum number of bytes of code the specified instruction may be after LFI rewriting.
static unsigned getBranchDisplacementBits(unsigned Opc)
static cl::opt< unsigned > CBDisplacementBits("aarch64-cb-offset-bits", cl::Hidden, cl::init(9), cl::desc("Restrict range of CB instructions (DEBUG)"))
static std::optional< ParamLoadedValue > describeORRLoadedValue(const MachineInstr &MI, Register DescribedReg, const TargetInstrInfo *TII, const TargetRegisterInfo *TRI)
If the given ORR instruction is a copy, and DescribedReg overlaps with the destination register then,...
static bool getFMULPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
static void appendReadRegExpr(SmallVectorImpl< char > &Expr, unsigned RegNum)
static MachineInstr * genMaddR(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, unsigned VR, const TargetRegisterClass *RC)
genMaddR - Generate madd instruction and combine mul and add using an extra virtual register Example ...
static Register cloneInstr(const MachineInstr *MI, unsigned ReplaceOprNum, Register ReplaceReg, MachineBasicBlock &MBB, MachineBasicBlock::iterator InsertTo)
Clone an instruction from MI.
static bool scaleOffset(unsigned Opc, int64_t &Offset)
static bool canCombineWithFMUL(MachineBasicBlock &MBB, MachineOperand &MO, unsigned MulOpc)
unsigned scaledOffsetOpcode(unsigned Opcode, unsigned &Scale)
static MachineInstr * genFusedMultiplyIdx(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, const TargetRegisterClass *RC)
genFusedMultiplyIdx - Helper to generate fused multiply accumulate instructions.
static MachineInstr * genIndexedMultiply(MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxDupOp, unsigned MulOpc, const TargetRegisterClass *RC, MachineRegisterInfo &MRI)
Fold (FMUL x (DUP y lane)) into (FMUL_indexed x y lane)
static bool isSUBSRegImm(unsigned Opcode)
static bool UpdateOperandRegClass(MachineInstr &Instr)
static const TargetRegisterClass * getRegClass(const MachineInstr &MI, Register Reg)
static bool isInStreamingCallSiteRegion(MachineBasicBlock &MBB, MachineBasicBlock::iterator I)
Returns true if the instruction at I is in a streaming call site region, within a single basic block.
static bool canCmpInstrBeRemoved(MachineInstr &MI, MachineInstr &CmpInstr, int CmpValue, const TargetRegisterInfo &TRI, SmallVectorImpl< MachineInstr * > &CCUseInstrs, bool &IsInvertCC)
unsigned unscaledOffsetOpcode(unsigned Opcode)
static bool getLoadPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Search for patterns of LD instructions we can optimize.
static bool canInstrSubstituteCmpInstr(MachineInstr &MI, MachineInstr &CmpInstr, const TargetRegisterInfo &TRI)
Check if CmpInstr can be substituted by MI.
static UsedNZCV getUsedNZCV(AArch64CC::CondCode CC)
static bool isCombineInstrCandidateFP(const MachineInstr &Inst)
static void appendLoadRegExpr(SmallVectorImpl< char > &Expr, int64_t OffsetFromDefCFA)
static void appendConstantExpr(SmallVectorImpl< char > &Expr, int64_t Constant, dwarf::LocationAtom Operation)
static unsigned convertToNonFlagSettingOpc(const MachineInstr &MI)
Return the opcode that does not set flags when possible - otherwise return the original opcode.
static bool outliningCandidatesV8_3OpsConsensus(const outliner::Candidate &a, const outliner::Candidate &b)
static bool isCombineInstrCandidate32(unsigned Opc)
static void parseCondBranch(MachineInstr *LastInst, MachineBasicBlock *&Target, SmallVectorImpl< MachineOperand > &Cond)
static unsigned offsetExtendOpcode(unsigned Opcode)
static void loadRegPairFromStackSlot(const TargetRegisterInfo &TRI, MachineBasicBlock &MBB, MachineBasicBlock::iterator InsertBefore, const MCInstrDesc &MCID, Register DestReg, unsigned SubIdx0, unsigned SubIdx1, int FI, MachineMemOperand *MMO)
static void generateGatherLanePattern(MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned Pattern, unsigned NumLanes)
Generate optimized instruction sequence for gather load patterns to improve Memory-Level Parallelism ...
static bool getMiscPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Find other MI combine patterns.
static bool outliningCandidatesSigningKeyConsensus(const outliner::Candidate &a, const outliner::Candidate &b)
static const MachineInstrBuilder & AddSubReg(const MachineInstrBuilder &MIB, MCRegister Reg, unsigned SubIdx, RegState State, const TargetRegisterInfo *TRI)
static bool outliningCandidatesSigningScopeConsensus(const outliner::Candidate &a, const outliner::Candidate &b)
static bool shouldClusterFI(const MachineFrameInfo &MFI, int FI1, int64_t Offset1, unsigned Opcode1, int FI2, int64_t Offset2, unsigned Opcode2)
static cl::opt< unsigned > TBZDisplacementBits("aarch64-tbz-offset-bits", cl::Hidden, cl::init(14), cl::desc("Restrict range of TB[N]Z instructions (DEBUG)"))
static void extractPhiReg(const MachineInstr &Phi, const MachineBasicBlock *MBB, Register &RegMBB, Register &RegOther)
static MCCFIInstruction createDefCFAExpression(const TargetRegisterInfo &TRI, unsigned Reg, const StackOffset &Offset)
static bool isDefinedOutside(Register Reg, const MachineBasicBlock *BB)
static MachineInstr * genFusedMultiply(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, const TargetRegisterClass *RC, FMAInstKind kind=FMAInstKind::Default, const Register *ReplacedAddend=nullptr)
genFusedMultiply - Generate fused multiply instructions.
static bool getGatherLanePattern(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, unsigned LoadLaneOpCode, unsigned NumLanes)
Check if the given instruction forms a gather load pattern that can be optimized for better Memory-Le...
static MachineInstr * genFusedMultiplyIdxNeg(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned IdxMulOpd, unsigned MaddOpc, unsigned MnegOpc, const TargetRegisterClass *RC)
genFusedMultiplyAccNeg - Helper to generate fused multiply accumulate instructions with an additional...
static bool isCombineInstrCandidate(unsigned Opc)
static unsigned regOffsetOpcode(unsigned Opcode)
MachineOutlinerClass
Constants defining how certain sequences should be outlined.
@ MachineOutlinerTailCall
Emit a save, restore, call, and return.
@ MachineOutlinerRegSave
Emit a call and tail-call.
@ MachineOutlinerNoLRSave
Only emit a branch.
@ MachineOutlinerThunk
Emit a call and return.
static cl::opt< unsigned > BDisplacementBits("aarch64-b-offset-bits", cl::Hidden, cl::init(26), cl::desc("Restrict range of B instructions (DEBUG)"))
static bool areCFlagsAliveInSuccessors(const MachineBasicBlock *MBB)
Check if AArch64::NZCV should be alive in successors of MBB.
static void emitFrameOffsetAdj(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, unsigned DestReg, unsigned SrcReg, int64_t Offset, unsigned Opc, const TargetInstrInfo *TII, MachineInstr::MIFlag Flag, bool NeedsWinCFI, bool *HasWinCFI, bool EmitCFAOffset, StackOffset CFAOffset, unsigned FrameReg)
static bool isCheapImmediate(const MachineInstr &MI, unsigned BitSize)
static cl::opt< unsigned > CBZDisplacementBits("aarch64-cbz-offset-bits", cl::Hidden, cl::init(19), cl::desc("Restrict range of CB[N]Z instructions (DEBUG)"))
static void genSubAdd2SubSub(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, unsigned IdxOpd1, DenseMap< Register, unsigned > &InstrIdxForVirtReg)
Do the following transformation A - (B + C) ==> (A - B) - C A - (B + C) ==> (A - C) - B.
static unsigned canFoldIntoCSel(const MachineRegisterInfo &MRI, unsigned VReg, unsigned *NewReg=nullptr)
static void signOutlinedFunction(MachineFunction &MF, MachineBasicBlock &MBB, const AArch64InstrInfo *TII, bool ShouldSignReturnAddr)
static MachineInstr * genFNegatedMAD(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs)
static bool canCombineWithMUL(MachineBasicBlock &MBB, MachineOperand &MO, unsigned MulOpc, unsigned ZeroReg)
static void storeRegPairToStackSlot(const TargetRegisterInfo &TRI, MachineBasicBlock &MBB, MachineBasicBlock::iterator InsertBefore, const MCInstrDesc &MCID, Register SrcReg, bool IsKill, unsigned SubIdx0, unsigned SubIdx1, int FI, MachineMemOperand *MMO)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
MachineBasicBlock MachineBasicBlock::iterator MBBI
static const Function * getParent(const Value *V)
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
DXIL Forward Handle Accesses
const HexagonInstrInfo * TII
Module.h This file contains the declarations for the Module class.
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
This file implements the LivePhysRegs utility for tracking liveness of physical registers.
Machine Check Debug Module
Register const TargetRegisterInfo * TRI
Promote Memory to Register
static MCRegister getReg(const MCDisassembler *D, unsigned RC, unsigned RegNo)
MachineInstr unsigned OpIdx
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
PowerPC Reduce CR logical Operation
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
This file declares the machine register scavenger class.
static bool contains(SmallPtrSetImpl< ConstantExpr * > &Cache, ConstantExpr *Expr, Constant *C)
This file defines the SmallSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
#define DEBUG_WITH_TYPE(TYPE,...)
DEBUG_WITH_TYPE macro - This macro should be used by passes to emit debug information.
static bool canCombine(MachineBasicBlock &MBB, MachineOperand &MO, unsigned CombineOpc=0)
AArch64FunctionInfo - This class is derived from MachineFunctionInfo and contains private AArch64-spe...
bool branchTargetEnforcement() const
unsigned getArgumentStackToRestore() const
SignReturnAddress getSignReturnAddressCondition() const
bool hasStreamingModeChanges() const
void setOutliningStyle(const std::string &Style)
bool branchProtectionPAuthLR() const
std::optional< bool > hasRedZone() const
static bool shouldSignReturnAddress(SignReturnAddress Condition, bool IsLRSpilled)
bool shouldSignWithBKey() const
static bool isHForm(const MachineInstr &MI)
Returns whether the instruction is in H form (16 bit operands)
void insertSelect(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, const DebugLoc &DL, Register DstReg, ArrayRef< MachineOperand > Cond, Register TrueReg, Register FalseReg) const override
static bool hasBTISemantics(const MachineInstr &MI)
Returns whether the instruction can be compatible with non-zero BTYPE.
static bool isQForm(const MachineInstr &MI)
Returns whether the instruction is in Q form (128 bit operands)
static bool getMemOpInfo(unsigned Opcode, TypeSize &Scale, TypeSize &Width, int64_t &MinOffset, int64_t &MaxOffset)
Returns true if opcode Opc is a memory operation.
static bool isTailCallReturnInst(const MachineInstr &MI)
Returns true if MI is one of the TCRETURN* instructions.
static bool isFPRCopy(const MachineInstr &MI)
Does this instruction rename an FPR without modifying bits?
MachineInstr * emitLdStWithAddr(MachineInstr &MemI, const ExtAddrMode &AM) const override
std::optional< DestSourcePair > isCopyInstrImpl(const MachineInstr &MI) const override
If the specific machine instruction is an instruction that moves/copies value from one register to an...
MachineBasicBlock * getBranchDestBlock(const MachineInstr &MI) const override
unsigned getInstSizeInBytes(const MachineInstr &MI) const override
GetInstSize - Return the number of bytes of code the specified instruction may be.
static bool isZExtLoad(const MachineInstr &MI)
Returns whether the instruction is a zero-extending load.
bool areMemAccessesTriviallyDisjoint(const MachineInstr &MIa, const MachineInstr &MIb) const override
void copyPhysReg(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, const DebugLoc &DL, Register DestReg, Register SrcReg, bool KillSrc, bool RenamableDest=false, bool RenamableSrc=false) const override
static bool isGPRCopy(const MachineInstr &MI)
Does this instruction rename a GPR without modifying bits?
static unsigned convertToFlagSettingOpc(unsigned Opc)
Return the opcode that set flags when possible.
void createPauthEpilogueInstr(MachineBasicBlock &MBB, DebugLoc DL) const
Return true when there is potentially a faster code sequence for an instruction chain ending in Root.
bool isBranchOffsetInRange(unsigned BranchOpc, int64_t BrOffset) const override
bool canInsertSelect(const MachineBasicBlock &, ArrayRef< MachineOperand > Cond, Register, Register, Register, int &, int &, int &) const override
Register isLoadFromStackSlotPostFE(const MachineInstr &MI, int &FrameIndex) const override
Check for post-frame ptr elimination stack locations as well.
static const MachineOperand & getLdStOffsetOp(const MachineInstr &MI)
Returns the immediate offset operator of a load/store.
bool isCoalescableExtInstr(const MachineInstr &MI, Register &SrcReg, Register &DstReg, unsigned &SubIdx) const override
static std::optional< unsigned > getUnscaledLdSt(unsigned Opc)
Returns the unscaled load/store for the scaled load/store opcode, if there is a corresponding unscale...
static bool hasUnscaledLdStOffset(unsigned Opc)
Return true if it has an unscaled load/store offset.
static const MachineOperand & getLdStAmountOp(const MachineInstr &MI)
Returns the shift amount operator of a load/store.
static bool isPreLdSt(const MachineInstr &MI)
Returns whether the instruction is a pre-indexed load/store.
std::optional< ExtAddrMode > getAddrModeFromMemoryOp(const MachineInstr &MemI, const TargetRegisterInfo *TRI) const override
bool getMemOperandsWithOffsetWidth(const MachineInstr &MI, SmallVectorImpl< const MachineOperand * > &BaseOps, int64_t &Offset, bool &OffsetIsScalable, LocationSize &Width, const TargetRegisterInfo *TRI) const override
bool analyzeBranchPredicate(MachineBasicBlock &MBB, MachineBranchPredicate &MBP, bool AllowModify) const override
void insertIndirectBranch(MachineBasicBlock &MBB, MachineBasicBlock &NewDestBB, MachineBasicBlock &RestoreBB, const DebugLoc &DL, int64_t BrOffset, RegScavenger *RS) const override
void loadRegFromStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, Register DestReg, int FrameIndex, const TargetRegisterClass *RC, Register VReg, unsigned SubReg=0, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
static bool isPairableLdStInst(const MachineInstr &MI)
Return true if pairing the given load or store may be paired with another.
void storeRegToStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, Register SrcReg, bool isKill, int FrameIndex, const TargetRegisterClass *RC, Register VReg, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
static bool isSExtLoad(const MachineInstr &MI)
Returns whether the instruction is a sign-extending load.
const AArch64RegisterInfo & getRegisterInfo() const
getRegisterInfo - TargetInstrInfo is a superset of MRegister info.
static bool isPreSt(const MachineInstr &MI)
Returns whether the instruction is a pre-indexed store.
void insertNoop(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI) const override
AArch64InstrInfo(const AArch64Subtarget &STI)
static bool isPairedLdSt(const MachineInstr &MI)
Returns whether the instruction is a paired load/store.
MachineInstr * foldMemoryOperandImpl(MachineFunction &MF, MachineInstr &MI, ArrayRef< unsigned > Ops, int FrameIndex, MachineInstr *&CopyMI, LiveIntervals *LIS=nullptr, VirtRegMap *VRM=nullptr) const override
bool getMemOperandWithOffsetWidth(const MachineInstr &MI, const MachineOperand *&BaseOp, int64_t &Offset, bool &OffsetIsScalable, TypeSize &Width, const TargetRegisterInfo *TRI) const
If OffsetIsScalable is set to 'true', the offset is scaled by vscale.
Register isLoadFromStackSlot(const MachineInstr &MI, int &FrameIndex) const override
bool reverseBranchCondition(SmallVectorImpl< MachineOperand > &Cond) const override
static bool isStridedAccess(const MachineInstr &MI)
Return true if the given load or store is a strided memory access.
bool shouldClusterMemOps(ArrayRef< const MachineOperand * > BaseOps1, int64_t Offset1, bool OffsetIsScalable1, ArrayRef< const MachineOperand * > BaseOps2, int64_t Offset2, bool OffsetIsScalable2, unsigned ClusterSize, unsigned NumBytes) const override
Detect opportunities for ldp/stp formation.
unsigned removeBranch(MachineBasicBlock &MBB, int *BytesRemoved=nullptr) const override
bool isThroughputPattern(unsigned Pattern) const override
Return true when a code sequence can improve throughput.
MachineOperand & getMemOpBaseRegImmOfsOffsetOperand(MachineInstr &LdSt) const
Return the immediate offset of the base register in a load/store LdSt.
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify=false) const override
bool canFoldIntoAddrMode(const MachineInstr &MemI, Register Reg, const MachineInstr &AddrI, ExtAddrMode &AM) const override
static bool isLdStPairSuppressed(const MachineInstr &MI)
Return true if pairing the given load or store is hinted to be unprofitable.
Register isStoreToStackSlotPostFE(const MachineInstr &MI, int &FrameIndex) const override
Check for post-frame ptr elimination stack locations as well.
std::unique_ptr< TargetInstrInfo::PipelinerLoopInfo > analyzeLoopForPipelining(MachineBasicBlock *LoopBB) const override
bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const override
unsigned insertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, ArrayRef< MachineOperand > Cond, const DebugLoc &DL, int *BytesAdded=nullptr) const override
bool optimizeCompareInstr(MachineInstr &CmpInstr, Register SrcReg, Register SrcReg2, int64_t CmpMask, int64_t CmpValue, const MachineRegisterInfo *MRI) const override
optimizeCompareInstr - Convert the instruction supplying the argument to the comparison into one that...
static unsigned getLoadStoreImmIdx(unsigned Opc)
Returns the index for the immediate for a given instruction.
static bool isGPRZero(const MachineInstr &MI)
Does this instruction set its full destination register to zero?
void copyGPRRegTuple(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, const DebugLoc &DL, MCRegister DestReg, MCRegister SrcReg, bool KillSrc, unsigned Opcode, unsigned ZeroReg, llvm::ArrayRef< unsigned > Indices) const
bool analyzeCompare(const MachineInstr &MI, Register &SrcReg, Register &SrcReg2, int64_t &CmpMask, int64_t &CmpValue) const override
analyzeCompare - For a comparison instruction, return the source registers in SrcReg and SrcReg2,...
CombinerObjective getCombinerObjective(unsigned Pattern) const override
static bool isFpOrNEON(Register Reg)
Returns whether the physical register is FP or NEON.
bool isAsCheapAsAMove(const MachineInstr &MI) const override
std::optional< DestSourcePair > isCopyLikeInstrImpl(const MachineInstr &MI) const override
static void suppressLdStPair(MachineInstr &MI)
Hint that pairing the given load or store is unprofitable.
Register isStoreToStackSlot(const MachineInstr &MI, int &FrameIndex) const override
static bool isPreLd(const MachineInstr &MI)
Returns whether the instruction is a pre-indexed load.
void copyPhysRegTuple(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, const DebugLoc &DL, MCRegister DestReg, MCRegister SrcReg, bool KillSrc, unsigned Opcode, llvm::ArrayRef< unsigned > Indices) const
bool optimizeCondBranch(MachineInstr &MI) const override
Replace csincr-branch sequence by simple conditional branch.
static int getMemScale(unsigned Opc)
Scaling factor for (scaled or unscaled) load or store.
bool isCandidateToMergeOrPair(const MachineInstr &MI) const
Return true if this is a load/store that can be potentially paired/merged.
MCInst getNop() const override
static const MachineOperand & getLdStBaseOp(const MachineInstr &MI)
Returns the base register operator of a load/store.
bool isReservedReg(const MachineFunction &MF, MCRegister Reg) const
const AArch64RegisterInfo * getRegisterInfo() const override
bool isNeonAvailable() const
Returns true if the target has NEON and the function at runtime is known to have NEON enabled (e....
bool isSVEorStreamingSVEAvailable() const
Returns true if the target has access to either the full range of SVE instructions,...
Represent a constant reference to an array (0 or more elements consecutively in memory),...
const T & front() const
Get the first element.
size_t size() const
Get the array size.
This is an important base class in LLVM.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
bool hasOptSize() const
Optimize this function for size (-Os) or minimum size (-Oz).
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
Module * getParent()
Get the module that this global value is contained inside of...
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
static LocationSize precise(uint64_t Value)
This class is intended to be used as a base class for asm properties and features specific to the tar...
bool usesWindowsCFI() const
static MCCFIInstruction cfiDefCfa(MCSymbol *L, unsigned Register, int64_t Offset, SMLoc Loc={})
.cfi_def_cfa defines a rule for computing CFA as: take address from Register and add Offset to it.
static MCCFIInstruction createOffset(MCSymbol *L, unsigned Register, int64_t Offset, SMLoc Loc={})
.cfi_offset Previous value of Register is saved at offset Offset from CFA.
static MCCFIInstruction cfiDefCfaOffset(MCSymbol *L, int64_t Offset, SMLoc Loc={})
.cfi_def_cfa_offset modifies a rule for computing CFA.
static MCCFIInstruction createEscape(MCSymbol *L, StringRef Vals, SMLoc Loc={}, StringRef Comment="")
.cfi_escape Allows the user to add arbitrary bytes to the unwind info.
Instances of this class represent a single low-level machine instruction.
Describe properties that are true of each instruction in the target description file.
unsigned getNumOperands() const
Return the number of declared MachineOperands for this MachineInstruction.
ArrayRef< MCOperandInfo > operands() const
Wrapper class representing physical registers. Should be passed by value.
constexpr bool isValid() const
static constexpr unsigned NoRegister
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
bool isInlineAsmBrIndirectTarget() const
Returns true if this is the indirect dest of an INLINEASM_BR.
unsigned pred_size() const
LLVM_ABI void transferSuccessorsAndUpdatePHIs(MachineBasicBlock *FromMBB)
Transfers all the successors, as in transferSuccessors, and update PHI operands in the successor bloc...
LLVM_ABI instr_iterator insert(instr_iterator I, MachineInstr *M)
Insert MI into the instruction list before I, possibly inside a bundle.
reverse_instr_iterator instr_rbegin()
LLVM_ABI iterator getFirstTerminator()
Returns an iterator to the first terminator instruction of this basic block.
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
reverse_instr_iterator instr_rend()
Instructions::iterator instr_iterator
instr_iterator instr_end()
void addLiveIn(MCRegister PhysReg, LaneBitmask LaneMask=LaneBitmask::getAll())
Adds the specified register as a live in.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
LLVM_ABI instr_iterator erase(instr_iterator I)
Remove an instruction from the instruction list and delete it.
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
MachineInstrBundleIterator< MachineInstr > iterator
void setMachineBlockAddressTaken()
Set this block to indicate that its address is used as something other than the target of a terminato...
LLVM_ABI bool isLiveIn(MCRegister Reg, LaneBitmask LaneMask=LaneBitmask::getAll()) const
Return true if the specified register is in the live in set.
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
uint64_t getStackSize() const
Return the number of bytes that must be allocated to hold all of the fixed size frame objects.
void setStackID(int ObjectIdx, uint8_t ID)
bool isCalleeSavedInfoValid() const
Has the callee saved info been calculated yet?
Align getObjectAlign(int ObjectIdx) const
Return the alignment of the specified stack object.
int64_t getObjectSize(int ObjectIdx) const
Return the size of the specified object.
unsigned getNumObjects() const
Return the number of objects.
int64_t getObjectOffset(int ObjectIdx) const
Return the assigned stack offset of the specified object from the incoming stack pointer.
bool isFixedObjectIndex(int ObjectIdx) const
Returns true if the specified index corresponds to a fixed stack object.
unsigned addFrameInst(const MCCFIInstruction &Inst)
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
BasicBlockListType::iterator iterator
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
const MachineJumpTableInfo * getJumpTableInfo() const
getJumpTableInfo - Return the jump table info object for the current function.
MachineBasicBlock * CreateMachineBasicBlock(const BasicBlock *BB=nullptr, std::optional< UniqueBBID > BBID=std::nullopt)
CreateMachineInstr - Allocate a new MachineInstr.
void insert(iterator MBBI, MachineBasicBlock *MBB)
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
const MachineInstrBuilder & setMemRefs(ArrayRef< MachineMemOperand * > MMOs) const
const MachineInstrBuilder & addCFIIndex(unsigned CFIIndex) const
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addReg(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & setMIFlag(MachineInstr::MIFlag Flag) const
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & add(const MachineOperand &MO) const
const MachineInstrBuilder & addSym(MCSymbol *Sym, unsigned char TargetFlags=0) const
const MachineInstrBuilder & addFrameIndex(int Idx) const
const MachineInstrBuilder & addGlobalAddress(const GlobalValue *GV, int64_t Offset=0, unsigned TargetFlags=0) const
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
const MachineInstrBuilder & setMIFlags(unsigned Flags) const
const MachineInstrBuilder & addMemOperand(MachineMemOperand *MMO) const
reverse_iterator getReverse() const
Get a reverse iterator to the same node.
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
bool mayLoadOrStore(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read or modify memory.
const MachineBasicBlock * getParent() const
bool isCall(QueryType Type=AnyInBundle) const
bool getFlag(MIFlag Flag) const
Return whether an MI flag is set.
LLVM_ABI uint32_t mergeFlagsWith(const MachineInstr &Other) const
Return the MIFlags which represent both MachineInstrs.
unsigned getNumOperands() const
Retuns the total number of operands.
LLVM_ABI unsigned getNumExplicitOperands() const
Returns the number of non-implicit operands.
bool mayLoad(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read memory.
const MCInstrDesc & getDesc() const
Returns the target instruction descriptor of this MachineInstr.
LLVM_ABI bool hasUnmodeledSideEffects() const
Return true if this instruction has side effects that are not modeled by mayLoad / mayStore,...
bool registerDefIsDead(Register Reg, const TargetRegisterInfo *TRI) const
Returns true if the register is dead in this machine instruction.
bool definesRegister(Register Reg, const TargetRegisterInfo *TRI) const
Return true if the MachineInstr fully defines the specified register.
LLVM_ABI void setDesc(const MCInstrDesc &TID)
Replace the instruction descriptor (thus opcode) of the current instruction with a new one.
LLVM_ABI bool hasOrderedMemoryRef() const
Return true if this instruction may have an ordered or volatile memory reference, or if the informati...
LLVM_ABI const MachineFunction * getMF() const
Return the function that contains the basic block that this instruction belongs to.
ArrayRef< MachineMemOperand * > memoperands() const
Access to memory operands of the instruction.
LLVM_ABI bool isLoadFoldBarrier() const
Returns true if it is illegal to fold a load across this instruction.
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
LLVM_ABI void removeOperand(unsigned OpNo)
Erase an operand from an instruction, leaving it with one fewer operand than it started with.
LLVM_ABI void addRegisterDefined(Register Reg, const TargetRegisterInfo *RegInfo=nullptr)
We have determined MI defines a register.
const MachineOperand & getOperand(unsigned i) const
uint32_t getFlags() const
Return the MI flags bitvector.
LLVM_ABI int findRegisterDefOperandIdx(Register Reg, const TargetRegisterInfo *TRI, bool isDead=false, bool Overlap=false) const
Returns the operand index that is a def of the specified register or -1 if it is not found.
LLVM_ABI MachineInstrBundleIterator< MachineInstr > eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
const std::vector< MachineJumpTableEntry > & getJumpTables() const
A description of a memory reference used in the backend.
@ MOVolatile
The memory access is volatile.
@ MOLoad
The memory access reads data.
@ MOStore
The memory access writes data.
This class contains meta information specific to a module.
LLVM_ABI MachineFunction * getMachineFunction(const Function &F) const
Returns the MachineFunction associated to IR function F if there is one, otherwise nullptr.
MachineOperand class - Representation of each machine instruction operand.
void setSubReg(unsigned subReg)
unsigned getSubReg() const
void setImm(int64_t immVal)
bool isReg() const
isReg - Tests if this is a MO_Register operand.
MachineBasicBlock * getMBB() const
void setIsDead(bool Val=true)
LLVM_ABI void setReg(Register Reg)
Change the register this operand corresponds to.
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
void setIsKill(bool Val=true)
MachineInstr * getParent()
getParent - Return the instruction that this operand belongs to.
unsigned getTargetFlags() const
static MachineOperand CreateImm(int64_t Val)
MachineOperandType getType() const
getType - Returns the MachineOperandType for this operand.
void setIsUndef(bool Val=true)
Register getReg() const
getReg - Returns the register number.
bool isFI() const
isFI - Tests if this is a MO_FrameIndex operand.
LLVM_ABI bool isIdenticalTo(const MachineOperand &Other) const
Returns true if this operand is identical to the specified operand except for liveness related flags ...
static MachineOperand CreateReg(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isEarlyClobber=false, unsigned SubReg=0, bool isDebug=false, bool isInternalRead=false, bool isRenamable=false)
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLVM_ABI bool hasOneNonDBGUse(Register RegNo) const
hasOneNonDBGUse - Return true if there is exactly one non-Debug use of the specified register.
bool tracksLiveness() const
tracksLiveness - Returns true when tracking register liveness accurately.
const TargetRegisterClass * getRegClass(Register Reg) const
Return the register class of the specified virtual register.
LLVM_ABI void clearKillFlags(Register Reg) const
clearKillFlags - Iterate over all the uses of the given register and clear the kill flag from the Mac...
LLVM_ABI MachineInstr * getVRegDef(Register Reg) const
getVRegDef - Return the machine instr that defines the specified virtual register or null if none is ...
bool use_nodbg_empty(Register RegNo) const
use_nodbg_empty - Return true if there are no non-Debug instructions using the specified register.
LLVM_ABI Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
bool reservedRegsFrozen() const
reservedRegsFrozen - Returns true after freezeReservedRegs() was called to ensure the set of reserved...
bool def_empty(Register RegNo) const
def_empty - Return true if there are no instructions defining the specified register (it may be live-...
use_instr_nodbg_iterator use_instr_nodbg_begin(Register RegNo) const
bool hasOneDef(Register RegNo) const
Return true if there is exactly one operand defining the specified register.
const TargetRegisterClass * getRegClassOrNull(Register Reg) const
Return the register class of Reg, or null if Reg has not been assigned a register class yet.
LLVM_ABI const TargetRegisterClass * constrainRegClass(Register Reg, const TargetRegisterClass *RC, unsigned MinNumRegs=0)
constrainRegClass - Constrain the register class of the specified virtual register to be a common sub...
LLVM_ABI MachineInstr * getUniqueVRegDef(Register Reg) const
getUniqueVRegDef - Return the unique machine instr that defines the specified virtual register or nul...
A Module instance is used to store all the information related to an LLVM module.
MI-level patchpoint operands.
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given patchpoint should emit.
Wrapper class representing virtual and physical registers.
MCRegister asMCReg() const
Utility to check-convert this value to a MCRegister.
constexpr bool isValid() const
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
static constexpr bool isVirtualRegister(unsigned Reg)
Return true if the specified register number is in the virtual register namespace.
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
Represents a location in source code.
bool erase(PtrType Ptr)
Remove pointer from the set.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
SmallSet - This maintains a set of unique values, optimizing for the case when the set is small (less...
SmallString - A SmallString is just a SmallVector with methods and accessors that make it work better...
void append(StringRef RHS)
Append from a StringRef.
StringRef str() const
Explicit conversion to StringRef.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
MI-level stackmap operands.
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given stackmap should emit.
StackOffset holds a fixed and a scalable offset in bytes.
int64_t getFixed() const
Returns the fixed component of the stack.
int64_t getScalable() const
Returns the scalable component of the stack.
static StackOffset get(int64_t Fixed, int64_t Scalable)
static StackOffset getScalable(int64_t Scalable)
static StackOffset getFixed(int64_t Fixed)
MI-level Statepoint operands.
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given statepoint should emit.
Represent a constant reference to a string, i.e.
Object returned by analyzeLoopForPipelining.
TargetInstrInfo - Interface to description of machine instruction set.
virtual void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstIdxForVirtReg) const
When getMachineCombinerPatterns() finds patterns, this function generates the instructions that could...
virtual std::optional< ParamLoadedValue > describeLoadedValue(const MachineInstr &MI, Register Reg) const
Produce the expression describing the MI loading a value into the physical register Reg.
virtual bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const
Return true when there is potentially a faster code sequence for an instruction chain ending in Root.
virtual bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const
Test if the given instruction should be considered a scheduling boundary.
virtual CombinerObjective getCombinerObjective(unsigned Pattern) const
Return the objective of a combiner pattern.
virtual bool isFunctionSafeToSplit(const MachineFunction &MF) const
Return true if the function is a viable candidate for machine function splitting.
const MCAsmInfo & getMCAsmInfo() const
Return target specific asm information.
CodeModel::Model getCodeModel() const
Returns the code model.
bool contains(Register Reg) const
Return true if the specified register is included in this register class.
bool hasSubClassEq(const TargetRegisterClass *RC) const
Returns true if RC is a sub-class of or equal to this class.
bool hasSuperClassEq(const TargetRegisterClass *RC) const
Returns true if RC is a super-class of or equal to this class.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
TargetSubtargetInfo - Generic base class for all target subtargets.
virtual const TargetInstrInfo * getInstrInfo() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
Target - Wrapper for Target specific information.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Value * getOperand(unsigned i) const
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
self_iterator getIterator()
A raw_ostream that writes to an std::string.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
static CondCode getInvertedCondCode(CondCode Code)
@ MO_DLLIMPORT
MO_DLLIMPORT - On a symbol operand, this represents that the reference to the symbol is for an import...
@ MO_NC
MO_NC - Indicates whether the linker is expected to check the symbol reference for overflow.
@ MO_G1
MO_G1 - A symbol operand with this flag (granule 1) represents the bits 16-31 of a 64-bit address,...
@ MO_S
MO_S - Indicates that the bits of the symbol operand represented by MO_G0 etc are signed.
@ MO_PAGEOFF
MO_PAGEOFF - A symbol operand with this flag represents the offset of that symbol within a 4K page.
@ MO_GOT
MO_GOT - This flag indicates that a symbol operand represents the address of the GOT entry for the sy...
@ MO_PREL
MO_PREL - Indicates that the bits of the symbol operand represented by MO_G0 etc are PC relative.
@ MO_G0
MO_G0 - A symbol operand with this flag (granule 0) represents the bits 0-15 of a 64-bit address,...
@ MO_ARM64EC_CALLMANGLE
MO_ARM64EC_CALLMANGLE - Operand refers to the Arm64EC-mangled version of a symbol,...
@ MO_PAGE
MO_PAGE - A symbol operand with this flag represents the pc-relative offset of the 4K page containing...
@ MO_HI12
MO_HI12 - This flag indicates that a symbol operand represents the bits 13-24 of a 64-bit address,...
@ MO_TLS
MO_TLS - Indicates that the operand being accessed is some kind of thread-local symbol.
@ MO_G2
MO_G2 - A symbol operand with this flag (granule 2) represents the bits 32-47 of a 64-bit address,...
@ MO_TAGGED
MO_TAGGED - With MO_PAGE, indicates that the page includes a memory tag in bits 56-63.
@ MO_G3
MO_G3 - A symbol operand with this flag (granule 3) represents the high 16-bits of a 64-bit address,...
@ MO_COFFSTUB
MO_COFFSTUB - On a symbol operand "FOO", this indicates that the reference is actually to the "....
unsigned getCheckerSizeInBytes(AuthCheckMethod Method)
Returns the number of bytes added by checkAuthenticatedRegister.
static uint64_t decodeLogicalImmediate(uint64_t val, unsigned regSize)
decodeLogicalImmediate - Decode a logical immediate value in the form "N:immr:imms" (where the immr a...
static unsigned getShiftValue(unsigned Imm)
getShiftValue - Extract the shift value.
static unsigned getArithExtendImm(AArch64_AM::ShiftExtendType ET, unsigned Imm)
getArithExtendImm - Encode the extend type and shift amount for an arithmetic instruction: imm: 3-bit...
static unsigned getArithShiftValue(unsigned Imm)
getArithShiftValue - get the arithmetic shift value.
static uint64_t encodeLogicalImmediate(uint64_t imm, unsigned regSize)
encodeLogicalImmediate - Return the encoded immediate value for a logical immediate instruction of th...
static AArch64_AM::ShiftExtendType getExtendType(unsigned Imm)
getExtendType - Extract the extend type for operands of arithmetic ops.
static AArch64_AM::ShiftExtendType getArithExtendType(unsigned Imm)
static AArch64_AM::ShiftExtendType getShiftType(unsigned Imm)
getShiftType - Extract the shift type.
static unsigned getShifterImm(AArch64_AM::ShiftExtendType ST, unsigned Imm)
getShifterImm - Encode the shift type and amount: imm: 6-bit shift amount shifter: 000 ==> lsl 001 ==...
void expandMOVAddr(unsigned Opcode, unsigned TargetFlags, bool IsTargetMachO, SmallVectorImpl< AddrInsnModel > &Insn)
void expandMOVImm(uint64_t Imm, unsigned BitSize, SmallVectorImpl< ImmInsnModel > &Insn)
Expand a MOVi32imm or MOVi64imm pseudo instruction to one or more real move-immediate instructions to...
static const uint64_t InstrFlagIsWhile
static const uint64_t InstrFlagIsPTestLike
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ C
The default llvm calling convention, compatible with C.
@ ScalablePredicateVector
initializer< Ty > init(const Ty &Val)
InstrType
Represents how an instruction should be mapped by the outliner.
NodeAddr< InstrNode * > Instr
LLVM_ABI Instruction & back() const
LLVM_ABI iterator begin() const
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
static bool isCondBranchOpcode(int Opc)
MCCFIInstruction createDefCFA(const TargetRegisterInfo &TRI, unsigned FrameReg, unsigned Reg, const StackOffset &Offset, bool LastAdjustmentWasScalable=true)
static bool isPTrueOpcode(unsigned Opc)
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
bool succeeded(LogicalResult Result)
Utility function that returns true if the provided LogicalResult corresponds to a success value.
int isAArch64FrameOffsetLegal(const MachineInstr &MI, StackOffset &Offset, bool *OutUseUnscaledOp=nullptr, unsigned *OutUnscaledOp=nullptr, int64_t *EmittableOffset=nullptr)
Check if the Offset is a valid frame offset for MI.
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
RegState
Flags to represent properties of register accesses.
@ Implicit
Not emitted register (e.g. carry, or temporary result).
@ Kill
The last use of a register.
@ Undef
Value of the register doesn't matter.
@ Define
Register definition.
@ Renamable
Register that may be renamed.
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
constexpr RegState getKillRegState(bool B)
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
static bool isIndirectBranchOpcode(int Opc)
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
unsigned getBLRCallOpcode(const MachineFunction &MF)
Return opcode to be used for indirect calls.
@ AArch64FrameOffsetIsLegal
Offset is legal.
@ AArch64FrameOffsetCanUpdate
Offset can apply, at least partly.
@ AArch64FrameOffsetCannotUpdate
Offset cannot apply.
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
unsigned Log2_64(uint64_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
static bool isSEHInstruction(const MachineInstr &MI)
bool isLFIPrePostMemAccess(unsigned Opcode)
Returns true if Opcode is a pre- or post-indexed memory access that the LFI rewriter expands with a b...
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
auto reverse(ContainerTy &&C)
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
void sort(IteratorTy Start, IteratorTy End)
AArch64MachineCombinerPattern
@ MULSUBv2i32_indexed_OP1
@ MULADDv4i16_indexed_OP2
@ MULSUBv8i16_indexed_OP2
@ MULSUBv4i16_indexed_OP2
@ MULSUBv4i32_indexed_OP2
@ MULADDv2i32_indexed_OP1
@ MULADDv4i32_indexed_OP1
@ MULADDv2i32_indexed_OP2
@ MULSUBv4i16_indexed_OP1
@ MULADDv4i32_indexed_OP2
@ MULSUBv8i16_indexed_OP1
@ MULSUBv2i32_indexed_OP2
@ MULADDv8i16_indexed_OP1
@ MULSUBv4i32_indexed_OP1
@ MULADDv8i16_indexed_OP2
@ MULADDv4i16_indexed_OP1
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
void emitFrameOffset(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, unsigned DestReg, unsigned SrcReg, StackOffset Offset, const TargetInstrInfo *TII, MachineInstr::MIFlag=MachineInstr::NoFlags, bool SetNZCV=false, bool NeedsWinCFI=false, bool *HasWinCFI=nullptr, bool EmitCFAOffset=false, StackOffset InitialOffset={}, unsigned FrameReg=AArch64::SP)
emitFrameOffset - Emit instructions as needed to set DestReg to SrcReg plus Offset.
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
constexpr RegState getDefRegState(bool B)
CombinerObjective
The combiner's goal may differ based on which pattern it is attempting to optimize.
std::optional< UsedNZCV > examineCFlagsUse(MachineInstr &MI, MachineInstr &CmpInstr, const TargetRegisterInfo &TRI, SmallVectorImpl< MachineInstr * > *CCUseInstrs=nullptr)
CodeGenOptLevel
Code generation optimization level.
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
auto instructionsWithoutDebug(IterT It, IterT End, bool SkipPseudoOp=true)
Construct a range iterator which begins at It and moves forwards until End is reached,...
LLVM_ABI raw_fd_ostream & errs()
This returns a reference to a raw_ostream for standard error.
auto drop_end(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the last N elements excluded.
static MCRegister getXRegFromWReg(MCRegister Reg)
MCCFIInstruction createCFAOffset(const TargetRegisterInfo &MRI, unsigned Reg, const StackOffset &OffsetFromDefCFA, std::optional< int64_t > IncomingVGOffsetFromDefCFA)
FunctionAddr VTableAddr Next
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
static bool isUncondBranchOpcode(int Opc)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
constexpr bool isIntN(unsigned N, int64_t x)
Checks if an signed integer fits into the given (dynamic) bit width.
bool rewriteAArch64FrameIndex(MachineInstr &MI, unsigned FrameRegIdx, unsigned FrameReg, StackOffset &Offset, const AArch64InstrInfo *TII)
rewriteAArch64FrameIndex - Rewrite MI to access 'Offset' bytes from the FP.
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
static const MachineMemOperand::Flags MOSuppressPair
constexpr int64_t SignExtend64(uint64_t x)
Sign-extend the number in the bottom B bits of X to a 64-bit integer.
void appendLEB128(SmallVectorImpl< U > &Buffer, T Value)
bool optimizeTerminators(MachineBasicBlock *MBB, const TargetInstrInfo &TII)
std::pair< MachineOperand, DIExpression * > ParamLoadedValue
bool isNZCVTouchedInInstructionRange(const MachineInstr &DefMI, const MachineInstr &UseMI, const TargetRegisterInfo *TRI)
Return true if there is an instruction /after/ DefMI and before UseMI which either reads or clobbers ...
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
static const MachineMemOperand::Flags MOStridedAccess
constexpr RegState getUndefRegState(bool B)
void fullyRecomputeLiveIns(ArrayRef< MachineBasicBlock * > MBBs)
Convenience function for recomputing live-in's for a set of MBBs until the computation converges.
LLVM_ABI Printable printReg(Register Reg, const TargetRegisterInfo *TRI=nullptr, unsigned SubIdx=0, const MachineRegisterInfo *MRI=nullptr)
Prints virtual and physical registers with or without a TRI instance.
This struct is a compact representation of a valid (non-zero power of two) alignment.
Used to describe addressing mode similar to ExtAddrMode in CodeGenPrepare.
LLVM_ABI static const MBBSectionID ColdSectionID
This class contains a discriminated union of information about pointers in memory operands,...
static LLVM_ABI MachinePointerInfo getUnknownStack(MachineFunction &MF)
Stack memory without other information.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
An individual sequence of instructions to be replaced with a call to an outlined function.
MachineFunction * getMF() const
The information necessary to create an outlined function for some class of candidate.