46#define DEBUG_TYPE "gi-combiner"
55 cl::desc(
"Force all indexed operations to be "
56 "legal for the GlobalISel combiner"));
65 TII(
Builder.getMF().getSubtarget().getInstrInfo()),
66 RBI(
Builder.getMF().getSubtarget().getRegBankInfo()),
67 TRI(
Builder.getMF().getSubtarget().getRegisterInfo()) {
72 return *
Builder.getMF().getSubtarget().getTargetLowering();
90 assert(
I < ByteWidth &&
"I must be in [0, ByteWidth)");
98 LLT Ty = MRI.getType(V);
109 assert(
I < ByteWidth &&
"I must be in [0, ByteWidth)");
110 return ByteWidth -
I - 1;
130static std::optional<bool>
134 unsigned Width = MemOffset2Idx.
size();
137 bool BigEndian =
true, LittleEndian =
true;
138 for (
unsigned MemOffset = 0; MemOffset < Width; ++ MemOffset) {
139 auto MemOffsetAndIdx = MemOffset2Idx.
find(MemOffset);
140 if (MemOffsetAndIdx == MemOffset2Idx.
end())
142 const int64_t Idx = MemOffsetAndIdx->second - LowestIdx;
143 assert(Idx >= 0 &&
"Expected non-negative byte offset?");
146 if (!BigEndian && !LittleEndian)
150 assert((BigEndian != LittleEndian) &&
151 "Pattern cannot be both big and little endian!");
158 assert(
LI &&
"Must have LegalizerInfo to query isLegal!");
186 return isLegal({TargetOpcode::G_BUILD_VECTOR, {Ty, EltTy}}) &&
187 isLegal({TargetOpcode::G_CONSTANT, {EltTy}});
194 if (
MRI.constrainRegAttrs(ToReg, FromReg))
195 MRI.replaceRegWith(FromReg, ToReg);
197 Builder.buildCopy(FromReg, ToReg);
199 Observer.finishedChangingAllUsesOfReg();
214 unsigned ToOpcode)
const {
229 MRI.setRegBank(Reg, *RegBank);
240 if (
MI.getOpcode() != TargetOpcode::COPY)
250 MI.eraseFromParent();
259 if (!
MRI.hasOneNonDBGUse(OrigOp))
278 std::optional<MachineOperand> MaybePoisonOperand;
280 if (!Operand.isReg())
286 if (!MaybePoisonOperand)
287 MaybePoisonOperand = Operand;
296 if (!MaybePoisonOperand) {
301 B.buildCopy(
DstOp, OrigOp);
306 Register MaybePoisonOperandReg = MaybePoisonOperand->getReg();
307 LLT MaybePoisonOperandRegTy =
MRI.getType(MaybePoisonOperandReg);
314 auto Freeze =
B.buildFreeze(MaybePoisonOperandRegTy, MaybePoisonOperandReg);
325 assert(
MI.getOpcode() == TargetOpcode::G_CONCAT_VECTORS &&
326 "Invalid instruction");
336 assert(Def &&
"Operand not defined");
337 if (!
MRI.hasOneNonDBGUse(Reg))
339 switch (Def->getOpcode()) {
340 case TargetOpcode::G_BUILD_VECTOR:
345 Ops.push_back(BuildVecMO.getReg());
347 case TargetOpcode::G_IMPLICIT_DEF: {
348 LLT OpType =
MRI.getType(Reg);
355 OpType.getScalarType() &&
356 "All undefs should have the same type");
359 for (
unsigned EltIdx = 0, EltEnd = OpType.getNumElements();
360 EltIdx != EltEnd; ++EltIdx)
361 Ops.push_back(
Undef->getOperand(0).getReg());
370 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
372 {TargetOpcode::G_BUILD_VECTOR, {DstTy,
MRI.getType(
Ops[0])}})) {
387 Register NewDstReg =
MRI.cloneVirtualRegister(DstReg);
400 MI.eraseFromParent();
409 if (!Unmerge || Unmerge->
getReg(0) != BV.getSourceReg(0))
412 if (BC->
getOpcode() != TargetOpcode::G_BITCAST)
416 if (!InputTy.
isScalar() || BV.getNumSources() % Factor != 0)
421 if (!
isLegal({TargetOpcode::G_BUILD_VECTOR, {BVDstTy, InputTy}}))
425 for (
unsigned Idx = 0; Idx < BV.getNumSources(); Idx += Factor) {
429 if (Src->getOpcode() == TargetOpcode::G_IMPLICIT_DEF)
438 if (BC->
getOpcode() != TargetOpcode::G_BITCAST ||
462 auto BV =
Builder.buildBuildVector(BVDstTy,
Ops);
463 Builder.buildBitcast(
MI.getOperand(0).getReg(), BV);
464 MI.eraseFromParent();
470 Register SrcVec1 = Shuffle.getSrc1Reg();
471 Register SrcVec2 = Shuffle.getSrc2Reg();
472 LLT EltTy =
MRI.getType(SrcVec1).getElementType();
473 int Width =
MRI.getType(SrcVec1).getNumElements();
475 auto Unmerge1 =
Builder.buildUnmerge(EltTy, SrcVec1);
476 auto Unmerge2 =
Builder.buildUnmerge(EltTy, SrcVec2);
480 for (
int Val : Shuffle.getMask()) {
483 else if (Val < Width)
484 Extracts.
push_back(Unmerge1.getReg(Val));
486 Extracts.
push_back(Unmerge2.getReg(Val - Width));
488 assert(Extracts.
size() > 0 &&
"Expected at least one element in the shuffle");
489 if (Extracts.
size() == 1)
490 Builder.buildCopy(
MI.getOperand(0).getReg(), Extracts[0]);
492 Builder.buildBuildVector(
MI.getOperand(0).getReg(), Extracts);
493 MI.eraseFromParent();
503 if (!ConcatMI1 || !ConcatMI2)
507 if (
MRI.getType(ConcatMI1->getSourceReg(0)) !=
508 MRI.getType(ConcatMI2->getSourceReg(0)))
511 LLT ConcatSrcTy =
MRI.getType(ConcatMI1->getReg(1));
512 LLT ShuffleSrcTy1 =
MRI.getType(
MI.getOperand(1).getReg());
514 for (
unsigned i = 0; i < Mask.size(); i += ConcatSrcNumElt) {
518 for (
unsigned j = 1; j < ConcatSrcNumElt; j++) {
519 if (i + j >= Mask.size())
521 if (Mask[i + j] != -1)
525 {TargetOpcode::G_IMPLICIT_DEF, {ConcatSrcTy}}))
528 }
else if (Mask[i] % ConcatSrcNumElt == 0) {
529 for (
unsigned j = 1; j < ConcatSrcNumElt; j++) {
530 if (i + j >= Mask.size())
532 if (Mask[i + j] != Mask[i] +
static_cast<int>(j))
538 Ops.push_back(ConcatMI1->getSourceReg(Mask[i] / ConcatSrcNumElt));
540 Ops.push_back(ConcatMI2->getSourceReg(Mask[i] / ConcatSrcNumElt -
541 ConcatMI1->getNumSources()));
549 {TargetOpcode::G_CONCAT_VECTORS,
550 {
MRI.getType(
MI.getOperand(0).getReg()), ConcatSrcTy}}))
561 SrcTy =
MRI.getType(Reg);
563 assert(SrcTy.isValid() &&
"Unexpected full undef vector in concat combine");
570 UndefReg =
Builder.buildUndef(SrcTy).getReg(0);
576 Builder.buildConcatVectors(
MI.getOperand(0).getReg(),
Ops);
579 MI.eraseFromParent();
584 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR &&
585 "Invalid instruction kind");
586 LLT DstType =
MRI.getType(
MI.getOperand(0).getReg());
588 LLT SrcType =
MRI.getType(Src1);
590 unsigned DstNumElts = DstType.getNumElements();
591 unsigned SrcNumElts = SrcType.getNumElements();
608 if (DstNumElts < 2 * SrcNumElts)
613 if (DstNumElts % SrcNumElts != 0)
619 unsigned NumConcat = DstNumElts / SrcNumElts;
622 for (
unsigned i = 0; i != DstNumElts; ++i) {
629 if ((Idx % SrcNumElts != (i % SrcNumElts)) ||
630 (ConcatSrcs[i / SrcNumElts] >= 0 &&
631 ConcatSrcs[i / SrcNumElts] != (
int)(Idx / SrcNumElts)))
634 ConcatSrcs[i / SrcNumElts] = Idx / SrcNumElts;
641 for (
auto Src : ConcatSrcs) {
645 UndefReg =
Builder.buildUndef(SrcType).getReg(0);
647 Ops.push_back(UndefReg);
660 Register NewDstReg =
MRI.cloneVirtualRegister(DstReg);
668 MI.eraseFromParent();
677 const LLT TyForCandidate,
678 unsigned OpcodeForCandidate,
683 return {TyForCandidate, OpcodeForCandidate, MIForCandidate};
694 if (OpcodeForCandidate == TargetOpcode::G_ANYEXT &&
697 else if (CurrentUse.
ExtendOpcode == TargetOpcode::G_ANYEXT &&
698 OpcodeForCandidate != TargetOpcode::G_ANYEXT)
699 return {TyForCandidate, OpcodeForCandidate, MIForCandidate};
707 OpcodeForCandidate == TargetOpcode::G_ZEXT)
709 else if (CurrentUse.
ExtendOpcode == TargetOpcode::G_ZEXT &&
710 OpcodeForCandidate == TargetOpcode::G_SEXT)
711 return {TyForCandidate, OpcodeForCandidate, MIForCandidate};
720 return {TyForCandidate, OpcodeForCandidate, MIForCandidate};
731static void InsertInsnsWithoutSideEffectsBeforeUse(
743 InsertBB = PredBB->
getMBB();
748 if (InsertBB ==
DefMI.getParent()) {
750 Inserter(InsertBB, std::next(InsertPt), UseMO);
769 unsigned CandidateLoadOpc;
771 case TargetOpcode::G_ANYEXT:
772 CandidateLoadOpc = TargetOpcode::G_LOAD;
774 case TargetOpcode::G_SEXT:
775 CandidateLoadOpc = TargetOpcode::G_SEXTLOAD;
777 case TargetOpcode::G_ZEXT:
778 CandidateLoadOpc = TargetOpcode::G_ZEXTLOAD;
783 return CandidateLoadOpc;
800 LLT LoadValueTy =
MRI.getType(LoadReg);
822 unsigned PreferredOpcode =
824 ? TargetOpcode::G_ANYEXT
826 Preferred = {
LLT(), PreferredOpcode,
nullptr};
827 for (
auto &
UseMI :
MRI.use_nodbg_instructions(LoadReg)) {
828 if (
UseMI.getOpcode() == TargetOpcode::G_SEXT ||
829 UseMI.getOpcode() == TargetOpcode::G_ZEXT ||
830 (
UseMI.getOpcode() == TargetOpcode::G_ANYEXT)) {
831 const auto &MMO = LoadMI->
getMMO();
839 LLT UseTy =
MRI.getType(
UseMI.getOperand(0).getReg());
841 if (
LI->getAction({CandidateLoadOpc, {UseTy, SrcTy}, {MMDesc}})
845 Preferred = ChoosePreferredUse(
MI, Preferred,
846 MRI.getType(
UseMI.getOperand(0).getReg()),
856 assert(Preferred.Ty != LoadValueTy &&
"Extending to same type?");
874 if (PreviouslyEmitted) {
881 Builder.setInsertPt(*InsertIntoBB, InsertBefore);
882 Register NewDstReg =
MRI.cloneVirtualRegister(
MI.getOperand(0).getReg());
884 EmittedInsns[InsertIntoBB] = NewMI;
890 MI.setDesc(
Builder.getTII().get(LoadOpc));
897 for (
auto *UseMO :
Uses) {
903 UseMI->getOpcode() == TargetOpcode::G_ANYEXT) {
906 const LLT UseDstTy =
MRI.getType(UseDstReg);
907 if (UseDstReg != ChosenDstReg) {
908 if (Preferred.
Ty == UseDstTy) {
945 InsertInsnsWithoutSideEffectsBeforeUse(
Builder,
MI, *UseMO,
960 InsertInsnsWithoutSideEffectsBeforeUse(
Builder,
MI, *UseMO, InsertTruncAt);
963 MI.getOperand(0).setReg(ChosenDstReg);
969 assert(
MI.getOpcode() == TargetOpcode::G_AND);
980 if (
MRI.getType(Dst).isVector())
988 APInt MaskVal = MaybeMask->Value;
1001 LLT RegTy =
MRI.getType(LoadReg);
1005 unsigned MaskSizeBits = MaskVal.
countr_one();
1008 !
MRI.hasOneNonDBGUse(LoadReg))
1013 if (MaskSizeBits > LoadSizeBits)
1033 else if (LoadSizeBits > MaskSizeBits || LoadSizeBits ==
RegSize)
1038 {TargetOpcode::G_ZEXTLOAD, {RegTy,
MRI.getType(PtrReg)}, {MemDesc}}))
1042 B.setInstrAndDebugLoc(*LoadMI);
1043 auto &MF =
B.getMF();
1045 auto *NewMMO = MF.getMachineMemOperand(&MMO, PtrInfo, MemDesc.
MemoryTy);
1046 B.buildLoadInstr(TargetOpcode::G_ZEXTLOAD, Dst, PtrReg, *NewMMO);
1056 "shouldn't consider debug uses");
1064 if (DefOrUse ==
MBB.end())
1066 return &*DefOrUse == &
DefMI;
1072 "shouldn't consider debug uses");
1075 else if (
DefMI.getParent() !=
UseMI.getParent())
1082 assert(
MI.getOpcode() == TargetOpcode::G_SEXT_INREG);
1086 if (
MRI.getType(SrcReg).isVector())
1091 LoadUser = TruncSrc;
1093 uint64_t SizeInBits =
MI.getOperand(2).getImm();
1098 auto LoadSizeBits = LoadMI->getMemSizeInBits();
1100 MRI.getType(TruncSrc).getSizeInBits() < LoadSizeBits.getValue())
1102 if (LoadSizeBits == SizeInBits)
1109 assert(
MI.getOpcode() == TargetOpcode::G_SEXT_INREG);
1110 Builder.buildCopy(
MI.getOperand(0).getReg(),
MI.getOperand(1).getReg());
1111 MI.eraseFromParent();
1115 MachineInstr &
MI, std::tuple<Register, unsigned> &MatchInfo)
const {
1116 assert(
MI.getOpcode() == TargetOpcode::G_SEXT_INREG);
1119 LLT RegTy =
MRI.getType(DstReg);
1130 uint64_t MemBits = LoadDef->getMemSizeInBits().getValue();
1131 uint64_t ExtFrom =
MI.getOperand(2).getImm();
1133 if (MemBits > ExtFrom && !
MRI.hasOneNonDBGUse(SrcReg))
1139 unsigned NewSizeBits = std::min(ExtFrom, MemBits);
1142 if (NewSizeBits < 8)
1154 if (LoadDef->isSimple())
1156 else if (MemBits > NewSizeBits || MemBits == RegTy.
getSizeInBits())
1161 {
MRI.getType(LoadDef->getDstReg()),
1162 MRI.getType(LoadDef->getPointerReg())},
1166 MatchInfo = std::make_tuple(LoadDef->getDstReg(), NewSizeBits);
1171 MachineInstr &
MI, std::tuple<Register, unsigned> &MatchInfo)
const {
1172 assert(
MI.getOpcode() == TargetOpcode::G_SEXT_INREG);
1174 unsigned ScalarSizeBits;
1175 std::tie(LoadReg, ScalarSizeBits) = MatchInfo;
1184 auto &MMO = LoadDef->
getMMO();
1185 Builder.setInstrAndDebugLoc(*LoadDef);
1187 auto PtrInfo = MMO.getPointerInfo();
1188 auto *NewMMO = MF.getMachineMemOperand(&MMO, PtrInfo, ScalarSizeBits / 8);
1189 Builder.buildLoadInstr(TargetOpcode::G_SEXTLOAD,
MI.getOperand(0).getReg(),
1192 MI.eraseFromParent();
1203 auto *MF =
MI->getMF();
1210 AM.
BaseOffs = CstOff->getSExtValue();
1215 MF->getDataLayout(), AM,
1217 MF->getFunction().getContext()),
1218 MI->getMMO().getAddrSpace());
1223 case TargetOpcode::G_LOAD:
1224 return TargetOpcode::G_INDEXED_LOAD;
1225 case TargetOpcode::G_STORE:
1226 return TargetOpcode::G_INDEXED_STORE;
1227 case TargetOpcode::G_ZEXTLOAD:
1228 return TargetOpcode::G_INDEXED_ZEXTLOAD;
1229 case TargetOpcode::G_SEXTLOAD:
1230 return TargetOpcode::G_INDEXED_SEXTLOAD;
1236bool CombinerHelper::isIndexedLoadStoreLegal(
GLoadStore &LdSt)
const {
1246 if (IndexedOpc == TargetOpcode::G_INDEXED_STORE)
1247 OpTys = {PtrTy, Ty, Ty};
1249 OpTys = {Ty, PtrTy};
1251 LegalityQuery Q(IndexedOpc, OpTys, MemDescrs);
1257 cl::desc(
"Number of uses of a base pointer to check before it is no longer "
1258 "considered for post-indexing."));
1262 bool &RematOffset)
const {
1275 if (!isIndexedLoadStoreLegal(LdSt))
1284 unsigned NumUsesChecked = 0;
1297 if (StoredValDef == &
Use)
1300 Offset = PtrAdd->getOffsetReg();
1302 !TLI.isIndexingLegal(LdSt, PtrAdd->getBaseReg(),
Offset,
1308 RematOffset =
false;
1312 if (OffsetDef->
getOpcode() != TargetOpcode::G_CONSTANT)
1317 for (
auto &BasePtrUse :
MRI.use_nodbg_instructions(PtrAdd->getBaseReg())) {
1318 if (&BasePtrUse == PtrDef)
1324 if (BasePtrLdSt && BasePtrLdSt != &LdSt &&
1326 isIndexedLoadStoreLegal(*BasePtrLdSt))
1332 Register PtrAddDefReg = BasePtrUseDef->getReg(0);
1333 for (
auto &BaseUseUse :
MRI.use_nodbg_instructions(PtrAddDefReg)) {
1336 if (BaseUseUse.getParent() != LdSt.
getParent())
1348 Addr = PtrAdd->getReg(0);
1349 Base = PtrAdd->getBaseReg();
1364 MRI.hasOneNonDBGUse(Addr))
1371 if (!isIndexedLoadStoreLegal(LdSt))
1375 if (BaseDef->
getOpcode() == TargetOpcode::G_FRAME_INDEX)
1380 if (
Base == St->getValueReg())
1385 if (St->getValueReg() == Addr)
1390 for (
auto &AddrUse :
MRI.use_nodbg_instructions(Addr))
1391 if (AddrUse.getParent() != LdSt.
getParent())
1396 bool RealUse =
false;
1397 for (
auto &AddrUse :
MRI.use_nodbg_instructions(Addr)) {
1415 assert(
MI.getOpcode() == TargetOpcode::G_EXTRACT_VECTOR_ELT);
1425 assert(
MRI.getType(
MI.getOperand(0).getReg()) == VecEltTy);
1432 if (!LoadMI->isSimple())
1444 const unsigned MaxIter = 20;
1447 if (
II->isLoadFoldBarrier())
1449 if (Iter++ == MaxIter)
1465 int Elt = CVal->getZExtValue();
1478 Register VecPtr = LoadMI->getPointerReg();
1479 LLT PtrTy =
MRI.getType(VecPtr);
1487 {TargetOpcode::G_LOAD, {VecEltTy, PtrTy}, {MMDesc}}))
1510 B.buildLoad(Result, finalPtr, PtrInfo, Alignment);
1525 MatchInfo.
IsPre = findPreIndexCandidate(LdSt, MatchInfo.
Addr, MatchInfo.
Base,
1527 if (!MatchInfo.
IsPre &&
1528 !findPostIndexCandidate(LdSt, MatchInfo.
Addr, MatchInfo.
Base,
1538 unsigned Opcode =
MI.getOpcode();
1539 bool IsStore = Opcode == TargetOpcode::G_STORE;
1545 auto *OldCst =
MRI.getVRegDef(MatchInfo.
Offset);
1547 *OldCst->getOperand(1).getCImm());
1548 MatchInfo.
Offset = NewCst.getReg(0);
1551 auto MIB =
Builder.buildInstr(NewOpcode);
1553 MIB.addDef(MatchInfo.
Addr);
1554 MIB.addUse(
MI.getOperand(0).getReg());
1556 MIB.addDef(
MI.getOperand(0).getReg());
1557 MIB.addDef(MatchInfo.
Addr);
1560 MIB.addUse(MatchInfo.
Base);
1561 MIB.addUse(MatchInfo.
Offset);
1562 MIB.addImm(MatchInfo.
IsPre);
1563 MIB->cloneMemRefs(*
MI.getMF(),
MI);
1564 MI.eraseFromParent();
1572 unsigned Opcode =
MI.getOpcode();
1573 bool IsDiv, IsSigned;
1578 case TargetOpcode::G_SDIV:
1579 case TargetOpcode::G_UDIV: {
1581 IsSigned = Opcode == TargetOpcode::G_SDIV;
1584 case TargetOpcode::G_SREM:
1585 case TargetOpcode::G_UREM: {
1587 IsSigned = Opcode == TargetOpcode::G_SREM;
1593 unsigned DivOpcode, RemOpcode, DivremOpcode;
1595 DivOpcode = TargetOpcode::G_SDIV;
1596 RemOpcode = TargetOpcode::G_SREM;
1597 DivremOpcode = TargetOpcode::G_SDIVREM;
1599 DivOpcode = TargetOpcode::G_UDIV;
1600 RemOpcode = TargetOpcode::G_UREM;
1601 DivremOpcode = TargetOpcode::G_UDIVREM;
1619 for (
auto &
UseMI :
MRI.use_nodbg_instructions(Src1)) {
1620 if (
MI.getParent() ==
UseMI.getParent() &&
1621 ((IsDiv &&
UseMI.getOpcode() == RemOpcode) ||
1622 (!IsDiv &&
UseMI.getOpcode() == DivOpcode)) &&
1635 unsigned Opcode =
MI.getOpcode();
1636 assert(OtherMI &&
"OtherMI shouldn't be empty.");
1639 if (Opcode == TargetOpcode::G_SDIV || Opcode == TargetOpcode::G_UDIV) {
1640 DestDivReg =
MI.getOperand(0).getReg();
1644 DestRemReg =
MI.getOperand(0).getReg();
1648 Opcode == TargetOpcode::G_SDIV || Opcode == TargetOpcode::G_SREM;
1655 Builder.setInstrAndDebugLoc(*FirstInst);
1657 Builder.buildInstr(IsSigned ? TargetOpcode::G_SDIVREM
1658 : TargetOpcode::G_UDIVREM,
1659 {DestDivReg, DestRemReg},
1661 MI.eraseFromParent();
1667 assert(
MI.getOpcode() == TargetOpcode::G_BR);
1684 if (BrIt ==
MBB->begin())
1686 assert(std::next(BrIt) ==
MBB->end() &&
"expected G_BR to be a terminator");
1688 BrCond = &*std::prev(BrIt);
1689 if (BrCond->
getOpcode() != TargetOpcode::G_BRCOND)
1695 return BrCondTarget !=
MI.getOperand(0).getMBB() &&
1696 MBB->isLayoutSuccessor(BrCondTarget);
1702 Builder.setInstrAndDebugLoc(*BrCond);
1707 auto True =
Builder.buildConstant(
1713 MI.getOperand(0).setMBB(FallthroughBB);
1726 unsigned MaxLen)
const {
1727 auto &[Dst, Src, KnownLen, Alignment, DstAlignCanChange, MemOps] = MatchInfo;
1729 DstAlignCanChange, MemOps);
1734 auto &[Dst, Src, KnownLen, Alignment, DstAlignCanChange, MemOps] = MatchInfo;
1739 DstAlignCanChange, MemOps) ==
1741 assert(
Changed &&
"expected memcpy-family instruction to lower");
1746 unsigned MaxLen)
const {
1758 switch (
MI.getOpcode()) {
1761 case TargetOpcode::G_FNEG: {
1762 Result.changeSign();
1765 case TargetOpcode::G_FABS: {
1769 case TargetOpcode::G_FCEIL:
1772 case TargetOpcode::G_FFLOOR:
1775 case TargetOpcode::G_INTRINSIC_TRUNC:
1778 case TargetOpcode::G_INTRINSIC_ROUND:
1781 case TargetOpcode::G_INTRINSIC_ROUNDEVEN:
1784 case TargetOpcode::G_FRINT:
1785 case TargetOpcode::G_FNEARBYINT:
1789 case TargetOpcode::G_FPEXT:
1790 case TargetOpcode::G_FPTRUNC: {
1797 case TargetOpcode::G_FSQRT: {
1801 Result =
APFloat(sqrt(Result.convertToDouble()));
1804 case TargetOpcode::G_FLOG2: {
1824 Builder.buildFConstant(
MI.getOperand(0), *NewCst);
1825 MI.eraseFromParent();
1836 if (
MI.getOpcode() != TargetOpcode::G_PTR_ADD)
1846 if (!Add2Def || Add2Def->
getOpcode() != TargetOpcode::G_PTR_ADD)
1859 Type *AccessTy =
nullptr;
1860 auto &MF = *
MI.getMF();
1861 for (
auto &
UseMI :
MRI.use_nodbg_instructions(
MI.getOperand(0).getReg())) {
1864 MF.getFunction().getContext());
1869 APInt CombinedImm = MaybeImmVal->Value + MaybeImm2Val->Value;
1874 AMOld.
BaseOffs = MaybeImmVal->Value.getSExtValue();
1876 unsigned AS =
MRI.getType(Add2).getAddressSpace();
1877 const auto &TLI = *MF.getSubtarget().getTargetLowering();
1878 if (TLI.isLegalAddressingMode(MF.getDataLayout(), AMOld, AccessTy, AS) &&
1879 !TLI.isLegalAddressingMode(MF.getDataLayout(), AMNew, AccessTy, AS))
1888 unsigned PtrAddFlags =
MI.getFlags();
1889 unsigned LHSPtrAddFlags = Add2Def->
getFlags();
1905 MatchInfo.
Flags = Flags;
1911 assert(
MI.getOpcode() == TargetOpcode::G_PTR_ADD &&
"Expected G_PTR_ADD");
1913 LLT OffsetTy =
MRI.getType(
MI.getOperand(2).getReg());
1917 MI.getOperand(1).setReg(MatchInfo.
Base);
1918 MI.getOperand(2).setReg(NewOffset.getReg(0));
1932 unsigned Opcode =
MI.getOpcode();
1933 assert((Opcode == TargetOpcode::G_SHL || Opcode == TargetOpcode::G_ASHR ||
1934 Opcode == TargetOpcode::G_LSHR || Opcode == TargetOpcode::G_SSHLSAT ||
1935 Opcode == TargetOpcode::G_USHLSAT) &&
1936 "Expected G_SHL, G_ASHR, G_LSHR, G_SSHLSAT or G_USHLSAT");
1956 (MaybeImmVal->Value.getZExtValue() + MaybeImm2Val->Value).getZExtValue();
1961 if (Opcode == TargetOpcode::G_USHLSAT &&
1962 MatchInfo.
Imm >=
MRI.getType(Shl2).getScalarSizeInBits())
1970 unsigned Opcode =
MI.getOpcode();
1971 assert((Opcode == TargetOpcode::G_SHL || Opcode == TargetOpcode::G_ASHR ||
1972 Opcode == TargetOpcode::G_LSHR || Opcode == TargetOpcode::G_SSHLSAT ||
1973 Opcode == TargetOpcode::G_USHLSAT) &&
1974 "Expected G_SHL, G_ASHR, G_LSHR, G_SSHLSAT or G_USHLSAT");
1976 LLT Ty =
MRI.getType(
MI.getOperand(1).getReg());
1977 unsigned const ScalarSizeInBits = Ty.getScalarSizeInBits();
1978 auto Imm = MatchInfo.
Imm;
1980 if (Imm >= ScalarSizeInBits) {
1982 if (Opcode == TargetOpcode::G_SHL || Opcode == TargetOpcode::G_LSHR) {
1983 Builder.buildConstant(
MI.getOperand(0), 0);
1984 MI.eraseFromParent();
1989 Imm = ScalarSizeInBits - 1;
1992 LLT ImmTy =
MRI.getType(
MI.getOperand(2).getReg());
1995 MI.getOperand(1).setReg(MatchInfo.
Reg);
1996 MI.getOperand(2).setReg(NewImm);
2012 unsigned ShiftOpcode =
MI.getOpcode();
2013 assert((ShiftOpcode == TargetOpcode::G_SHL ||
2014 ShiftOpcode == TargetOpcode::G_ASHR ||
2015 ShiftOpcode == TargetOpcode::G_LSHR ||
2016 ShiftOpcode == TargetOpcode::G_USHLSAT ||
2017 ShiftOpcode == TargetOpcode::G_SSHLSAT) &&
2018 "Expected G_SHL, G_ASHR, G_LSHR, G_USHLSAT and G_SSHLSAT");
2021 Register LogicDest =
MI.getOperand(1).getReg();
2022 if (!
MRI.hasOneNonDBGUse(LogicDest))
2026 unsigned LogicOpcode = LogicMI->
getOpcode();
2027 if (LogicOpcode != TargetOpcode::G_AND && LogicOpcode != TargetOpcode::G_OR &&
2028 LogicOpcode != TargetOpcode::G_XOR)
2032 const Register C1 =
MI.getOperand(2).getReg();
2034 if (!MaybeImmVal || MaybeImmVal->Value == 0)
2037 const uint64_t C1Val = MaybeImmVal->Value.getZExtValue();
2041 if (
MI->getOpcode() != ShiftOpcode ||
2042 !
MRI.hasOneNonDBGUse(
MI->getOperand(0).getReg()))
2051 ShiftVal = MaybeImmVal->Value.getSExtValue();
2062 if (matchFirstShift(LogicMIOp1, C0Val)) {
2064 MatchInfo.
Shift2 = LogicMIOp1;
2065 }
else if (matchFirstShift(LogicMIOp2, C0Val)) {
2067 MatchInfo.
Shift2 = LogicMIOp2;
2071 MatchInfo.
ValSum = C0Val + C1Val;
2074 if (MatchInfo.
ValSum >=
MRI.getType(LogicDest).getScalarSizeInBits())
2077 MatchInfo.
Logic = LogicMI;
2083 unsigned Opcode =
MI.getOpcode();
2084 assert((Opcode == TargetOpcode::G_SHL || Opcode == TargetOpcode::G_ASHR ||
2085 Opcode == TargetOpcode::G_LSHR || Opcode == TargetOpcode::G_USHLSAT ||
2086 Opcode == TargetOpcode::G_SSHLSAT) &&
2087 "Expected G_SHL, G_ASHR, G_LSHR, G_USHLSAT and G_SSHLSAT");
2089 LLT ShlType =
MRI.getType(
MI.getOperand(2).getReg());
2090 LLT DestType =
MRI.getType(
MI.getOperand(0).getReg());
2096 Builder.buildInstr(Opcode, {DestType}, {Shift1Base, Const}).
getReg(0);
2105 Register Shift2Const =
MI.getOperand(2).getReg();
2107 .buildInstr(Opcode, {DestType},
2117 MI.eraseFromParent();
2122 assert(
MI.getOpcode() == TargetOpcode::G_SHL &&
"Expected G_SHL");
2144 auto *SrcDef =
MRI.getVRegDef(SrcReg);
2145 assert((SrcDef->getOpcode() == TargetOpcode::G_ADD ||
2146 SrcDef->getOpcode() == TargetOpcode::G_OR) &&
"Unexpected op");
2147 LLT SrcTy =
MRI.getType(SrcReg);
2149 auto S1 =
B.buildShl(SrcTy,
X, ShiftReg);
2150 auto S2 =
B.buildShl(SrcTy, C1, ShiftReg);
2151 B.buildInstr(SrcDef->getOpcode(), {DstReg}, {S1, S2});
2159 assert(
MI.getOpcode() == TargetOpcode::G_LSHR &&
"Expected a G_LSHR");
2163 unsigned OpSizeInBits =
MRI.getType(N0).getScalarSizeInBits();
2178 LLT InnerShiftTy =
MRI.getType(InnerShift);
2180 if ((N1C + N001C).ult(InnerShiftSize)) {
2186 if ((N001C + OpSizeInBits) == InnerShiftSize)
2188 if (
MRI.hasOneUse(N0) &&
MRI.hasOneUse(InnerShift)) {
2189 MatchInfo.
Mask =
true;
2199 assert(
MI.getOpcode() == TargetOpcode::G_LSHR &&
"Expected a G_LSHR");
2206 if (MatchInfo.
Mask ==
true) {
2214 Builder.buildTrunc(Dst, Shift);
2215 MI.eraseFromParent();
2219 unsigned &ShiftVal)
const {
2220 assert(
MI.getOpcode() == TargetOpcode::G_MUL &&
"Expected a G_MUL");
2226 ShiftVal = MaybeImmVal->Value.exactLogBase2();
2227 return (
static_cast<int32_t
>(ShiftVal) != -1);
2231 unsigned &ShiftVal)
const {
2232 assert(
MI.getOpcode() == TargetOpcode::G_MUL &&
"Expected a G_MUL");
2234 LLT ShiftTy =
MRI.getType(
MI.getOperand(0).getReg());
2237 MI.setDesc(MIB.
getTII().
get(TargetOpcode::G_SHL));
2238 MI.getOperand(2).setReg(ShiftCst.getReg(0));
2259 auto NegCst =
B.buildConstant(Ty, -Imm);
2261 MI.setDesc(
B.getTII().get(TargetOpcode::G_ADD));
2262 MI.getOperand(2).setReg(NegCst.getReg(0));
2264 if (Imm.isMinSignedValue())
2274 assert(
MI.getOpcode() == TargetOpcode::G_SHL &&
VT);
2289 if (!MaybeShiftAmtVal)
2293 LLT SrcTy =
MRI.getType(ExtSrc);
2303 int64_t ShiftAmt = MaybeShiftAmtVal->getSExtValue();
2304 MatchData.
Reg = ExtSrc;
2305 MatchData.
Imm = ShiftAmt;
2307 unsigned MinLeadingZeros =
VT->getKnownZeroes(ExtSrc).countl_one();
2308 unsigned SrcTySize =
MRI.getType(ExtSrc).getScalarSizeInBits();
2309 return MinLeadingZeros >= ShiftAmt && ShiftAmt < SrcTySize;
2315 int64_t ShiftAmtVal = MatchData.
Imm;
2317 LLT ExtSrcTy =
MRI.getType(ExtSrcReg);
2318 auto ShiftAmt =
Builder.buildConstant(ExtSrcTy, ShiftAmtVal);
2320 Builder.buildShl(ExtSrcTy, ExtSrcReg, ShiftAmt,
MI.getFlags());
2321 Builder.buildZExt(
MI.getOperand(0), NarrowShift);
2322 MI.eraseFromParent();
2329 for (
unsigned I = 0;
I <
Merge.getNumSources(); ++
I)
2333 if (!Unmerge || Unmerge->getNumDefs() !=
Merge.getNumSources())
2336 for (
unsigned I = 0;
I < MergedValues.
size(); ++
I)
2337 if (MergedValues[
I] != Unmerge->getReg(
I))
2340 MatchInfo = Unmerge->getSourceReg();
2354 assert(
MI.getOpcode() == TargetOpcode::G_UNMERGE_VALUES &&
2355 "Expected an unmerge");
2364 LLT SrcMergeTy =
MRI.getType(SrcInstr->getSourceReg(0));
2365 LLT Dst0Ty =
MRI.getType(Unmerge.getReg(0));
2367 if (SrcMergeTy != Dst0Ty && !SameSize)
2371 for (
unsigned Idx = 0; Idx < SrcInstr->getNumSources(); ++Idx)
2372 Operands.
push_back(SrcInstr->getSourceReg(Idx));
2378 assert(
MI.getOpcode() == TargetOpcode::G_UNMERGE_VALUES &&
2379 "Expected an unmerge");
2381 "Not enough operands to replace all defs");
2382 unsigned NumElems =
MI.getNumOperands() - 1;
2384 LLT SrcTy =
MRI.getType(Operands[0]);
2385 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
2386 bool CanReuseInputDirectly = DstTy == SrcTy;
2387 for (
unsigned Idx = 0; Idx < NumElems; ++Idx) {
2388 Register DstReg =
MI.getOperand(Idx).getReg();
2393 const auto &DstCB =
MRI.getRegClassOrRegBank(DstReg);
2394 if (!DstCB.isNull() && DstCB !=
MRI.getRegClassOrRegBank(SrcReg)) {
2395 SrcReg =
Builder.buildCopy(
MRI.getType(SrcReg), SrcReg).getReg(0);
2396 MRI.setRegClassOrRegBank(SrcReg, DstCB);
2399 if (CanReuseInputDirectly)
2402 Builder.buildCast(DstReg, SrcReg);
2404 MI.eraseFromParent();
2409 unsigned SrcIdx =
MI.getNumOperands() - 1;
2410 Register SrcReg =
MI.getOperand(SrcIdx).getReg();
2412 if (SrcInstr->
getOpcode() != TargetOpcode::G_CONSTANT &&
2413 SrcInstr->
getOpcode() != TargetOpcode::G_FCONSTANT)
2421 LLT Dst0Ty =
MRI.getType(
MI.getOperand(0).getReg());
2424 for (
unsigned Idx = 0; Idx != SrcIdx; ++Idx) {
2426 Val = Val.
lshr(ShiftAmt);
2434 assert(
MI.getOpcode() == TargetOpcode::G_UNMERGE_VALUES &&
2435 "Expected an unmerge");
2437 "Not enough operands to replace all defs");
2438 unsigned NumElems =
MI.getNumOperands() - 1;
2439 for (
unsigned Idx = 0; Idx < NumElems; ++Idx) {
2440 Register DstReg =
MI.getOperand(Idx).getReg();
2441 Builder.buildConstant(DstReg, Csts[Idx]);
2444 MI.eraseFromParent();
2450 unsigned SrcIdx =
MI.getNumOperands() - 1;
2451 Register SrcReg =
MI.getOperand(SrcIdx).getReg();
2453 unsigned NumElems =
MI.getNumOperands() - 1;
2454 for (
unsigned Idx = 0; Idx < NumElems; ++Idx) {
2455 Register DstReg =
MI.getOperand(Idx).getReg();
2456 B.buildUndef(DstReg);
2464 assert(
MI.getOpcode() == TargetOpcode::G_UNMERGE_VALUES &&
2465 "Expected an unmerge");
2466 if (
MRI.getType(
MI.getOperand(0).getReg()).isVector() ||
2467 MRI.getType(
MI.getOperand(
MI.getNumDefs()).getReg()).isVector())
2470 for (
unsigned Idx = 1, EndIdx =
MI.getNumDefs(); Idx != EndIdx; ++Idx) {
2471 if (!
MRI.use_nodbg_empty(
MI.getOperand(Idx).getReg()))
2479 Register SrcReg =
MI.getOperand(
MI.getNumDefs()).getReg();
2480 Register Dst0Reg =
MI.getOperand(0).getReg();
2481 Builder.buildTrunc(Dst0Reg, SrcReg);
2482 MI.eraseFromParent();
2486 assert(
MI.getOpcode() == TargetOpcode::G_UNMERGE_VALUES &&
2487 "Expected an unmerge");
2488 Register Dst0Reg =
MI.getOperand(0).getReg();
2489 LLT Dst0Ty =
MRI.getType(Dst0Reg);
2495 Register SrcReg =
MI.getOperand(
MI.getNumDefs()).getReg();
2496 LLT SrcTy =
MRI.getType(SrcReg);
2497 if (SrcTy.isVector())
2507 LLT ZExtSrcTy =
MRI.getType(ZExtSrcReg);
2512 assert(
MI.getOpcode() == TargetOpcode::G_UNMERGE_VALUES &&
2513 "Expected an unmerge");
2515 Register Dst0Reg =
MI.getOperand(0).getReg();
2518 MRI.getVRegDef(
MI.getOperand(
MI.getNumDefs()).getReg());
2520 "Expecting a G_ZEXT");
2523 LLT Dst0Ty =
MRI.getType(Dst0Reg);
2524 LLT ZExtSrcTy =
MRI.getType(ZExtSrcReg);
2527 Builder.buildZExt(Dst0Reg, ZExtSrcReg);
2530 "ZExt src doesn't fit in destination");
2535 for (
unsigned Idx = 1, EndIdx =
MI.getNumDefs(); Idx != EndIdx; ++Idx) {
2537 ZeroReg =
Builder.buildConstant(Dst0Ty, 0).getReg(0);
2540 MI.eraseFromParent();
2544 unsigned TargetShiftSize,
2545 unsigned &ShiftVal)
const {
2546 assert((
MI.getOpcode() == TargetOpcode::G_SHL ||
2547 MI.getOpcode() == TargetOpcode::G_LSHR ||
2548 MI.getOpcode() == TargetOpcode::G_ASHR) &&
"Expected a shift");
2550 LLT Ty =
MRI.getType(
MI.getOperand(0).getReg());
2555 unsigned Size = Ty.getSizeInBits();
2556 if (
Size <= TargetShiftSize)
2564 ShiftVal = MaybeImmVal->Value.getSExtValue();
2565 return ShiftVal >=
Size / 2 && ShiftVal <
Size;
2572 LLT Ty =
MRI.getType(SrcReg);
2573 unsigned Size = Ty.getSizeInBits();
2574 unsigned HalfSize =
Size / 2;
2575 assert(ShiftVal >= HalfSize);
2579 auto Unmerge =
Builder.buildUnmerge(HalfTy, SrcReg);
2580 unsigned NarrowShiftAmt = ShiftVal - HalfSize;
2582 if (
MI.getOpcode() == TargetOpcode::G_LSHR) {
2583 Register Narrowed = Unmerge.getReg(1);
2590 if (NarrowShiftAmt != 0) {
2591 Narrowed =
Builder.buildLShr(HalfTy, Narrowed,
2592 Builder.buildConstant(HalfTy, NarrowShiftAmt)).getReg(0);
2595 auto Zero =
Builder.buildConstant(HalfTy, 0);
2596 Builder.buildMergeLikeInstr(DstReg, {Narrowed, Zero});
2597 }
else if (
MI.getOpcode() == TargetOpcode::G_SHL) {
2598 Register Narrowed = Unmerge.getReg(0);
2603 if (NarrowShiftAmt != 0) {
2604 Narrowed =
Builder.buildShl(HalfTy, Narrowed,
2605 Builder.buildConstant(HalfTy, NarrowShiftAmt)).getReg(0);
2608 auto Zero =
Builder.buildConstant(HalfTy, 0);
2609 Builder.buildMergeLikeInstr(DstReg, {Zero, Narrowed});
2611 assert(
MI.getOpcode() == TargetOpcode::G_ASHR);
2613 HalfTy, Unmerge.getReg(1),
2614 Builder.buildConstant(HalfTy, HalfSize - 1));
2616 if (ShiftVal == HalfSize) {
2619 Builder.buildMergeLikeInstr(DstReg, {Unmerge.getReg(1),
Hi});
2620 }
else if (ShiftVal ==
Size - 1) {
2628 HalfTy, Unmerge.getReg(1),
2629 Builder.buildConstant(HalfTy, ShiftVal - HalfSize));
2637 MI.eraseFromParent();
2653 assert(
MI.getOpcode() == TargetOpcode::G_INTTOPTR &&
"Expected a G_INTTOPTR");
2655 LLT DstTy =
MRI.getType(DstReg);
2663 assert(
MI.getOpcode() == TargetOpcode::G_INTTOPTR &&
"Expected a G_INTTOPTR");
2665 Builder.buildCopy(DstReg, Reg);
2666 MI.eraseFromParent();
2671 assert(
MI.getOpcode() == TargetOpcode::G_PTRTOINT &&
"Expected a G_PTRTOINT");
2673 Builder.buildZExtOrTrunc(DstReg, Reg);
2674 MI.eraseFromParent();
2679 assert(
MI.getOpcode() == TargetOpcode::G_ADD);
2682 LLT IntTy =
MRI.getType(LHS);
2686 PtrReg.second =
false;
2687 for (
Register SrcReg : {LHS, RHS}) {
2691 LLT PtrTy =
MRI.getType(PtrReg.first);
2696 PtrReg.second =
true;
2708 const bool DoCommute = PtrReg.second;
2713 LLT PtrTy =
MRI.getType(LHS);
2715 auto PtrAdd =
Builder.buildPtrAdd(PtrTy, LHS, RHS);
2716 Builder.buildPtrToInt(Dst, PtrAdd);
2717 MI.eraseFromParent();
2721 APInt &NewCst)
const {
2723 Register LHS = PtrAdd.getBaseReg();
2724 Register RHS = PtrAdd.getOffsetReg();
2730 auto DstTy =
MRI.getType(PtrAdd.getReg(0));
2733 NewCst += RHSCst->
sextOrTrunc(DstTy.getSizeInBits());
2742 APInt &NewCst)
const {
2746 Builder.buildConstant(Dst, NewCst);
2747 PtrAdd.eraseFromParent();
2752 assert(
MI.getOpcode() == TargetOpcode::G_ANYEXT &&
"Expected a G_ANYEXT");
2757 SrcReg = OriginalSrcReg;
2758 LLT DstTy =
MRI.getType(DstReg);
2766 assert(
MI.getOpcode() == TargetOpcode::G_ZEXT &&
"Expected a G_ZEXT");
2769 LLT DstTy =
MRI.getType(DstReg);
2774 unsigned SrcSize =
MRI.getType(SrcReg).getScalarSizeInBits();
2775 return VT->getKnownBits(Reg).countMinLeadingZeros() >= DstSize - SrcSize;
2785 if (ShiftSize > 32 && TruncSize < 32)
2798 MachineInstr &
MI, std::pair<MachineInstr *, LLT> &MatchInfo)
const {
2799 assert(
MI.getOpcode() == TargetOpcode::G_TRUNC &&
"Expected a G_TRUNC");
2803 if (!
MRI.hasOneNonDBGUse(SrcReg))
2806 LLT SrcTy =
MRI.getType(SrcReg);
2807 LLT DstTy =
MRI.getType(DstReg);
2816 case TargetOpcode::G_SHL: {
2825 case TargetOpcode::G_LSHR:
2826 case TargetOpcode::G_ASHR: {
2832 for (
auto &
User :
MRI.use_instructions(DstReg))
2833 if (
User.getOpcode() == TargetOpcode::G_STORE)
2837 if (NewShiftTy == SrcTy)
2851 {NewShiftTy, TL.getPreferredShiftAmountTy(NewShiftTy)}}))
2854 MatchInfo = std::make_pair(SrcMI, NewShiftTy);
2859 MachineInstr &
MI, std::pair<MachineInstr *, LLT> &MatchInfo)
const {
2861 LLT NewShiftTy = MatchInfo.second;
2864 LLT DstTy =
MRI.getType(Dst);
2868 ShiftSrc =
Builder.buildTrunc(NewShiftTy, ShiftSrc).getReg(0);
2872 .buildInstr(ShiftMI->
getOpcode(), {NewShiftTy}, {ShiftSrc, ShiftAmt})
2875 if (NewShiftTy == DstTy)
2878 Builder.buildTrunc(Dst, NewShift);
2885 return MO.isReg() &&
2886 getOpcodeDef(TargetOpcode::G_IMPLICIT_DEF, MO.getReg(), MRI);
2892 return !MO.isReg() ||
2893 getOpcodeDef(TargetOpcode::G_IMPLICIT_DEF, MO.getReg(), MRI);
2898 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
2900 return all_of(Mask, [](
int Elt) {
return Elt < 0; });
2904 assert(
MI.getOpcode() == TargetOpcode::G_STORE);
2905 return getOpcodeDef(TargetOpcode::G_IMPLICIT_DEF,
MI.getOperand(0).getReg(),
2910 assert(
MI.getOpcode() == TargetOpcode::G_SELECT);
2911 return getOpcodeDef(TargetOpcode::G_IMPLICIT_DEF,
MI.getOperand(1).getReg(),
2917 assert((
MI.getOpcode() == TargetOpcode::G_INSERT_VECTOR_ELT ||
2918 MI.getOpcode() == TargetOpcode::G_EXTRACT_VECTOR_ELT) &&
2919 "Expected an insert/extract element op");
2920 LLT VecTy =
MRI.getType(
MI.getOperand(1).getReg());
2925 MI.getOpcode() == TargetOpcode::G_EXTRACT_VECTOR_ELT ? 2 : 3;
2933 unsigned &
OpIdx)
const {
2939 OpIdx = Cst->isZero() ? 3 : 2;
2984 if (I1->mayLoadOrStore() && !I1->isDereferenceableInvariantLoad())
3011 return MO.isReg() && MO.getReg().isPhysical();
3021 return I1->isIdenticalTo(*I2);
3029 if (
Builder.getTII().produceSameValue(*I1, *I2, &
MRI)) {
3036 return I1->findRegisterDefOperandIdx(InstAndDef1->Reg,
nullptr) ==
3048 return MaybeCst && MaybeCst->getBitWidth() <= 64 &&
3049 MaybeCst->getSExtValue() ==
C;
3056 std::optional<FPValueAndVReg> MaybeCst;
3060 return MaybeCst->Value.isExactlyValue(
C);
3064 unsigned OpIdx)
const {
3065 assert(
MI.getNumExplicitDefs() == 1 &&
"Expected one explicit def?");
3070 MI.eraseFromParent();
3075 assert(
MI.getNumExplicitDefs() == 1 &&
"Expected one explicit def?");
3079 MI.eraseFromParent();
3083 unsigned ConstIdx)
const {
3084 Register ConstReg =
MI.getOperand(ConstIdx).getReg();
3085 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
3097 assert((
MI.getOpcode() == TargetOpcode::G_FSHL ||
3098 MI.getOpcode() == TargetOpcode::G_FSHR) &&
3099 "This is not a funnel shift operation");
3101 Register ConstReg =
MI.getOperand(3).getReg();
3102 LLT ConstTy =
MRI.getType(ConstReg);
3103 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
3106 assert((VRegAndVal) &&
"Value is not a constant");
3109 APInt NewConst = VRegAndVal->Value.
urem(
3114 MI.getOpcode(), {MI.getOperand(0)},
3115 {MI.getOperand(1), MI.getOperand(2), NewConstInstr.getReg(0)});
3117 MI.eraseFromParent();
3121 assert(
MI.getOpcode() == TargetOpcode::G_SELECT);
3135 unsigned OpIdx)
const {
3137 return MO.
isReg() &&
3148 assert(
MI.getNumDefs() == 1 &&
"Expected only one def?");
3150 MI.eraseFromParent();
3155 assert(
MI.getNumDefs() == 1 &&
"Expected only one def?");
3157 MI.eraseFromParent();
3161 assert(
MI.getNumDefs() == 1 &&
"Expected only one def?");
3163 MI.eraseFromParent();
3168 assert(
MI.getNumDefs() == 1 &&
"Expected only one def?");
3170 MI.eraseFromParent();
3174 assert(
MI.getNumDefs() == 1 &&
"Expected only one def?");
3176 MI.eraseFromParent();
3180 MachineInstr &
MI, std::tuple<Register, Register> &MatchInfo)
const {
3183 Register &NewLHS = std::get<0>(MatchInfo);
3184 Register &NewRHS = std::get<1>(MatchInfo);
3192 NewLHS = MaybeNewLHS;
3196 return CheckFold(LHS, RHS) || CheckFold(RHS, LHS);
3201 assert(
MI.getOpcode() == TargetOpcode::G_INSERT_VECTOR_ELT &&
3204 LLT DstTy =
MRI.getType(DstReg);
3213 if (
MRI.hasOneUse(DstReg) &&
MRI.use_instr_begin(DstReg)->getOpcode() ==
3214 TargetOpcode::G_INSERT_VECTOR_ELT)
3220 MatchInfo.
resize(NumElts);
3224 if (IntImm >= NumElts || IntImm < 0)
3226 if (!MatchInfo[IntImm])
3227 MatchInfo[IntImm] = TmpReg;
3231 if (CurrInst->
getOpcode() == TargetOpcode::G_INSERT_VECTOR_ELT)
3233 if (TmpInst->
getOpcode() == TargetOpcode::G_BUILD_VECTOR) {
3242 return TmpInst->
getOpcode() == TargetOpcode::G_IMPLICIT_DEF ||
3249 auto GetUndef = [&]() {
3252 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
3260 Builder.buildBuildVector(
MI.getOperand(0).getReg(), MatchInfo);
3261 MI.eraseFromParent();
3265 MachineInstr &
MI, std::tuple<Register, Register> &MatchInfo)
const {
3267 std::tie(SubLHS, SubRHS) = MatchInfo;
3268 Builder.buildSub(
MI.getOperand(0).getReg(), SubLHS, SubRHS);
3269 MI.eraseFromParent();
3282 unsigned InnerOpc = InnerDef->
getOpcode();
3283 if (InnerOpc != TargetOpcode::G_ADD && InnerOpc != TargetOpcode::G_SUB)
3307 if (!TryMatch(InnerLHS, InnerRHS) &&
3308 !(InnerOpc == TargetOpcode::G_ADD && TryMatch(InnerRHS, InnerLHS)))
3312 unsigned FlippedOpc = (InnerOpc == TargetOpcode::G_ADD) ? TargetOpcode::G_SUB
3313 : TargetOpcode::G_ADD;
3316 MatchInfo = [=](MachineIRBuilder &
Builder) {
3317 auto NewInner =
Builder.buildInstr(FlippedOpc, {Ty}, {
B,
C});
3318 auto NewNot =
Builder.buildNot(Ty, NewInner);
3319 Builder.buildInstr(RootOpc, {Dst}, {
A, NewNot});
3331 unsigned RootOpc =
MI.getOpcode();
3333 LLT Ty =
MRI.getType(Dst);
3338 return matchBinopWithNegInner(LHS, RHS, RootOpc, Dst, Ty, MatchInfo) ||
3339 matchBinopWithNegInner(RHS, LHS, RootOpc, Dst, Ty, MatchInfo);
3350 unsigned LogicOpcode =
MI.getOpcode();
3351 assert(LogicOpcode == TargetOpcode::G_AND ||
3352 LogicOpcode == TargetOpcode::G_OR ||
3353 LogicOpcode == TargetOpcode::G_XOR);
3360 if (!
MRI.hasOneNonDBGUse(LHSReg) || !
MRI.hasOneNonDBGUse(RHSReg))
3366 if (!LeftHandInst || !RightHandInst)
3368 unsigned HandOpcode = LeftHandInst->
getOpcode();
3369 if (HandOpcode != RightHandInst->
getOpcode())
3383 if (!XTy.
isValid() || XTy != YTy)
3388 switch (HandOpcode) {
3391 case TargetOpcode::G_ANYEXT:
3392 case TargetOpcode::G_SEXT:
3393 case TargetOpcode::G_ZEXT: {
3397 case TargetOpcode::G_TRUNC: {
3402 LLT DstTy =
MRI.getType(Dst);
3411 case TargetOpcode::G_AND:
3412 case TargetOpcode::G_ASHR:
3413 case TargetOpcode::G_LSHR:
3414 case TargetOpcode::G_SHL: {
3419 ExtraHandOpSrcReg = ZOp.
getReg();
3430 auto NewLogicDst =
MRI.createGenericVirtualRegister(XTy);
3441 if (ExtraHandOpSrcReg.
isValid())
3453 "Expected at least one instr to build?");
3455 assert(InstrToBuild.Opcode &&
"Expected a valid opcode?");
3456 assert(InstrToBuild.OperandFns.size() &&
"Expected at least one operand?");
3458 for (
auto &OperandFn : InstrToBuild.OperandFns)
3461 MI.eraseFromParent();
3465 MachineInstr &
MI, std::tuple<Register, int64_t> &MatchInfo)
const {
3466 assert(
MI.getOpcode() == TargetOpcode::G_ASHR);
3467 int64_t ShlCst, AshrCst;
3473 if (ShlCst != AshrCst)
3476 {TargetOpcode::G_SEXT_INREG, {
MRI.getType(Src)}}))
3478 MatchInfo = std::make_tuple(Src, ShlCst);
3483 MachineInstr &
MI, std::tuple<Register, int64_t> &MatchInfo)
const {
3484 assert(
MI.getOpcode() == TargetOpcode::G_ASHR);
3487 std::tie(Src, ShiftAmt) = MatchInfo;
3488 unsigned Size =
MRI.getType(Src).getScalarSizeInBits();
3489 Builder.buildSExtInReg(
MI.getOperand(0).getReg(), Src,
Size - ShiftAmt);
3490 MI.eraseFromParent();
3497 assert(
MI.getOpcode() == TargetOpcode::G_AND);
3500 LLT Ty =
MRI.getType(Dst);
3512 B.buildAnd(Dst, R,
B.buildConstant(Ty, C1 & C2));
3515 auto Zero =
B.buildConstant(Ty, 0);
3538 assert(
MI.getOpcode() == TargetOpcode::G_AND);
3562 (LHSBits.
Zero | RHSBits.
One).isAllOnes()) {
3569 (LHSBits.
One | RHSBits.
Zero).isAllOnes()) {
3586 assert(
MI.getOpcode() == TargetOpcode::G_OR);
3604 (LHSBits.
One | RHSBits.
Zero).isAllOnes()) {
3611 (LHSBits.
Zero | RHSBits.
One).isAllOnes()) {
3622 unsigned ExtBits =
MI.getOperand(2).getImm();
3623 unsigned TypeSize =
MRI.getType(Src).getScalarSizeInBits();
3624 return VT->computeNumSignBits(Src) >= (
TypeSize - ExtBits + 1);
3628 int64_t Cst,
bool IsVector,
bool IsFP) {
3630 return (ScalarSizeBits == 1 && Cst == -1) ||
3652 unsigned BuildUseCount = BV.getNumSources();
3653 if (BuildUseCount % 2 != 0)
3656 unsigned NumUnmerge = BuildUseCount / 2;
3662 if (!Unmerge || Unmerge->getNumDefs() != NumUnmerge)
3665 UnmergeSrc = Unmerge->getSourceReg();
3667 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
3668 LLT UnmergeSrcTy =
MRI.getType(UnmergeSrc);
3675 !
isLegal({TargetOpcode::G_CONCAT_VECTORS, {DstTy, UnmergeSrcTy}}))
3680 for (
unsigned I = 0;
I < NumUnmerge; ++
I) {
3681 auto MaybeUnmergeReg = BV.getSourceReg(
I);
3684 if (!LoopUnmerge || LoopUnmerge != Unmerge)
3687 if (LoopUnmerge->getOperand(
I).getReg() != MaybeUnmergeReg)
3692 if (Unmerge->getNumDefs() != NumUnmerge)
3696 for (
unsigned I = NumUnmerge;
I < BuildUseCount; ++
I) {
3699 if (
Undef->getOpcode() != TargetOpcode::G_IMPLICIT_DEF)
3710 assert(UnmergeSrc &&
"Expected there to be one matching G_UNMERGE_VALUES");
3711 B.setInstrAndDebugLoc(
MI);
3713 Register UndefVec =
B.buildUndef(
MRI.getType(UnmergeSrc)).getReg(0);
3714 B.buildConcatVectors(
MI.getOperand(0), {UnmergeSrc, UndefVec});
3716 MI.eraseFromParent();
3738 unsigned NumOperands =
BuildMI->getNumSources();
3748 for (
I = 0;
I < NumOperands; ++
I) {
3749 auto SrcMI =
MRI.getVRegDef(
BuildMI->getSourceReg(
I));
3750 auto SrcMIOpc = SrcMI->getOpcode();
3753 if (SrcMIOpc == TargetOpcode::G_TRUNC) {
3754 Register TruncSrcReg = SrcMI->getOperand(1).getReg();
3756 UnmergeMI =
MRI.getVRegDef(TruncSrcReg);
3757 if (UnmergeMI->
getOpcode() != TargetOpcode::G_UNMERGE_VALUES)
3760 auto UnmergeSrcMI =
MRI.getVRegDef(TruncSrcReg);
3761 if (UnmergeMI != UnmergeSrcMI)
3776 for (;
I < NumOperands; ++
I) {
3777 auto SrcMI =
MRI.getVRegDef(
BuildMI->getSourceReg(
I));
3778 auto SrcMIOpc = SrcMI->getOpcode();
3780 if (SrcMIOpc != TargetOpcode::G_IMPLICIT_DEF)
3786 LLT UnmergeSrcTy =
MRI.getType(MatchInfo);
3793 LLT UnmergeDstEltTy =
MRI.getType(UnmergeDstReg);
3794 if (UnmergeSrcEltTy != UnmergeDstEltTy)
3802 !
isLegal({TargetOpcode::G_CONCAT_VECTORS, {MidTy, UnmergeSrcTy}}))
3805 if (!
isLegal({TargetOpcode::G_TRUNC, {DstTy, MidTy}}))
3817 LLT DstTy =
MRI.getType(DstReg);
3818 LLT UnmergeSrcTy =
MRI.getType(MatchInfo);
3823 if (DstTyNumElt / UnmergeSrcTyNumElt == 1) {
3828 for (
unsigned I = 1;
I < DstTyNumElt / UnmergeSrcTyNumElt; ++
I)
3832 MidReg =
Builder.buildConcatVectors(MidTy, ConcatRegs).getReg(0);
3835 Builder.buildTrunc(DstReg, MidReg);
3836 MI.eraseFromParent();
3841 assert(
MI.getOpcode() == TargetOpcode::G_XOR);
3842 LLT Ty =
MRI.getType(
MI.getOperand(0).getReg());
3843 const auto &TLI = *
Builder.getMF().getSubtarget().getTargetLowering();
3851 if (!
MRI.hasOneNonDBGUse(XorSrc))
3861 for (
unsigned I = 0;
I < RegsToNegate.
size(); ++
I) {
3863 if (!
MRI.hasOneNonDBGUse(Reg))
3866 switch (Def->getOpcode()) {
3871 case TargetOpcode::G_ICMP:
3877 case TargetOpcode::G_FCMP:
3883 case TargetOpcode::G_AND:
3884 case TargetOpcode::G_OR:
3890 RegsToNegate.
push_back(Def->getOperand(1).getReg());
3891 RegsToNegate.
push_back(Def->getOperand(2).getReg());
3899 if (Ty.isVector()) {
3904 if (!
isConstValidTrue(TLI, Ty.getScalarSizeInBits(), *MaybeCst,
true, IsFP))
3918 for (
Register Reg : RegsToNegate) {
3923 switch (Def->getOpcode()) {
3926 case TargetOpcode::G_ICMP:
3927 case TargetOpcode::G_FCMP: {
3934 case TargetOpcode::G_AND:
3935 Def->setDesc(
Builder.getTII().get(TargetOpcode::G_OR));
3937 case TargetOpcode::G_OR:
3938 Def->setDesc(
Builder.getTII().get(TargetOpcode::G_AND));
3945 MI.eraseFromParent();
3949 MachineInstr &
MI, std::pair<Register, Register> &MatchInfo)
const {
3951 assert(
MI.getOpcode() == TargetOpcode::G_XOR);
3955 Register SharedReg =
MI.getOperand(2).getReg();
3969 if (!
MRI.hasOneNonDBGUse(AndReg))
3976 return Y == SharedReg;
3980 MachineInstr &
MI, std::pair<Register, Register> &MatchInfo)
const {
3983 std::tie(
X,
Y) = MatchInfo;
3986 MI.setDesc(
Builder.getTII().get(TargetOpcode::G_AND));
3987 MI.getOperand(1).setReg(Not->getOperand(0).getReg());
3988 MI.getOperand(2).setReg(
Y);
3994 Register DstReg = PtrAdd.getReg(0);
3995 LLT Ty =
MRI.getType(DstReg);
3998 if (
DL.isNonIntegralAddressSpace(Ty.getScalarType().getAddressSpace()))
4001 if (Ty.isPointer()) {
4003 return ConstVal && *ConstVal == 0;
4006 assert(Ty.isVector() &&
"Expecting a vector type");
4013 Builder.buildIntToPtr(PtrAdd.getReg(0), PtrAdd.getOffsetReg());
4014 PtrAdd.eraseFromParent();
4021 Register Pow2Src1 =
MI.getOperand(2).getReg();
4022 LLT Ty =
MRI.getType(DstReg);
4025 auto NegOne =
Builder.buildConstant(Ty, -1);
4026 auto Add =
Builder.buildAdd(Ty, Pow2Src1, NegOne);
4028 MI.eraseFromParent();
4032 unsigned &SelectOpNo)
const {
4042 if (
Select->getOpcode() != TargetOpcode::G_SELECT ||
4043 !
MRI.hasOneNonDBGUse(LHS)) {
4044 OtherOperandReg = LHS;
4047 if (
Select->getOpcode() != TargetOpcode::G_SELECT ||
4048 !
MRI.hasOneNonDBGUse(RHS))
4064 unsigned BinOpcode =
MI.getOpcode();
4069 bool CanFoldNonConst =
4070 (BinOpcode == TargetOpcode::G_AND || BinOpcode == TargetOpcode::G_OR) &&
4075 if (CanFoldNonConst)
4096 LLT Ty =
MRI.getType(Dst);
4097 unsigned BinOpcode =
MI.getOpcode();
4104 if (SelectOperand == 1) {
4108 FoldTrue =
Builder.buildInstr(BinOpcode, {Ty}, {SelectTrue, RHS}).
getReg(0);
4110 Builder.buildInstr(BinOpcode, {Ty}, {SelectFalse, RHS}).
getReg(0);
4112 FoldTrue =
Builder.buildInstr(BinOpcode, {Ty}, {LHS, SelectTrue}).
getReg(0);
4114 Builder.buildInstr(BinOpcode, {Ty}, {LHS, SelectFalse}).
getReg(0);
4117 Builder.buildSelect(Dst, SelectCond, FoldTrue, FoldFalse,
MI.getFlags());
4118 MI.eraseFromParent();
4121std::optional<SmallVector<Register, 8>>
4122CombinerHelper::findCandidatesForLoadOrCombine(
const MachineInstr *Root)
const {
4123 assert(Root->
getOpcode() == TargetOpcode::G_OR &&
"Expected G_OR only!");
4152 const unsigned MaxIter =
4154 for (
unsigned Iter = 0; Iter < MaxIter; ++Iter) {
4163 return std::nullopt;
4179 if (RegsToVisit.
empty() || RegsToVisit.
size() % 2 != 0)
4180 return std::nullopt;
4192static std::optional<std::pair<GZExtLoad *, int64_t>>
4196 "Expected Reg to only have one non-debug use?");
4205 if (Shift % MemSizeInBits != 0)
4206 return std::nullopt;
4211 return std::nullopt;
4213 if (!Load->isUnordered() || Load->getMemSizeInBits() != MemSizeInBits)
4214 return std::nullopt;
4216 return std::make_pair(Load, Shift / MemSizeInBits);
4219std::optional<std::tuple<GZExtLoad *, int64_t, GZExtLoad *>>
4220CombinerHelper::findLoadOffsetsForLoadOrCombine(
4223 const unsigned MemSizeInBits)
const {
4226 SmallSetVector<const MachineInstr *, 8> Loads;
4232 GZExtLoad *LowestIdxLoad =
nullptr;
4235 SmallSet<int64_t, 8> SeenIdx;
4239 MachineBasicBlock *
MBB =
nullptr;
4240 const MachineMemOperand *MMO =
nullptr;
4243 GZExtLoad *EarliestLoad =
nullptr;
4246 GZExtLoad *LatestLoad =
nullptr;
4255 for (
auto Reg : RegsToVisit) {
4260 return std::nullopt;
4263 std::tie(Load, DstPos) = *LoadAndPos;
4267 MachineBasicBlock *LoadMBB =
Load->getParent();
4271 return std::nullopt;
4274 auto &LoadMMO =
Load->getMMO();
4278 return std::nullopt;
4285 LoadPtr =
Load->getOperand(1).getReg();
4290 if (!SeenIdx.
insert(Idx).second)
4291 return std::nullopt;
4298 if (BasePtr != LoadPtr)
4299 return std::nullopt;
4301 if (Idx < LowestIdx) {
4303 LowestIdxLoad =
Load;
4310 if (!MemOffset2Idx.
try_emplace(DstPos, Idx).second)
4311 return std::nullopt;
4319 if (!EarliestLoad ||
dominates(*Load, *EarliestLoad))
4320 EarliestLoad =
Load;
4321 if (!LatestLoad ||
dominates(*LatestLoad, *Load))
4328 "Expected to find a load for each register?");
4329 assert(EarliestLoad != LatestLoad && EarliestLoad &&
4330 LatestLoad &&
"Expected at least two loads?");
4339 const unsigned MaxIter = 20;
4345 if (
MI.isLoadFoldBarrier())
4346 return std::nullopt;
4347 if (Iter++ == MaxIter)
4348 return std::nullopt;
4351 return std::make_tuple(LowestIdxLoad, LowestIdx, LatestLoad);
4357 assert(
MI.getOpcode() == TargetOpcode::G_OR);
4370 LLT Ty =
MRI.getType(Dst);
4376 const unsigned WideMemSizeInBits = Ty.getSizeInBits();
4377 if (WideMemSizeInBits < 16 || WideMemSizeInBits % 8 != 0)
4381 auto RegsToVisit = findCandidatesForLoadOrCombine(&
MI);
4388 const unsigned NarrowMemSizeInBits = WideMemSizeInBits / RegsToVisit->size();
4389 if (NarrowMemSizeInBits % 8 != 0)
4402 auto MaybeLoadInfo = findLoadOffsetsForLoadOrCombine(
4403 MemOffset2Idx, *RegsToVisit, NarrowMemSizeInBits);
4406 std::tie(LowestIdxLoad, LowestIdx, LatestLoad) = *MaybeLoadInfo;
4413 std::optional<bool> IsBigEndian =
isBigEndian(MemOffset2Idx, LowestIdx);
4416 bool NeedsBSwap = IsBigEndianTarget != *IsBigEndian;
4428 const unsigned NumLoadsInTy = WideMemSizeInBits / NarrowMemSizeInBits;
4429 const unsigned ZeroByteOffset =
4433 auto ZeroOffsetIdx = MemOffset2Idx.
find(ZeroByteOffset);
4434 if (ZeroOffsetIdx == MemOffset2Idx.
end() ||
4435 ZeroOffsetIdx->second != LowestIdx)
4445 {TargetOpcode::G_LOAD, {Ty,
MRI.getType(Ptr)}, {MMDesc}}))
4459 MIB.setInstrAndDebugLoc(*LatestLoad);
4460 Register LoadDst = NeedsBSwap ?
MRI.cloneVirtualRegister(Dst) : Dst;
4461 MIB.buildLoad(LoadDst, Ptr, *NewMMO);
4463 MIB.buildBSwap(Dst, LoadDst);
4475 if (
MRI.getType(DstReg).isVector())
4479 if (!
MRI.hasOneNonDBGUse(DstReg))
4481 ExtMI = &*
MRI.use_instr_nodbg_begin(DstReg);
4483 case TargetOpcode::G_ANYEXT:
4485 case TargetOpcode::G_ZEXT:
4486 case TargetOpcode::G_SEXT:
4493 if (
Builder.getTII().isExtendLikelyToBeFolded(*ExtMI,
MRI))
4500 for (
unsigned I = 0;
I <
PHI.getNumIncomingValues(); ++
I) {
4502 switch (
DefMI->getOpcode()) {
4503 case TargetOpcode::G_LOAD:
4504 case TargetOpcode::G_TRUNC:
4505 case TargetOpcode::G_SEXT:
4506 case TargetOpcode::G_ZEXT:
4507 case TargetOpcode::G_ANYEXT:
4508 case TargetOpcode::G_CONSTANT:
4512 if (InSrcs.
size() > 2)
4526 LLT ExtTy =
MRI.getType(DstReg);
4533 for (
unsigned I = 0;
I <
PHI.getNumIncomingValues(); ++
I) {
4534 auto SrcReg =
PHI.getIncomingValue(
I);
4535 auto *SrcMI =
MRI.getVRegDef(SrcReg);
4536 if (!SrcMIs.
insert(SrcMI))
4540 auto *
MBB = SrcMI->getParent();
4542 if (InsertPt !=
MBB->end() && InsertPt->isPHI())
4543 InsertPt =
MBB->getFirstNonPHI();
4545 Builder.setInsertPt(*SrcMI->getParent(), InsertPt);
4548 OldToNewSrcMap[SrcMI] = NewExt;
4553 auto NewPhi =
Builder.buildInstrNoInsert(TargetOpcode::G_PHI);
4554 NewPhi.addDef(DstReg);
4557 NewPhi.addMBB(MO.getMBB());
4560 auto *NewSrc = OldToNewSrcMap[
MRI.getVRegDef(MO.getReg())];
4561 NewPhi.addUse(NewSrc->getOperand(0).getReg());
4569 assert(
MI.getOpcode() == TargetOpcode::G_EXTRACT_VECTOR_ELT);
4573 LLT SrcTy =
MRI.getType(SrcVec);
4574 if (SrcTy.isScalableVector())
4578 if (!Cst || Cst->Value.getZExtValue() >= SrcTy.getNumElements())
4581 unsigned VecIdx = Cst->Value.getZExtValue();
4586 if (SrcVecMI->
getOpcode() == TargetOpcode::G_TRUNC) {
4590 if (SrcVecMI->
getOpcode() != TargetOpcode::G_BUILD_VECTOR &&
4591 SrcVecMI->
getOpcode() != TargetOpcode::G_BUILD_VECTOR_TRUNC)
4595 if (!
MRI.hasOneNonDBGUse(SrcVec) &&
4607 LLT ScalarTy =
MRI.getType(Reg);
4609 LLT DstTy =
MRI.getType(DstReg);
4611 if (ScalarTy != DstTy) {
4613 Builder.buildTrunc(DstReg, Reg);
4614 MI.eraseFromParent();
4622 SmallVectorImpl<std::pair<Register, MachineInstr *>> &SrcDstPairs)
const {
4623 assert(
MI.getOpcode() == TargetOpcode::G_BUILD_VECTOR);
4641 LLT DstTy =
MRI.getType(DstReg);
4646 if (
II.getOpcode() != TargetOpcode::G_EXTRACT_VECTOR_ELT)
4651 unsigned Idx = Cst->getZExtValue();
4654 ExtractedElts.
set(Idx);
4655 SrcDstPairs.emplace_back(
4656 std::make_pair(
MI.getOperand(Idx + 1).getReg(), &
II));
4659 return ExtractedElts.
all();
4664 SmallVectorImpl<std::pair<Register, MachineInstr *>> &SrcDstPairs)
const {
4665 assert(
MI.getOpcode() == TargetOpcode::G_BUILD_VECTOR);
4666 for (
auto &Pair : SrcDstPairs) {
4667 auto *ExtMI = Pair.second;
4669 ExtMI->eraseFromParent();
4671 MI.eraseFromParent();
4678 MI.eraseFromParent();
4688 bool AllowScalarConstants,
4690 assert(
MI.getOpcode() == TargetOpcode::G_OR);
4693 LLT Ty =
MRI.getType(Dst);
4694 unsigned BitWidth = Ty.getScalarSizeInBits();
4696 Register ShlSrc, ShlAmt, LShrSrc, LShrAmt, Amt;
4697 unsigned FshOpc = 0;
4708 int64_t CstShlAmt = 0, CstLShrAmt;
4711 CstShlAmt + CstLShrAmt ==
BitWidth) {
4712 FshOpc = TargetOpcode::G_FSHR;
4718 FshOpc = TargetOpcode::G_FSHL;
4723 FshOpc = TargetOpcode::G_FSHR;
4728 LLT AmtTy =
MRI.getType(Amt);
4730 (!AllowScalarConstants || CstShlAmt == 0 || !Ty.isScalar()))
4734 B.buildInstr(FshOpc, {Dst}, {ShlSrc, LShrSrc, Amt});
4741 unsigned Opc =
MI.getOpcode();
4742 assert(
Opc == TargetOpcode::G_FSHL ||
Opc == TargetOpcode::G_FSHR);
4747 unsigned RotateOpc =
4748 Opc == TargetOpcode::G_FSHL ? TargetOpcode::G_ROTL : TargetOpcode::G_ROTR;
4753 unsigned Opc =
MI.getOpcode();
4754 assert(
Opc == TargetOpcode::G_FSHL ||
Opc == TargetOpcode::G_FSHR);
4755 bool IsFSHL =
Opc == TargetOpcode::G_FSHL;
4757 MI.setDesc(
Builder.getTII().get(IsFSHL ? TargetOpcode::G_ROTL
4758 : TargetOpcode::G_ROTR));
4759 MI.removeOperand(2);
4765 assert(
MI.getOpcode() == TargetOpcode::G_ROTL ||
4766 MI.getOpcode() == TargetOpcode::G_ROTR);
4768 MRI.getType(
MI.getOperand(0).getReg()).getScalarSizeInBits();
4770 bool OutOfRange =
false;
4771 auto MatchOutOfRange = [Bitsize, &OutOfRange](
const Constant *
C) {
4773 OutOfRange |= CI->getValue().uge(Bitsize);
4780 assert(
MI.getOpcode() == TargetOpcode::G_ROTL ||
4781 MI.getOpcode() == TargetOpcode::G_ROTR);
4783 MRI.getType(
MI.getOperand(0).getReg()).getScalarSizeInBits();
4785 LLT AmtTy =
MRI.getType(Amt);
4786 auto Bits =
Builder.buildConstant(AmtTy, Bitsize);
4787 Amt =
Builder.buildURem(AmtTy,
MI.getOperand(2).getReg(), Bits).getReg(0);
4789 MI.getOperand(2).setReg(Amt);
4794 int64_t &MatchInfo)
const {
4795 assert(
MI.getOpcode() == TargetOpcode::G_ICMP);
4806 auto KnownRHS =
VT->getKnownBits(
MI.getOperand(3).getReg());
4807 if (KnownRHS.isUnknown())
4810 std::optional<bool> KnownVal;
4811 if (KnownRHS.isZero()) {
4821 auto KnownLHS =
VT->getKnownBits(
MI.getOperand(2).getReg());
4831 MRI.getType(
MI.getOperand(0).getReg()).isVector(),
4840 assert(
MI.getOpcode() == TargetOpcode::G_ICMP);
4856 LLT DstTy =
MRI.getType(Dst);
4864 auto KnownLHS =
VT->getKnownBits(LHS);
4865 if (KnownLHS.getMinValue() != 0 || KnownLHS.getMaxValue() != 1)
4868 LLT LHSTy =
MRI.getType(LHS);
4871 unsigned Op = TargetOpcode::COPY;
4872 if (DstSize != LHSSize)
4873 Op = DstSize < LHSSize ? TargetOpcode::G_TRUNC : TargetOpcode::G_ZEXT;
4884 assert(
MI.getOpcode() == TargetOpcode::G_AND);
4888 LLT Ty =
MRI.getType(
MI.getOperand(0).getReg());
4894 int64_t AndMaskBits;
4902 if (AndMaskBits & OrMaskBits)
4908 if (
MI.getOperand(1).getReg() == AndMaskReg)
4909 MI.getOperand(2).setReg(AndMaskReg);
4910 MI.getOperand(1).setReg(Src);
4920 assert(
MI.getOpcode() == TargetOpcode::G_SEXT_INREG);
4923 LLT Ty =
MRI.getType(Src);
4925 if (!
LI || !
LI->isLegalOrCustom({TargetOpcode::G_SBFX, {Ty, ExtractTy}}))
4927 int64_t Width =
MI.getOperand(2).getImm();
4935 if (ShiftImm < 0 || ShiftImm + Width > Ty.getScalarSizeInBits())
4939 auto Cst1 =
B.buildConstant(ExtractTy, ShiftImm);
4940 auto Cst2 =
B.buildConstant(ExtractTy, Width);
4941 B.buildSbfx(Dst, ShiftSrc, Cst1, Cst2);
4951 LLT Ty =
MRI.getType(Dst);
4955 if (
LI && !
LI->isLegalOrCustom({TargetOpcode::G_UBFX, {Ty, ExtractTy}}))
4958 int64_t AndImm, LSBImm;
4960 const unsigned Size = Ty.getScalarSizeInBits();
4967 auto MaybeMask =
static_cast<uint64_t>(AndImm);
4968 if (MaybeMask & (MaybeMask + 1))
4977 auto WidthCst =
B.buildConstant(ExtractTy, Width);
4978 auto LSBCst =
B.buildConstant(ExtractTy, LSBImm);
4979 B.buildInstr(TargetOpcode::G_UBFX, {Dst}, {ShiftSrc, LSBCst, WidthCst});
4987 const unsigned Opcode =
MI.getOpcode();
4988 assert(Opcode == TargetOpcode::G_ASHR || Opcode == TargetOpcode::G_LSHR);
4990 const Register Dst =
MI.getOperand(0).getReg();
4992 const unsigned ExtrOpcode = Opcode == TargetOpcode::G_ASHR
4993 ? TargetOpcode::G_SBFX
4994 : TargetOpcode::G_UBFX;
4997 LLT Ty =
MRI.getType(Dst);
4999 if (!
LI || !
LI->isLegalOrCustom({ExtrOpcode, {Ty, ExtractTy}}))
5005 const unsigned Size = Ty.getScalarSizeInBits();
5015 if (ShlAmt < 0 || ShlAmt > ShrAmt || ShrAmt >=
Size)
5019 if (Opcode == TargetOpcode::G_ASHR && ShlAmt == ShrAmt)
5023 const int64_t Pos = ShrAmt - ShlAmt;
5024 const int64_t Width =
Size - ShrAmt;
5027 auto WidthCst =
B.buildConstant(ExtractTy, Width);
5028 auto PosCst =
B.buildConstant(ExtractTy, Pos);
5029 B.buildInstr(ExtrOpcode, {Dst}, {ShlSrc, PosCst, WidthCst});
5037 const unsigned Opcode =
MI.getOpcode();
5038 assert(Opcode == TargetOpcode::G_LSHR || Opcode == TargetOpcode::G_ASHR);
5040 const Register Dst =
MI.getOperand(0).getReg();
5041 LLT Ty =
MRI.getType(Dst);
5043 if (
LI && !
LI->isLegalOrCustom({TargetOpcode::G_UBFX, {Ty, ExtractTy}}))
5056 const unsigned Size = Ty.getScalarSizeInBits();
5057 if (ShrAmt < 0 || ShrAmt >=
Size)
5061 if (0 == (SMask >> ShrAmt)) {
5063 B.buildConstant(Dst, 0);
5069 uint64_t UMask = SMask;
5076 const int64_t Pos = ShrAmt;
5081 if (Opcode == TargetOpcode::G_ASHR && Width + ShrAmt ==
Size)
5085 auto WidthCst =
B.buildConstant(ExtractTy, Width);
5086 auto PosCst =
B.buildConstant(ExtractTy, Pos);
5087 B.buildInstr(TargetOpcode::G_UBFX, {Dst}, {AndSrc, PosCst, WidthCst});
5092bool CombinerHelper::reassociationCanBreakAddressingModePattern(
5096 Register Src1Reg = PtrAdd.getBaseReg();
5101 Register Src2Reg = PtrAdd.getOffsetReg();
5103 if (
MRI.hasOneNonDBGUse(Src1Reg))
5113 const APInt &C1APIntVal = *C1;
5114 const APInt &C2APIntVal = *C2;
5115 const int64_t CombinedValue = (C1APIntVal + C2APIntVal).getSExtValue();
5117 for (
auto &
UseMI :
MRI.use_nodbg_instructions(PtrAdd.getReg(0))) {
5120 MachineInstr *ConvUseMI = &
UseMI;
5121 unsigned ConvUseOpc = ConvUseMI->
getOpcode();
5122 while (ConvUseOpc == TargetOpcode::G_INTTOPTR ||
5123 ConvUseOpc == TargetOpcode::G_PTRTOINT) {
5125 if (!
MRI.hasOneNonDBGUse(DefReg))
5127 ConvUseMI = &*
MRI.use_instr_nodbg_begin(DefReg);
5136 TargetLoweringBase::AddrMode AM;
5139 unsigned AS =
MRI.getType(LdStMI->getPointerReg()).getAddressSpace();
5141 PtrAdd.getMF()->getFunction().getContext());
5142 const auto &TLI = *PtrAdd.getMF()->getSubtarget().getTargetLowering();
5143 if (!TLI.isLegalAddressingMode(PtrAdd.getMF()->getDataLayout(), AM,
5149 if (!TLI.isLegalAddressingMode(PtrAdd.getMF()->getDataLayout(), AM,
5161 Register Src1Reg =
MI.getOperand(1).getReg();
5162 if (RHS->getOpcode() != TargetOpcode::G_ADD)
5174 unsigned PtrAddFlags =
MI.getFlags();
5175 unsigned AddFlags = RHS->getFlags();
5188 LLT PtrTy =
MRI.getType(
MI.getOperand(0).getReg());
5191 Builder.buildPtrAdd(PtrTy, Src1Reg, RHS->getOperand(1).getReg(), Flags);
5193 MI.getOperand(1).setReg(NewBase.getReg(0));
5194 MI.getOperand(2).setReg(RHS->getOperand(2).getReg());
5198 return !reassociationCanBreakAddressingModePattern(
MI);
5208 std::optional<ValueAndVReg> LHSCstOff;
5218 unsigned PtrAddFlags =
MI.getFlags();
5219 unsigned LHSPtrAddFlags = LHSPtrAdd->getFlags();
5221 bool IsNoUSWrap = IsNoUWrap && (PtrAddFlags & LHSPtrAddFlags &
5223 bool IsInBounds = IsNoUWrap && (PtrAddFlags & LHSPtrAddFlags &
5237 LHSPtrAdd->moveBefore(&
MI);
5240 auto NewCst =
B.buildConstant(
MRI.getType(RHSReg), LHSCstOff->Value);
5242 MI.getOperand(2).setReg(NewCst.getReg(0));
5245 Observer.changingInstr(*LHSPtrAdd);
5246 LHSPtrAdd->getOperand(2).setReg(RHSReg);
5247 LHSPtrAdd->setFlags(Flags);
5250 return !reassociationCanBreakAddressingModePattern(
MI);
5261 Register Src2Reg =
MI.getOperand(2).getReg();
5262 Register LHSSrc1 = LHSPtrAdd->getBaseReg();
5263 Register LHSSrc2 = LHSPtrAdd->getOffsetReg();
5276 unsigned PtrAddFlags =
MI.getFlags();
5277 unsigned LHSPtrAddFlags = LHSPtrAdd->getFlags();
5290 auto NewCst =
B.buildConstant(
MRI.getType(Src2Reg), *C1 + *C2);
5292 MI.getOperand(1).setReg(LHSSrc1);
5293 MI.getOperand(2).setReg(NewCst.getReg(0));
5297 return !reassociationCanBreakAddressingModePattern(
MI);
5335 LLT OpRHSTy =
MRI.getType(OpRHS);
5354 auto NewCst =
B.buildInstr(
Opc, {OpRHSTy}, {OpLHSRHS, OpRHS});
5355 B.buildInstr(
Opc, {DstReg}, {OpLHSLHS, NewCst});
5363 auto NewLHSLHS =
B.buildInstr(
Opc, {OpRHSTy}, {OpLHSLHS, OpRHS});
5364 B.buildInstr(
Opc, {DstReg}, {NewLHSLHS, OpLHSRHS});
5377 unsigned Opc =
MI.getOpcode();
5390 APInt &MatchInfo)
const {
5391 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
5395 MatchInfo = *MaybeCst;
5406 MI.getOperand(1).getReg(),
MRI);
5411 if (Csts.size() == 1)
5412 B.buildConstant(Dst, Csts[0]);
5414 B.buildBuildVectorConstant(Dst, Csts);
5420 APInt &MatchInfo)
const {
5426 MatchInfo = *MaybeCst;
5438 ConstantFP::get(
MI.getMF()->getFunction().getContext(), *MaybeCst);
5444 assert(
MI.getOpcode() == TargetOpcode::G_FMA ||
5445 MI.getOpcode() == TargetOpcode::G_FMAD);
5446 auto [
_, Op1, Op2, Op3] =
MI.getFirst4Regs();
5463 MatchInfo = ConstantFP::get(
MI.getMF()->getFunction().getContext(), Op1F);
5486 assert(
MI.getOpcode() == TargetOpcode::G_AND);
5490 LLT WideTy =
MRI.getType(Dst);
5494 if (!WideTy.
isScalar() || !
MRI.hasOneNonDBGUse(AndLHS))
5510 case TargetOpcode::G_ADD:
5511 case TargetOpcode::G_SUB:
5512 case TargetOpcode::G_MUL:
5513 case TargetOpcode::G_AND:
5514 case TargetOpcode::G_OR:
5515 case TargetOpcode::G_XOR:
5523 auto Mask = Cst->Value;
5528 unsigned NarrowWidth = Mask.countr_one();
5534 auto &MF = *
MI.getMF();
5537 if (!TLI.isTruncateFree(WideTy, NarrowTy, Ctx) ||
5538 !TLI.isZExtFree(NarrowTy, WideTy, Ctx))
5546 auto NarrowLHS =
Builder.buildTrunc(NarrowTy, BinOpLHS);
5547 auto NarrowRHS =
Builder.buildTrunc(NarrowTy, BinOpRHS);
5549 Builder.buildInstr(LHSOpc, {NarrowTy}, {NarrowLHS, NarrowRHS});
5550 auto Ext =
Builder.buildZExt(WideTy, NarrowBinOp);
5552 MI.getOperand(1).setReg(Ext.getReg(0));
5560 unsigned Opc =
MI.getOpcode();
5561 assert(
Opc == TargetOpcode::G_UMULO ||
Opc == TargetOpcode::G_SMULO);
5568 unsigned NewOpc =
Opc == TargetOpcode::G_UMULO ? TargetOpcode::G_UADDO
5569 : TargetOpcode::G_SADDO;
5570 MI.setDesc(
Builder.getTII().get(NewOpc));
5571 MI.getOperand(3).setReg(
MI.getOperand(2).getReg());
5580 assert(
MI.getOpcode() == TargetOpcode::G_UMULO ||
5581 MI.getOpcode() == TargetOpcode::G_SMULO);
5590 B.buildConstant(Dst, 0);
5591 B.buildConstant(Carry, 0);
5600 assert(
MI.getOpcode() == TargetOpcode::G_UADDE ||
5601 MI.getOpcode() == TargetOpcode::G_SADDE ||
5602 MI.getOpcode() == TargetOpcode::G_USUBE ||
5603 MI.getOpcode() == TargetOpcode::G_SSUBE);
5608 switch (
MI.getOpcode()) {
5609 case TargetOpcode::G_UADDE:
5610 NewOpcode = TargetOpcode::G_UADDO;
5612 case TargetOpcode::G_SADDE:
5613 NewOpcode = TargetOpcode::G_SADDO;
5615 case TargetOpcode::G_USUBE:
5616 NewOpcode = TargetOpcode::G_USUBO;
5618 case TargetOpcode::G_SSUBE:
5619 NewOpcode = TargetOpcode::G_SSUBO;
5623 MI.setDesc(
B.getTII().get(NewOpcode));
5624 MI.removeOperand(4);
5632 assert(
MI.getOpcode() == TargetOpcode::G_SUB);
5665 auto Zero =
B.buildConstant(
MRI.getType(Dst), 0);
5666 B.buildSub(Dst, Zero, ReplaceReg);
5675 unsigned Opcode =
MI.getOpcode();
5676 assert(Opcode == TargetOpcode::G_UDIV || Opcode == TargetOpcode::G_UREM);
5678 Register Dst = UDivorRem.getReg(0);
5679 Register LHS = UDivorRem.getReg(1);
5680 Register RHS = UDivorRem.getReg(2);
5681 LLT Ty =
MRI.getType(Dst);
5689 bool UseSRL =
false;
5694 auto BuildExactUDIVPattern = [&](
const Constant *
C) {
5696 if (IsSplat && !Factors.
empty()) {
5703 APInt Divisor = CI->getValue();
5712 Shifts.
push_back(MIB.buildConstant(ScalarShiftAmtTy, Shift).getReg(0));
5713 Factors.
push_back(MIB.buildConstant(ScalarTy, Factor).getReg(0));
5723 if (Ty.isVector()) {
5724 Shift = MIB.buildBuildVector(ShiftAmtTy, Shifts).getReg(0);
5725 Factor = MIB.buildBuildVector(Ty, Factors).getReg(0);
5728 Factor = Factors[0];
5736 return MIB.buildMul(Ty, Res, Factor);
5739 unsigned KnownLeadingZeros =
5740 VT ?
VT->getKnownBits(LHS).countMinLeadingZeros() : 0;
5742 bool UseNPQ =
false;
5744 auto BuildUDIVPattern = [&](
const Constant *
C) {
5746 const APInt &Divisor = CI->getValue();
5748 bool SelNPQ =
false;
5750 unsigned PreShift = 0, PostShift = 0;
5755 if (!Divisor.
isOne()) {
5761 Divisor, std::min(KnownLeadingZeros, Divisor.
countl_zero()));
5763 Magic = std::move(magics.
Magic);
5766 "We shouldn't generate an undefined shift!");
5768 "We shouldn't generate an undefined shift!");
5772 SelNPQ = magics.
IsAdd;
5776 MIB.buildConstant(ScalarShiftAmtTy, PreShift).getReg(0));
5777 MagicFactors.
push_back(MIB.buildConstant(ScalarTy, Magic).getReg(0));
5779 MIB.buildConstant(ScalarTy,
5784 MIB.buildConstant(ScalarShiftAmtTy, PostShift).getReg(0));
5792 assert(Matched &&
"Expected unary predicate match to succeed");
5794 Register PreShift, PostShift, MagicFactor, NPQFactor;
5797 PreShift = MIB.buildBuildVector(ShiftAmtTy, PreShifts).getReg(0);
5798 MagicFactor = MIB.buildBuildVector(Ty, MagicFactors).getReg(0);
5799 NPQFactor = MIB.buildBuildVector(Ty, NPQFactors).getReg(0);
5800 PostShift = MIB.buildBuildVector(ShiftAmtTy, PostShifts).getReg(0);
5803 "Non-build_vector operation should have been a scalar");
5804 PreShift = PreShifts[0];
5805 MagicFactor = MagicFactors[0];
5806 PostShift = PostShifts[0];
5810 Q = MIB.buildLShr(Ty, Q, PreShift).getReg(0);
5813 Q = MIB.buildUMulH(Ty, Q, MagicFactor).getReg(0);
5816 Register NPQ = MIB.buildSub(Ty, LHS, Q).getReg(0);
5821 NPQ = MIB.buildUMulH(Ty, NPQ, NPQFactor).getReg(0);
5823 NPQ = MIB.buildLShr(Ty, NPQ, MIB.buildConstant(ShiftAmtTy, 1)).getReg(0);
5825 Q = MIB.buildAdd(Ty, NPQ, Q).getReg(0);
5828 Q = MIB.buildLShr(Ty, Q, PostShift).getReg(0);
5829 auto One = MIB.buildConstant(Ty, 1);
5830 auto IsOne = MIB.buildICmp(
5834 auto ret = MIB.buildSelect(Ty, IsOne, LHS, Q);
5836 if (Opcode == TargetOpcode::G_UREM) {
5837 auto Prod = MIB.buildMul(Ty, ret, RHS);
5838 return MIB.buildSub(Ty, LHS, Prod);
5844 unsigned Opcode =
MI.getOpcode();
5845 assert(Opcode == TargetOpcode::G_UDIV || Opcode == TargetOpcode::G_UREM);
5848 LLT DstTy =
MRI.getType(Dst);
5850 auto &MF = *
MI.getMF();
5851 AttributeList Attr = MF.getFunction().getAttributes();
5860 if (MF.getFunction().hasMinSize())
5863 if (Opcode == TargetOpcode::G_UDIV &&
5866 MRI, RHS, [](
const Constant *
C) {
return C && !
C->isNullValue(); });
5869 auto *RHSDef =
MRI.getVRegDef(RHS);
5880 {TargetOpcode::G_ICMP,
5884 if (Opcode == TargetOpcode::G_UREM &&
5890 MRI, RHS, [](
const Constant *
C) {
return C && !
C->isNullValue(); });
5899 unsigned Opcode =
MI.getOpcode();
5900 assert(Opcode == TargetOpcode::G_SDIV || Opcode == TargetOpcode::G_SREM);
5903 LLT DstTy =
MRI.getType(Dst);
5907 auto &MF = *
MI.getMF();
5908 AttributeList Attr = MF.getFunction().getAttributes();
5917 if (MF.getFunction().hasMinSize())
5921 if (Opcode == TargetOpcode::G_SDIV &&
5924 MRI, RHS, [](
const Constant *
C) {
return C && !
C->isNullValue(); });
5927 auto *RHSDef =
MRI.getVRegDef(RHS);
5935 if (!
isLegal({TargetOpcode::G_SMULH, {DstTy}}) &&
5938 if (Opcode == TargetOpcode::G_SREM &&
5944 MRI, RHS, [](
const Constant *
C) {
return C && !
C->isNullValue(); });
5953 unsigned Opcode =
MI.getOpcode();
5954 assert(
MI.getOpcode() == TargetOpcode::G_SDIV ||
5955 Opcode == TargetOpcode::G_SREM);
5957 Register Dst = SDivorRem.getReg(0);
5958 Register LHS = SDivorRem.getReg(1);
5959 Register RHS = SDivorRem.getReg(2);
5960 LLT Ty =
MRI.getType(Dst);
5967 bool UseSRA =
false;
5973 auto BuildExactSDIVPattern = [&](
const Constant *
C) {
5975 if (IsSplat && !ExactFactors.
empty()) {
5977 ExactFactors.
push_back(ExactFactors[0]);
5982 APInt Divisor = CI->getValue();
5992 ExactShifts.
push_back(MIB.buildConstant(ScalarShiftAmtTy, Shift).getReg(0));
5993 ExactFactors.
push_back(MIB.buildConstant(ScalarTy, Factor).getReg(0));
6001 assert(Matched &&
"Expected unary predicate match to succeed");
6004 if (Ty.isVector()) {
6005 Shift = MIB.buildBuildVector(ShiftAmtTy, ExactShifts).getReg(0);
6006 Factor = MIB.buildBuildVector(Ty, ExactFactors).getReg(0);
6008 Shift = ExactShifts[0];
6009 Factor = ExactFactors[0];
6017 return MIB.buildMul(Ty, Res, Factor);
6022 auto BuildSDIVPattern = [&](
const Constant *
C) {
6024 const APInt &Divisor = CI->getValue();
6028 int NumeratorFactor = 0;
6039 NumeratorFactor = 1;
6042 NumeratorFactor = -1;
6045 MagicFactors.
push_back(MIB.buildConstant(ScalarTy, Magics.
Magic).getReg(0));
6046 Factors.
push_back(MIB.buildConstant(ScalarTy, NumeratorFactor).getReg(0));
6048 MIB.buildConstant(ScalarShiftAmtTy, Magics.
ShiftAmount).getReg(0));
6049 ShiftMasks.
push_back(MIB.buildConstant(ScalarTy, ShiftMask).getReg(0));
6057 assert(Matched &&
"Expected unary predicate match to succeed");
6059 Register MagicFactor, Factor, Shift, ShiftMask;
6062 MagicFactor = MIB.buildBuildVector(Ty, MagicFactors).getReg(0);
6063 Factor = MIB.buildBuildVector(Ty, Factors).getReg(0);
6064 Shift = MIB.buildBuildVector(ShiftAmtTy, Shifts).getReg(0);
6065 ShiftMask = MIB.buildBuildVector(Ty, ShiftMasks).getReg(0);
6068 "Non-build_vector operation should have been a scalar");
6069 MagicFactor = MagicFactors[0];
6070 Factor = Factors[0];
6072 ShiftMask = ShiftMasks[0];
6076 Q = MIB.buildSMulH(Ty, LHS, MagicFactor).getReg(0);
6079 Factor = MIB.buildMul(Ty, LHS, Factor).getReg(0);
6080 Q = MIB.buildAdd(Ty, Q, Factor).getReg(0);
6083 Q = MIB.buildAShr(Ty, Q, Shift).getReg(0);
6086 auto SignShift = MIB.buildConstant(ShiftAmtTy, EltBits - 1);
6087 auto T = MIB.buildLShr(Ty, Q, SignShift);
6088 T = MIB.buildAnd(Ty,
T, ShiftMask);
6089 auto ret = MIB.buildAdd(Ty, Q,
T);
6091 if (Opcode == TargetOpcode::G_SREM) {
6092 auto Prod = MIB.buildMul(Ty, ret, RHS);
6093 return MIB.buildSub(Ty, LHS, Prod);
6099 assert((
MI.getOpcode() == TargetOpcode::G_SDIV ||
6100 MI.getOpcode() == TargetOpcode::G_UDIV) &&
6101 "Expected SDIV or UDIV");
6104 auto MatchPow2 = [&](
const Constant *
C) {
6106 return CI && (CI->getValue().isPowerOf2() ||
6107 (IsSigned && CI->getValue().isNegatedPowerOf2()));
6113 assert(
MI.getOpcode() == TargetOpcode::G_SDIV &&
"Expected SDIV");
6118 LLT Ty =
MRI.getType(Dst);
6138 unsigned BitWidth = Ty.getScalarSizeInBits();
6139 auto Zero =
Builder.buildConstant(Ty, 0);
6142 auto C1 =
Builder.buildCTTZ(ShiftAmtTy, RHS);
6143 auto Inexact =
Builder.buildSub(ShiftAmtTy, Bits, C1);
6145 auto Sign =
Builder.buildAShr(
6149 auto LSrl =
Builder.buildLShr(Ty, Sign, Inexact);
6155 auto One =
Builder.buildConstant(Ty, 1);
6156 auto MinusOne =
Builder.buildConstant(Ty, -1);
6160 auto IsOneOrMinusOne =
Builder.buildOr(CCVT, IsOne, IsMinusOne);
6161 AShr =
Builder.buildSelect(Ty, IsOneOrMinusOne, LHS, AShr);
6165 auto Neg =
Builder.buildNeg(Ty, AShr);
6167 Builder.buildSelect(
MI.getOperand(0).getReg(), IsNeg, Neg, AShr);
6168 MI.eraseFromParent();
6172 assert(
MI.getOpcode() == TargetOpcode::G_UDIV &&
"Expected UDIV");
6177 LLT Ty =
MRI.getType(Dst);
6180 auto C1 =
Builder.buildCTTZ(ShiftAmtTy, RHS);
6181 Builder.buildLShr(
MI.getOperand(0).getReg(), LHS, C1);
6182 MI.eraseFromParent();
6186 assert(
MI.getOpcode() == TargetOpcode::G_SREM &&
"Expected SREM");
6191 LLT Ty =
MRI.getType(Dst);
6210 unsigned BitWidth = Ty.getScalarSizeInBits();
6211 auto AbsRHS =
Builder.buildAbs(Ty, RHS);
6212 auto Mask =
Builder.buildSub(Ty, AbsRHS,
Builder.buildConstant(Ty, 1));
6214 auto Sign =
Builder.buildAShr(Ty, LHS, BWMinusOne);
6215 auto Bias =
Builder.buildAnd(Ty, Sign, Mask);
6216 auto Biased =
Builder.buildAdd(Ty, LHS, Bias);
6219 MI.eraseFromParent();
6223 assert(
MI.getOpcode() == TargetOpcode::G_UMULH);
6226 LLT Ty =
MRI.getType(Dst);
6227 LLT RHSTy =
MRI.getType(RHS);
6229 auto MatchPow2ExceptOne = [&](
const Constant *
C) {
6231 return CI->getValue().isPowerOf2() && !CI->getValue().isOne();
6246 LLT Ty =
MRI.getType(Dst);
6252 Builder.buildSub(Ty,
Builder.buildConstant(Ty, NumEltBits), LogBase2);
6253 auto Trunc =
Builder.buildZExtOrTrunc(ShiftAmtTy, ShiftAmt);
6254 Builder.buildLShr(Dst, LHS, Trunc);
6255 MI.eraseFromParent();
6262 LLT DstTy =
MRI.getType(Dst);
6263 LLT SrcTy =
MRI.getType(Src);
6265 unsigned NumSrcBits = SrcTy.getScalarSizeInBits();
6266 assert(NumSrcBits > NumDstBits &&
"Unexpected types for truncate operation");
6269 {TargetOpcode::G_TRUNC_SSAT_S, {DstTy, SrcTy}}))
6287 Builder.buildTruncSSatS(Dst, MatchInfo);
6288 MI.eraseFromParent();
6295 LLT DstTy =
MRI.getType(Dst);
6296 LLT SrcTy =
MRI.getType(Src);
6298 unsigned NumSrcBits = SrcTy.getScalarSizeInBits();
6299 assert(NumSrcBits > NumDstBits &&
"Unexpected types for truncate operation");
6302 {TargetOpcode::G_TRUNC_SSAT_U, {DstTy, SrcTy}}))
6320 Builder.buildTruncSSatU(Dst, MatchInfo);
6321 MI.eraseFromParent();
6328 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
6329 LLT SrcTy =
MRI.getType(Val);
6331 unsigned NumSrcBits = SrcTy.getScalarSizeInBits();
6332 assert(NumSrcBits > NumDstBits &&
"Unexpected types for truncate operation");
6335 {TargetOpcode::G_TRUNC_SSAT_U, {DstTy, SrcTy}}))
6344 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
6353 unsigned Opc =
MI.getOpcode();
6354 assert(
Opc == TargetOpcode::G_FADD ||
Opc == TargetOpcode::G_FSUB ||
6355 Opc == TargetOpcode::G_FMUL ||
Opc == TargetOpcode::G_FDIV ||
6356 Opc == TargetOpcode::G_FMAD ||
Opc == TargetOpcode::G_FMA);
6368 Opc = TargetOpcode::G_FSUB;
6373 Opc = TargetOpcode::G_FADD;
6379 else if ((
Opc == TargetOpcode::G_FMUL ||
Opc == TargetOpcode::G_FDIV ||
6380 Opc == TargetOpcode::G_FMAD ||
Opc == TargetOpcode::G_FMA) &&
6389 MI.setDesc(
B.getTII().get(
Opc));
6390 MI.getOperand(1).setReg(
X);
6391 MI.getOperand(2).setReg(
Y);
6399 assert(
MI.getOpcode() == TargetOpcode::G_FSUB);
6402 MatchInfo =
MI.getOperand(2).getReg();
6403 LLT Ty =
MRI.getType(
MI.getOperand(0).getReg());
6405 const auto LHSCst = Ty.isVector()
6412 if (LHSCst->Value.isNegZero())
6416 if (LHSCst->Value.isPosZero())
6426 Dst,
Builder.buildFCanonicalize(
MRI.getType(Dst), MatchInfo).getReg(0));
6433 if (
MI.getOpcode() != TargetOpcode::G_FMUL)
6447 bool &AllowFusionGlobally,
6449 bool CanReassociate)
const {
6451 auto *MF =
MI.getMF();
6452 const auto &TLI = *MF->getSubtarget().getTargetLowering();
6454 LLT DstType =
MRI.getType(
MI.getOperand(0).getReg());
6462 bool HasFMA = TLI.isFMAFasterThanFMulAndFAdd(*MF, DstType) &&
6465 if (!HasFMAD && !HasFMA)
6473 Aggressive = TLI.enableAggressiveFMAFusion(DstType);
6480 assert(
MI.getOpcode() == TargetOpcode::G_FADD);
6482 bool AllowFusionGlobally, HasFMAD,
Aggressive;
6490 unsigned PreferredFusedOpcode =
6491 HasFMAD ? TargetOpcode::G_FMAD : TargetOpcode::G_FMA;
6505 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6506 {LHS.MI->getOperand(1).getReg(),
6507 LHS.MI->getOperand(2).getReg(), RHS.Reg});
6516 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6517 {RHS.MI->getOperand(1).getReg(),
6518 RHS.MI->getOperand(2).getReg(), LHS.Reg});
6529 assert(
MI.getOpcode() == TargetOpcode::G_FADD);
6531 bool AllowFusionGlobally, HasFMAD,
Aggressive;
6535 const auto &TLI = *
MI.getMF()->getSubtarget().getTargetLowering();
6540 LLT DstType =
MRI.getType(
MI.getOperand(0).getReg());
6542 unsigned PreferredFusedOpcode =
6543 HasFMAD ? TargetOpcode::G_FMAD : TargetOpcode::G_FMA;
6557 TLI.isFPExtFoldable(
MI, PreferredFusedOpcode, DstType,
6562 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6563 {FpExtX.getReg(0), FpExtY.getReg(0), RHS.Reg});
6572 TLI.isFPExtFoldable(
MI, PreferredFusedOpcode, DstType,
6577 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6578 {FpExtX.getReg(0), FpExtY.getReg(0), LHS.Reg});
6589 assert(
MI.getOpcode() == TargetOpcode::G_FADD);
6591 bool AllowFusionGlobally, HasFMAD,
Aggressive;
6599 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
6601 unsigned PreferredFusedOpcode =
6602 HasFMAD ? TargetOpcode::G_FMAD : TargetOpcode::G_FMA;
6615 if (LHS.MI->getOpcode() == PreferredFusedOpcode &&
6616 (
MRI.getVRegDef(LHS.MI->getOperand(3).getReg())->getOpcode() ==
6617 TargetOpcode::G_FMUL) &&
6618 MRI.hasOneNonDBGUse(LHS.MI->getOperand(0).getReg()) &&
6619 MRI.hasOneNonDBGUse(LHS.MI->getOperand(3).getReg())) {
6624 else if (RHS.MI->getOpcode() == PreferredFusedOpcode &&
6625 (
MRI.getVRegDef(RHS.MI->getOperand(3).getReg())->getOpcode() ==
6626 TargetOpcode::G_FMUL) &&
6627 MRI.hasOneNonDBGUse(RHS.MI->getOperand(0).getReg()) &&
6628 MRI.hasOneNonDBGUse(RHS.MI->getOperand(3).getReg())) {
6635 Register X = FMA->getOperand(1).getReg();
6636 Register Y = FMA->getOperand(2).getReg();
6641 Register InnerFMA =
MRI.createGenericVirtualRegister(DstTy);
6642 B.buildInstr(PreferredFusedOpcode, {InnerFMA}, {U, V, Z});
6643 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6655 assert(
MI.getOpcode() == TargetOpcode::G_FADD);
6657 bool AllowFusionGlobally, HasFMAD,
Aggressive;
6664 const auto &TLI = *
MI.getMF()->getSubtarget().getTargetLowering();
6665 LLT DstType =
MRI.getType(
MI.getOperand(0).getReg());
6671 unsigned PreferredFusedOpcode =
6672 HasFMAD ? TargetOpcode::G_FMAD : TargetOpcode::G_FMA;
6685 Register FpExtU =
B.buildFPExt(DstType, U).getReg(0);
6686 Register FpExtV =
B.buildFPExt(DstType, V).getReg(0);
6688 B.buildInstr(PreferredFusedOpcode, {DstType}, {FpExtU, FpExtV, Z})
6690 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6697 if (LHS.MI->getOpcode() == PreferredFusedOpcode &&
6701 TLI.isFPExtFoldable(
MI, PreferredFusedOpcode, DstType,
6706 LHS.MI->getOperand(1).getReg(),
6707 LHS.MI->getOperand(2).getReg(),
B);
6718 FMAMI->
getOpcode() == PreferredFusedOpcode) {
6721 TLI.isFPExtFoldable(
MI, PreferredFusedOpcode, DstType,
6726 X =
B.buildFPExt(DstType,
X).getReg(0);
6727 Y =
B.buildFPExt(DstType,
Y).getReg(0);
6738 if (RHS.MI->getOpcode() == PreferredFusedOpcode &&
6742 TLI.isFPExtFoldable(
MI, PreferredFusedOpcode, DstType,
6747 RHS.MI->getOperand(1).getReg(),
6748 RHS.MI->getOperand(2).getReg(),
B);
6759 FMAMI->
getOpcode() == PreferredFusedOpcode) {
6762 TLI.isFPExtFoldable(
MI, PreferredFusedOpcode, DstType,
6767 X =
B.buildFPExt(DstType,
X).getReg(0);
6768 Y =
B.buildFPExt(DstType,
Y).getReg(0);
6782 assert(
MI.getOpcode() == TargetOpcode::G_FSUB);
6784 bool AllowFusionGlobally, HasFMAD,
Aggressive;
6792 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
6796 int FirstMulHasFewerUses =
true;
6800 FirstMulHasFewerUses =
false;
6802 unsigned PreferredFusedOpcode =
6803 HasFMAD ? TargetOpcode::G_FMAD : TargetOpcode::G_FMA;
6806 if (FirstMulHasFewerUses &&
6810 Register NegZ =
B.buildFNeg(DstTy, RHS.Reg).getReg(0);
6811 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6812 {LHS.MI->getOperand(1).getReg(),
6813 LHS.MI->getOperand(2).getReg(), NegZ});
6822 B.buildFNeg(DstTy, RHS.MI->getOperand(1).getReg()).getReg(0);
6823 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6824 {NegY, RHS.MI->getOperand(2).getReg(), LHS.Reg});
6835 assert(
MI.getOpcode() == TargetOpcode::G_FSUB);
6837 bool AllowFusionGlobally, HasFMAD,
Aggressive;
6843 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
6845 unsigned PreferredFusedOpcode =
6846 HasFMAD ? TargetOpcode::G_FMAD : TargetOpcode::G_FMA;
6857 Register NegZ =
B.buildFNeg(DstTy, RHSReg).getReg(0);
6858 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6870 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6883 assert(
MI.getOpcode() == TargetOpcode::G_FSUB);
6885 bool AllowFusionGlobally, HasFMAD,
Aggressive;
6891 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
6893 unsigned PreferredFusedOpcode =
6894 HasFMAD ? TargetOpcode::G_FMAD : TargetOpcode::G_FMA;
6906 Register NegZ =
B.buildFNeg(DstTy, RHSReg).getReg(0);
6907 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6908 {FpExtX, FpExtY, NegZ});
6920 Register NegY =
B.buildFNeg(DstTy, FpExtY).getReg(0);
6923 B.buildInstr(PreferredFusedOpcode, {
MI.getOperand(0).getReg()},
6924 {NegY, FpExtZ, LHSReg});
6935 assert(
MI.getOpcode() == TargetOpcode::G_FSUB);
6937 bool AllowFusionGlobally, HasFMAD,
Aggressive;
6941 const auto &TLI = *
MI.getMF()->getSubtarget().getTargetLowering();
6942 LLT DstTy =
MRI.getType(
MI.getOperand(0).getReg());
6946 unsigned PreferredFusedOpcode =
6947 HasFMAD ? TargetOpcode::G_FMAD : TargetOpcode::G_FMA;
6951 Register FpExtX =
B.buildFPExt(DstTy,
X).getReg(0);
6952 Register FpExtY =
B.buildFPExt(DstTy,
Y).getReg(0);
6953 B.buildInstr(PreferredFusedOpcode, {Dst}, {FpExtX, FpExtY, Z});
6964 TLI.isFPExtFoldable(
MI, PreferredFusedOpcode, DstTy,
6967 Register FMAReg =
MRI.createGenericVirtualRegister(DstTy);
6970 B.buildFNeg(
MI.getOperand(0).getReg(), FMAReg);
6980 TLI.isFPExtFoldable(
MI, PreferredFusedOpcode, DstTy,
6993 unsigned &IdxToPropagate)
const {
6995 switch (
MI.getOpcode()) {
6998 case TargetOpcode::G_FMINNUM:
6999 case TargetOpcode::G_FMAXNUM:
7000 PropagateNaN =
false;
7002 case TargetOpcode::G_FMINIMUM:
7003 case TargetOpcode::G_FMAXIMUM:
7004 PropagateNaN =
true;
7008 auto MatchNaN = [&](
unsigned Idx) {
7009 Register MaybeNaNReg =
MI.getOperand(Idx).getReg();
7013 IdxToPropagate = PropagateNaN ? Idx : (Idx == 1 ? 2 : 1);
7017 return MatchNaN(1) || MatchNaN(2);
7025 assert(
MI.getOpcode() == TargetOpcode::G_FDIV);
7035 return N0CFP && (N0CFP->isExactlyValue(1.0) || N0CFP->isExactlyValue(-1.0));
7052 for (
auto &U :
MRI.use_nodbg_instructions(
Y)) {
7053 if (&U == &
MI || U.getParent() !=
MI.getParent())
7055 if (U.getOpcode() == TargetOpcode::G_FDIV &&
7056 U.getOperand(2).getReg() ==
Y && U.getOperand(1).getReg() !=
Y &&
7057 !IsOne(U.getOperand(1).getReg())) {
7070 return MatchInfo.
size() >= MinUses;
7078 LLT Ty =
MRI.getType(MatchInfo[0]->getOperand(0).
getReg());
7079 auto Div =
Builder.buildFDiv(Ty,
Builder.buildFConstant(Ty, 1.0),
7080 MatchInfo[0]->getOperand(2).getReg(),
7081 MatchInfo[0]->getFlags());
7086 Builder.buildFMul(
MI->getOperand(0).getReg(),
MI->getOperand(1).getReg(),
7087 Div->getOperand(0).getReg(),
MI->getFlags());
7088 MI->eraseFromParent();
7093 assert(
MI.getOpcode() == TargetOpcode::G_ADD &&
"Expected a G_ADD");
7103 Reg == MaybeSameReg;
7105 return CheckFold(LHS, RHS) || CheckFold(RHS, LHS);
7126 LLT DstVecTy =
MRI.getType(
MI.getOperand(0).getReg());
7135 return MRI.getType(MatchInfo) == DstVecTy;
7138 std::optional<ValueAndVReg> ShiftAmount;
7147 return MRI.getType(MatchInfo) == DstVecTy;
7162 return MRI.getType(MatchInfo) ==
MRI.getType(
MI.getOperand(0).getReg());
7169 std::optional<ValueAndVReg> ShiftAmt;
7175 LLT MatchTy =
MRI.getType(MatchInfo);
7176 return ShiftAmt->Value.getZExtValue() == MatchTy.
getSizeInBits() &&
7177 MatchTy ==
MRI.getType(
MI.getOperand(0).getReg());
7180unsigned CombinerHelper::getFPMinMaxOpcForSelect(
7182 SelectPatternNaNBehaviour VsNaNRetVal)
const {
7183 assert(VsNaNRetVal != SelectPatternNaNBehaviour::NOT_APPLICABLE &&
7184 "Expected a NaN behaviour?");
7194 if (VsNaNRetVal == SelectPatternNaNBehaviour::RETURNS_OTHER)
7195 return TargetOpcode::G_FMAXNUM;
7196 if (VsNaNRetVal == SelectPatternNaNBehaviour::RETURNS_NAN)
7197 return TargetOpcode::G_FMAXIMUM;
7198 if (
isLegal({TargetOpcode::G_FMAXNUM, {DstTy}}))
7199 return TargetOpcode::G_FMAXNUM;
7200 if (
isLegal({TargetOpcode::G_FMAXIMUM, {DstTy}}))
7201 return TargetOpcode::G_FMAXIMUM;
7207 if (VsNaNRetVal == SelectPatternNaNBehaviour::RETURNS_OTHER)
7208 return TargetOpcode::G_FMINNUM;
7209 if (VsNaNRetVal == SelectPatternNaNBehaviour::RETURNS_NAN)
7210 return TargetOpcode::G_FMINIMUM;
7211 if (
isLegal({TargetOpcode::G_FMINNUM, {DstTy}}))
7212 return TargetOpcode::G_FMINNUM;
7213 if (!
isLegal({TargetOpcode::G_FMINIMUM, {DstTy}}))
7215 return TargetOpcode::G_FMINIMUM;
7219CombinerHelper::SelectPatternNaNBehaviour
7221 bool IsOrderedComparison)
const {
7222 bool LHSSafe =
VT->isKnownNeverNaN(
LHS);
7223 bool RHSSafe =
VT->isKnownNeverNaN(
RHS);
7225 if (!LHSSafe && !RHSSafe)
7226 return SelectPatternNaNBehaviour::NOT_APPLICABLE;
7227 if (LHSSafe && RHSSafe)
7228 return SelectPatternNaNBehaviour::RETURNS_ANY;
7231 if (IsOrderedComparison)
7232 return LHSSafe ? SelectPatternNaNBehaviour::RETURNS_NAN
7233 : SelectPatternNaNBehaviour::RETURNS_OTHER;
7236 return LHSSafe ? SelectPatternNaNBehaviour::RETURNS_OTHER
7237 : SelectPatternNaNBehaviour::RETURNS_NAN;
7246 LLT DstTy =
MRI.getType(Dst);
7259 SelectPatternNaNBehaviour ResWithKnownNaNInfo =
7261 if (ResWithKnownNaNInfo == SelectPatternNaNBehaviour::NOT_APPLICABLE)
7263 if (TrueVal == CmpRHS && FalseVal == CmpLHS) {
7266 if (ResWithKnownNaNInfo == SelectPatternNaNBehaviour::RETURNS_NAN)
7267 ResWithKnownNaNInfo = SelectPatternNaNBehaviour::RETURNS_OTHER;
7268 else if (ResWithKnownNaNInfo == SelectPatternNaNBehaviour::RETURNS_OTHER)
7269 ResWithKnownNaNInfo = SelectPatternNaNBehaviour::RETURNS_NAN;
7271 if (TrueVal != CmpLHS || FalseVal != CmpRHS)
7274 unsigned Opc = getFPMinMaxOpcForSelect(Pred, DstTy, ResWithKnownNaNInfo);
7279 if (
Opc != TargetOpcode::G_FMAXIMUM &&
Opc != TargetOpcode::G_FMINIMUM) {
7284 if (!KnownNonZeroSide || !KnownNonZeroSide->Value.isNonZero()) {
7286 if (!KnownNonZeroSide || !KnownNonZeroSide->Value.isNonZero())
7290 MatchInfo = [=](MachineIRBuilder &
B) {
7291 B.buildInstr(
Opc, {Dst}, {CmpLHS, CmpRHS});
7299 assert(
MI.getOpcode() == TargetOpcode::G_SELECT);
7306 Register TrueVal =
MI.getOperand(2).getReg();
7307 Register FalseVal =
MI.getOperand(3).getReg();
7308 return matchFPSelectToMinMax(Dst,
Cond, TrueVal, FalseVal, MatchInfo);
7313 assert(
MI.getOpcode() == TargetOpcode::G_ICMP);
7326 if (MatchedSub &&
X != OpLHS)
7334 Y =
X == OpLHS ? OpRHS :
X == OpRHS ? OpLHS :
Register();
7337 auto Zero =
B.buildConstant(
MRI.getType(
Y), 0);
7338 B.buildICmp(Pred, Dst,
Y, Zero);
7345static std::optional<unsigned>
7347 std::optional<int64_t> &Result) {
7348 assert((Opcode == TargetOpcode::G_SHL || Opcode == TargetOpcode::G_LSHR ||
7349 Opcode == TargetOpcode::G_ASHR) &&
7350 "Expect G_SHL, G_LSHR or G_ASHR.");
7351 auto SignificantBits = 0;
7353 case TargetOpcode::G_SHL:
7357 case TargetOpcode::G_LSHR:
7361 case TargetOpcode::G_ASHR:
7370 Result = std::nullopt;
7381 Register ShiftVal =
MI.getOperand(1).getReg();
7382 Register ShiftReg =
MI.getOperand(2).getReg();
7383 LLT ResTy =
MRI.getType(
MI.getOperand(0).getReg());
7384 auto IsShiftTooBig = [&](
const Constant *
C) {
7389 MatchInfo = std::nullopt;
7393 MI.getOpcode(), MatchInfo);
7394 return OptMaxUsefulShift && CI->uge(*OptMaxUsefulShift);
7400 unsigned LHSOpndIdx = 1;
7401 unsigned RHSOpndIdx = 2;
7402 switch (
MI.getOpcode()) {
7403 case TargetOpcode::G_UADDO:
7404 case TargetOpcode::G_SADDO:
7405 case TargetOpcode::G_UMULO:
7406 case TargetOpcode::G_SMULO:
7413 Register LHS =
MI.getOperand(LHSOpndIdx).getReg();
7414 Register RHS =
MI.getOperand(RHSOpndIdx).getReg();
7419 if (
MRI.getVRegDef(LHS)->getOpcode() !=
7420 TargetOpcode::G_CONSTANT_FOLD_BARRIER)
7424 return MRI.getVRegDef(RHS)->getOpcode() !=
7425 TargetOpcode::G_CONSTANT_FOLD_BARRIER &&
7432 std::optional<FPValueAndVReg> ValAndVReg;
7440 unsigned LHSOpndIdx = 1;
7441 unsigned RHSOpndIdx = 2;
7442 switch (
MI.getOpcode()) {
7443 case TargetOpcode::G_UADDO:
7444 case TargetOpcode::G_SADDO:
7445 case TargetOpcode::G_UMULO:
7446 case TargetOpcode::G_SMULO:
7453 Register LHSReg =
MI.getOperand(LHSOpndIdx).getReg();
7454 Register RHSReg =
MI.getOperand(RHSOpndIdx).getReg();
7455 MI.getOperand(LHSOpndIdx).setReg(RHSReg);
7456 MI.getOperand(RHSOpndIdx).setReg(LHSReg);
7460bool CombinerHelper::isOneOrOneSplat(
Register Src,
bool AllowUndefs)
const {
7462 if (SrcTy.isFixedVector())
7464 if (SrcTy.isScalar()) {
7468 return IConstant && IConstant->Value == 1;
7473bool CombinerHelper::isZeroOrZeroSplat(
Register Src,
bool AllowUndefs)
const {
7474 LLT SrcTy =
MRI.getType(Src);
7476 return isConstantSplatVector(Src, 0, AllowUndefs);
7481 return IConstant && IConstant->Value == 0;
7488bool CombinerHelper::isConstantSplatVector(
Register Src, int64_t SplatValue,
7489 bool AllowUndefs)
const {
7495 for (
unsigned I = 0;
I < NumSources; ++
I) {
7496 GImplicitDef *ImplicitDef =
7498 if (ImplicitDef && AllowUndefs)
7500 if (ImplicitDef && !AllowUndefs)
7502 std::optional<ValueAndVReg> IConstant =
7504 if (IConstant && IConstant->Value == SplatValue)
7514CombinerHelper::getConstantOrConstantSplatVector(
Register Src)
const {
7517 return IConstant->Value;
7521 return std::nullopt;
7524 std::optional<APInt>
Value = std::nullopt;
7525 for (
unsigned I = 0;
I < NumSources; ++
I) {
7526 std::optional<ValueAndVReg> IConstant =
7529 return std::nullopt;
7531 Value = IConstant->Value;
7532 else if (*
Value != IConstant->Value)
7533 return std::nullopt;
7539bool CombinerHelper::isConstantOrConstantVectorI(
Register Src)
const {
7549 for (
unsigned I = 0;
I < NumSources; ++
I) {
7550 std::optional<ValueAndVReg> IConstant =
7559bool CombinerHelper::tryFoldSelectOfConstants(
GSelect *
Select,
7566 LLT CondTy =
MRI.getType(
Select->getCondReg());
7567 LLT TrueTy =
MRI.getType(
Select->getTrueReg());
7577 std::optional<ValueAndVReg> TrueOpt =
7579 std::optional<ValueAndVReg> FalseOpt =
7582 if (!TrueOpt || !FalseOpt)
7585 APInt TrueValue = TrueOpt->Value;
7586 APInt FalseValue = FalseOpt->Value;
7590 MatchInfo = [=](MachineIRBuilder &
B) {
7591 B.setInstrAndDebugLoc(*
Select);
7592 B.buildZExtOrTrunc(Dest,
Cond);
7599 MatchInfo = [=](MachineIRBuilder &
B) {
7600 B.setInstrAndDebugLoc(*
Select);
7601 B.buildSExtOrTrunc(Dest,
Cond);
7608 MatchInfo = [=](MachineIRBuilder &
B) {
7609 B.setInstrAndDebugLoc(*
Select);
7610 Register Inner =
MRI.createGenericVirtualRegister(CondTy);
7611 B.buildNot(Inner,
Cond);
7612 B.buildZExtOrTrunc(Dest, Inner);
7619 MatchInfo = [=](MachineIRBuilder &
B) {
7620 B.setInstrAndDebugLoc(*
Select);
7621 Register Inner =
MRI.createGenericVirtualRegister(CondTy);
7622 B.buildNot(Inner,
Cond);
7623 B.buildSExtOrTrunc(Dest, Inner);
7629 if (TrueValue - 1 == FalseValue) {
7630 MatchInfo = [=](MachineIRBuilder &
B) {
7631 B.setInstrAndDebugLoc(*
Select);
7632 Register Inner =
MRI.createGenericVirtualRegister(TrueTy);
7633 B.buildZExtOrTrunc(Inner,
Cond);
7634 B.buildAdd(Dest, Inner, False);
7640 if (TrueValue + 1 == FalseValue) {
7641 MatchInfo = [=](MachineIRBuilder &
B) {
7642 B.setInstrAndDebugLoc(*
Select);
7643 Register Inner =
MRI.createGenericVirtualRegister(TrueTy);
7644 B.buildSExtOrTrunc(Inner,
Cond);
7645 B.buildAdd(Dest, Inner, False);
7652 MatchInfo = [=](MachineIRBuilder &
B) {
7653 B.setInstrAndDebugLoc(*
Select);
7654 Register Inner =
MRI.createGenericVirtualRegister(TrueTy);
7655 B.buildZExtOrTrunc(Inner,
Cond);
7658 auto ShAmtC =
B.buildConstant(ShiftTy, TrueValue.
exactLogBase2());
7659 B.buildShl(Dest, Inner, ShAmtC, Flags);
7666 MatchInfo = [=](MachineIRBuilder &
B) {
7667 B.setInstrAndDebugLoc(*
Select);
7669 B.buildNot(Not,
Cond);
7670 Register Inner =
MRI.createGenericVirtualRegister(TrueTy);
7671 B.buildZExtOrTrunc(Inner, Not);
7674 auto ShAmtC =
B.buildConstant(ShiftTy, FalseValue.
exactLogBase2());
7675 B.buildShl(Dest, Inner, ShAmtC, Flags);
7682 MatchInfo = [=](MachineIRBuilder &
B) {
7683 B.setInstrAndDebugLoc(*
Select);
7684 Register Inner =
MRI.createGenericVirtualRegister(TrueTy);
7685 B.buildSExtOrTrunc(Inner,
Cond);
7686 B.buildOr(Dest, Inner, False, Flags);
7693 MatchInfo = [=](MachineIRBuilder &
B) {
7694 B.setInstrAndDebugLoc(*
Select);
7696 B.buildNot(Not,
Cond);
7697 Register Inner =
MRI.createGenericVirtualRegister(TrueTy);
7698 B.buildSExtOrTrunc(Inner, Not);
7699 B.buildOr(Dest, Inner, True, Flags);
7708bool CombinerHelper::tryFoldBoolSelectToLogic(
GSelect *
Select,
7715 LLT CondTy =
MRI.getType(
Select->getCondReg());
7716 LLT TrueTy =
MRI.getType(
Select->getTrueReg());
7725 if (CondTy != TrueTy)
7730 if ((
Cond == True) || isOneOrOneSplat(True,
true)) {
7731 MatchInfo = [=](MachineIRBuilder &
B) {
7732 B.setInstrAndDebugLoc(*
Select);
7733 Register Ext =
MRI.createGenericVirtualRegister(TrueTy);
7734 B.buildZExtOrTrunc(Ext,
Cond);
7735 auto FreezeFalse =
B.buildFreeze(TrueTy, False);
7736 B.buildOr(DstReg, Ext, FreezeFalse, Flags);
7743 if ((
Cond == False) || isZeroOrZeroSplat(False,
true)) {
7744 MatchInfo = [=](MachineIRBuilder &
B) {
7745 B.setInstrAndDebugLoc(*
Select);
7746 Register Ext =
MRI.createGenericVirtualRegister(TrueTy);
7747 B.buildZExtOrTrunc(Ext,
Cond);
7748 auto FreezeTrue =
B.buildFreeze(TrueTy, True);
7749 B.buildAnd(DstReg, Ext, FreezeTrue);
7755 if (isOneOrOneSplat(False,
true)) {
7756 MatchInfo = [=](MachineIRBuilder &
B) {
7757 B.setInstrAndDebugLoc(*
Select);
7759 Register Inner =
MRI.createGenericVirtualRegister(CondTy);
7760 B.buildNot(Inner,
Cond);
7762 Register Ext =
MRI.createGenericVirtualRegister(TrueTy);
7763 B.buildZExtOrTrunc(Ext, Inner);
7764 auto FreezeTrue =
B.buildFreeze(TrueTy, True);
7765 B.buildOr(DstReg, Ext, FreezeTrue, Flags);
7771 if (isZeroOrZeroSplat(True,
true)) {
7772 MatchInfo = [=](MachineIRBuilder &
B) {
7773 B.setInstrAndDebugLoc(*
Select);
7775 Register Inner =
MRI.createGenericVirtualRegister(CondTy);
7776 B.buildNot(Inner,
Cond);
7778 Register Ext =
MRI.createGenericVirtualRegister(TrueTy);
7779 B.buildZExtOrTrunc(Ext, Inner);
7780 auto FreezeFalse =
B.buildFreeze(TrueTy, False);
7781 B.buildAnd(DstReg, Ext, FreezeFalse);
7797 LLT DstTy =
MRI.getType(DstReg);
7803 if (!
MRI.hasOneNonDBGUse(Cmp->getReg(0)))
7812 Register CmpLHS = Cmp->getLHSReg();
7813 Register CmpRHS = Cmp->getRHSReg();
7816 if (True == CmpRHS && False == CmpLHS) {
7824 if (True != CmpLHS || False != CmpRHS)
7864 assert(
MI.getOpcode() == TargetOpcode::G_SUB);
7865 Register DestReg =
MI.getOperand(0).getReg();
7866 LLT DestTy =
MRI.getType(DestReg);
7878 if (
isLegal({NewOpc, {DestTy}})) {
7880 B.buildInstr(NewOpc, {DestReg}, {
X, Sub0});
7892 if (tryFoldSelectOfConstants(
Select, MatchInfo))
7895 if (tryFoldBoolSelectToLogic(
Select, MatchInfo))
7905bool CombinerHelper::tryFoldAndOrOrICmpsUsingRanges(
7907 assert(Logic->
getOpcode() != TargetOpcode::G_XOR &&
"unexpected xor");
7908 bool IsAnd = Logic->
getOpcode() == TargetOpcode::G_AND;
7912 unsigned Flags = Logic->
getFlags();
7931 std::optional<ValueAndVReg> MaybeC1 =
7935 C1 = MaybeC1->Value;
7937 std::optional<ValueAndVReg> MaybeC2 =
7941 C2 = MaybeC2->Value;
7962 std::optional<APInt> Offset1;
7963 std::optional<APInt> Offset2;
7966 std::optional<ValueAndVReg> MaybeOffset1 =
7969 R1 =
Add->getLHSReg();
7970 Offset1 = MaybeOffset1->Value;
7974 std::optional<ValueAndVReg> MaybeOffset2 =
7977 R2 =
Add->getLHSReg();
7978 Offset2 = MaybeOffset2->Value;
7997 bool CreateMask =
false;
8010 if (!LowerDiff.
isPowerOf2() || LowerDiff != UpperDiff ||
8023 CR->getEquivalentICmp(NewPred, NewC,
Offset);
8032 MatchInfo = [=](MachineIRBuilder &
B) {
8033 if (CreateMask &&
Offset != 0) {
8034 auto TildeLowerDiff =
B.buildConstant(CmpOperandTy, ~LowerDiff);
8035 auto And =
B.buildAnd(CmpOperandTy, R1, TildeLowerDiff);
8036 auto OffsetC =
B.buildConstant(CmpOperandTy,
Offset);
8037 auto Add =
B.buildAdd(CmpOperandTy,
And, OffsetC, Flags);
8038 auto NewCon =
B.buildConstant(CmpOperandTy, NewC);
8039 auto ICmp =
B.buildICmp(NewPred, CmpTy,
Add, NewCon);
8040 B.buildZExtOrTrunc(DstReg, ICmp);
8041 }
else if (CreateMask &&
Offset == 0) {
8042 auto TildeLowerDiff =
B.buildConstant(CmpOperandTy, ~LowerDiff);
8043 auto And =
B.buildAnd(CmpOperandTy, R1, TildeLowerDiff);
8044 auto NewCon =
B.buildConstant(CmpOperandTy, NewC);
8045 auto ICmp =
B.buildICmp(NewPred, CmpTy,
And, NewCon);
8046 B.buildZExtOrTrunc(DstReg, ICmp);
8047 }
else if (!CreateMask &&
Offset != 0) {
8048 auto OffsetC =
B.buildConstant(CmpOperandTy,
Offset);
8049 auto Add =
B.buildAdd(CmpOperandTy, R1, OffsetC, Flags);
8050 auto NewCon =
B.buildConstant(CmpOperandTy, NewC);
8051 auto ICmp =
B.buildICmp(NewPred, CmpTy,
Add, NewCon);
8052 B.buildZExtOrTrunc(DstReg, ICmp);
8053 }
else if (!CreateMask &&
Offset == 0) {
8054 auto NewCon =
B.buildConstant(CmpOperandTy, NewC);
8055 auto ICmp =
B.buildICmp(NewPred, CmpTy, R1, NewCon);
8056 B.buildZExtOrTrunc(DstReg, ICmp);
8064bool CombinerHelper::tryFoldLogicOfFCmps(
GLogicalBinOp *Logic,
8070 bool IsAnd = Logic->
getOpcode() == TargetOpcode::G_AND;
8082 LLT CmpTy =
MRI.getType(Cmp1->
getReg(0));
8088 {TargetOpcode::G_FCMP, {CmpTy, CmpOperandTy}}) ||
8089 !
MRI.hasOneNonDBGUse(Logic->
getReg(0)) ||
8090 !
MRI.hasOneNonDBGUse(Cmp1->
getReg(0)) ||
8091 !
MRI.hasOneNonDBGUse(Cmp2->
getReg(0)) ||
8102 if (LHS0 == RHS1 && LHS1 == RHS0) {
8108 if (LHS0 == RHS0 && LHS1 == RHS1) {
8112 unsigned NewPred = IsAnd ? CmpCodeL & CmpCodeR : CmpCodeL | CmpCodeR;
8114 MatchInfo = [=](MachineIRBuilder &
B) {
8119 auto False =
B.buildConstant(CmpTy, 0);
8120 B.buildZExtOrTrunc(DestReg, False);
8127 B.buildZExtOrTrunc(DestReg, True);
8129 auto Cmp =
B.buildFCmp(Pred, CmpTy, LHS0, LHS1, Flags);
8130 B.buildZExtOrTrunc(DestReg, Cmp);
8142 if (tryFoldAndOrOrICmpsUsingRanges(
And, MatchInfo))
8145 if (tryFoldLogicOfFCmps(
And, MatchInfo))
8154 if (tryFoldAndOrOrICmpsUsingRanges(
Or, MatchInfo))
8157 if (tryFoldLogicOfFCmps(
Or, MatchInfo))
8172 bool IsSigned =
Add->isSigned();
8173 LLT DstTy =
MRI.getType(Dst);
8174 LLT CarryTy =
MRI.getType(Carry);
8177 if (
MRI.use_nodbg_empty(Carry) &&
8180 B.buildAdd(Dst, LHS, RHS);
8181 B.buildUndef(Carry);
8187 if (isConstantOrConstantVectorI(LHS) && !isConstantOrConstantVectorI(RHS)) {
8190 B.buildSAddo(Dst, Carry, RHS, LHS);
8196 B.buildUAddo(Dst, Carry, RHS, LHS);
8201 std::optional<APInt> MaybeLHS = getConstantOrConstantSplatVector(LHS);
8202 std::optional<APInt> MaybeRHS = getConstantOrConstantSplatVector(RHS);
8208 APInt Result = IsSigned ? MaybeLHS->sadd_ov(*MaybeRHS, Overflow)
8209 : MaybeLHS->uadd_ov(*MaybeRHS, Overflow);
8211 B.buildConstant(Dst, Result);
8212 B.buildConstant(Carry, Overflow);
8220 B.buildCopy(Dst, LHS);
8221 B.buildConstant(Carry, 0);
8230 if (MaybeRHS && AddLHS &&
MRI.hasOneNonDBGUse(
Add->getReg(0)) &&
8233 std::optional<APInt> MaybeAddRHS =
8234 getConstantOrConstantSplatVector(AddLHS->
getRHSReg());
8237 APInt NewC = IsSigned ? MaybeAddRHS->sadd_ov(*MaybeRHS, Overflow)
8238 : MaybeAddRHS->uadd_ov(*MaybeRHS, Overflow);
8242 auto ConstRHS =
B.buildConstant(DstTy, NewC);
8243 B.buildSAddo(Dst, Carry, AddLHS->
getLHSReg(), ConstRHS);
8249 auto ConstRHS =
B.buildConstant(DstTy, NewC);
8250 B.buildUAddo(Dst, Carry, AddLHS->
getLHSReg(), ConstRHS);
8275 B.buildConstant(Carry, 0);
8282 B.buildAdd(Dst, LHS, RHS);
8283 B.buildConstant(Carry, 1);
8295 if (
VT->computeNumSignBits(RHS) > 1 &&
VT->computeNumSignBits(LHS) > 1) {
8298 B.buildConstant(Carry, 0);
8314 B.buildConstant(Carry, 0);
8321 B.buildAdd(Dst, LHS, RHS);
8322 B.buildConstant(Carry, 1);
8340 bool OptForSize =
MI.getMF()->getFunction().hasOptSize();
8346 auto [Dst,
Base] =
MI.getFirst2Regs();
8347 LLT Ty =
MRI.getType(Dst);
8351 Builder.buildFConstant(Dst, 1.0);
8352 MI.removeFromParent();
8364 std::optional<SrcOp> Res;
8366 while (ExpVal > 0) {
8371 Res =
Builder.buildFMul(Ty, *Res, CurSquare);
8374 CurSquare =
Builder.buildFMul(Ty, CurSquare, CurSquare);
8381 Res =
Builder.buildFDiv(Ty,
Builder.buildFConstant(Ty, 1.0), *Res,
8385 MI.eraseFromParent();
8394 if (!
MRI.hasOneNonDBGUse(
Add->getReg(0)))
8401 LLT DstTy =
MRI.getType(Dst);
8404 auto Const =
B.buildConstant(DstTy, C1 - C2);
8405 B.buildAdd(Dst,
Add->getLHSReg(), Const);
8417 if (!
MRI.hasOneNonDBGUse(
Add->getReg(0)))
8424 LLT DstTy =
MRI.getType(Dst);
8427 auto Const =
B.buildConstant(DstTy, C2 - C1);
8428 B.buildSub(Dst, Const,
Add->getLHSReg());
8440 if (!
MRI.hasOneNonDBGUse(Sub2->
getReg(0)))
8447 LLT DstTy =
MRI.getType(Dst);
8450 auto Const =
B.buildConstant(DstTy, C1 + C2);
8463 if (!
MRI.hasOneNonDBGUse(Sub2->
getReg(0)))
8470 LLT DstTy =
MRI.getType(Dst);
8473 auto Const =
B.buildConstant(DstTy, C1 - C2);
8486 if (!
MRI.hasOneNonDBGUse(
Sub->getReg(0)))
8493 LLT DstTy =
MRI.getType(Dst);
8496 auto Const =
B.buildConstant(DstTy, C2 - C1);
8497 B.buildAdd(Dst,
Sub->getLHSReg(), Const);
8544 if (!
MRI.hasOneNonDBGUse(BV->getReg(0)))
8548 if (BV->getNumSources() % Unmerge->
getNumDefs() != 0)
8551 LLT BigBvTy =
MRI.getType(BV->getReg(0));
8552 LLT SmallBvTy = DstTy;
8556 {TargetOpcode::G_BUILD_VECTOR, {SmallBvTy, SmallBvElemenTy}}))
8561 {TargetOpcode::G_ANYEXT,
8573 auto AnyExt =
B.buildAnyExt(SmallBvElemenTy, SourceArray);
8574 Ops.push_back(AnyExt.getReg(0));
8592 const LLT SrcTy =
MRI.getType(Shuffle.getSrc1Reg());
8593 const unsigned NumSrcElems = SrcTy.isVector() ? SrcTy.getNumElements() : 1;
8594 const unsigned NumDstElts = OrigMask.
size();
8595 for (
unsigned i = 0; i != NumDstElts; ++i) {
8596 int Idx = OrigMask[i];
8597 if (Idx >= (
int)NumSrcElems) {
8608 B.buildShuffleVector(
MI.getOperand(0),
MI.getOperand(1),
MI.getOperand(2),
8609 std::move(NewMask));
8616 const unsigned MaskSize = Mask.size();
8617 for (
unsigned I = 0;
I < MaskSize; ++
I) {
8622 if (Idx < (
int)NumElems)
8623 Mask[
I] = Idx + NumElems;
8625 Mask[
I] = Idx - NumElems;
8635 if (
getOpcodeDef(TargetOpcode::G_IMPLICIT_DEF, Shuffle.getSrc1Reg(),
MRI))
8638 if (
getOpcodeDef(TargetOpcode::G_IMPLICIT_DEF, Shuffle.getSrc2Reg(),
MRI))
8641 const LLT DstTy =
MRI.getType(Shuffle.getReg(0));
8642 const LLT Src1Ty =
MRI.getType(Shuffle.getSrc1Reg());
8644 {TargetOpcode::G_SHUFFLE_VECTOR, {DstTy, Src1Ty}}))
8648 const unsigned NumSrcElems = Src1Ty.getNumElements();
8650 bool TouchesSrc1 =
false;
8651 bool TouchesSrc2 =
false;
8652 const unsigned NumElems = Mask.size();
8653 for (
unsigned Idx = 0; Idx < NumElems; ++Idx) {
8657 if (Mask[Idx] < (
int)NumSrcElems)
8663 if (TouchesSrc1 == TouchesSrc2)
8666 Register NewSrc1 = Shuffle.getSrc1Reg();
8669 NewSrc1 = Shuffle.getSrc2Reg();
8674 auto Undef =
B.buildUndef(Src1Ty);
8675 B.buildShuffleVector(Shuffle.getReg(0), NewSrc1,
Undef, NewMask);
8689 LLT DstTy =
MRI.getType(Dst);
8690 LLT CarryTy =
MRI.getType(Carry);
8712 B.buildConstant(Carry, 0);
8719 B.buildSub(Dst, LHS, RHS);
8737 B.buildConstant(Carry, 0);
8744 B.buildSub(Dst, LHS, RHS);
8761 CtlzMI.
getOpcode() == TargetOpcode::G_CTLZ_ZERO_POISON) &&
8762 "Expected G_CTLZ variant");
8767 LLT Ty =
MRI.getType(Dst);
8768 LLT SrcTy =
MRI.getType(Src);
8770 if (!(Ty.isValid() && Ty.isScalar()))
8779 switch (
LI->getAction(Query).Action) {
8790 bool NeedAdd =
true;
8798 unsigned BitWidth = Ty.getScalarSizeInBits();
8809 B.buildCTLS(Dst,
X);
8813 auto Ctls =
B.buildCTLS(Ty,
X);
8814 auto One =
B.buildConstant(Ty, 1);
8816 B.buildAdd(Dst, Ctls, One);
8826 unsigned TargetOpc)
const {
8827 assert((
MI.getOpcode() == TargetOpcode::G_LSHR ||
8828 MI.getOpcode() == TargetOpcode::G_ASHR) &&
8829 "Expected G_LSHR/G_ASHR");
8832 return XTy ==
MRI.getType(
Y) &&
isLegal({TargetOpc, {XTy}});
MachineInstrBuilder & UseMI
MachineInstrBuilder MachineInstrBuilder & DefMI
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
AMDGPU Register Bank Select
This file declares a class to represent arbitrary precision floating point values and provide a varie...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static const Function * getParent(const Value *V)
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static bool hasMoreUses(const MachineInstr &MI0, const MachineInstr &MI1, const MachineRegisterInfo &MRI)
static bool isContractableFMul(MachineInstr &MI, bool AllowFusionGlobally)
Checks if MI is TargetOpcode::G_FMUL and contractable either due to global flags or MachineInstr flag...
static unsigned getIndexedOpc(unsigned LdStOpc)
static APFloat constantFoldFpUnary(const MachineInstr &MI, const MachineRegisterInfo &MRI, const APFloat &Val)
static std::optional< std::pair< GZExtLoad *, int64_t > > matchLoadAndBytePosition(Register Reg, unsigned MemSizeInBits, const MachineRegisterInfo &MRI)
Helper function for findLoadOffsetsForLoadOrCombine.
static std::optional< unsigned > getMinUselessShift(KnownBits ValueKB, unsigned Opcode, std::optional< int64_t > &Result)
Return the minimum useless shift amount that results in complete loss of the source value.
static Register peekThroughBitcast(Register Reg, const MachineRegisterInfo &MRI)
static unsigned bigEndianByteAt(const unsigned ByteWidth, const unsigned I)
static cl::opt< bool > ForceLegalIndexing("force-legal-indexing", cl::Hidden, cl::init(false), cl::desc("Force all indexed operations to be " "legal for the GlobalISel combiner"))
static void commuteMask(MutableArrayRef< int > Mask, const unsigned NumElems)
static cl::opt< unsigned > PostIndexUseThreshold("post-index-use-threshold", cl::Hidden, cl::init(32), cl::desc("Number of uses of a base pointer to check before it is no longer " "considered for post-indexing."))
static std::optional< bool > isBigEndian(const SmallDenseMap< int64_t, int64_t, 8 > &MemOffset2Idx, int64_t LowestIdx)
Given a map from byte offsets in memory to indices in a load/store, determine if that map corresponds...
static unsigned getExtLoadOpcForExtend(unsigned ExtOpc)
static bool isConstValidTrue(const TargetLowering &TLI, unsigned ScalarSizeBits, int64_t Cst, bool IsVector, bool IsFP)
static LLT getMidVTForTruncRightShiftCombine(LLT ShiftTy, LLT TruncTy)
static bool canFoldInAddressingMode(GLoadStore *MI, const TargetLowering &TLI, MachineRegisterInfo &MRI)
Return true if 'MI' is a load or a store that may be fold it's address operand into the load / store ...
static unsigned littleEndianByteAt(const unsigned ByteWidth, const unsigned I)
static Register buildLogBase2(Register V, MachineIRBuilder &MIB)
Determines the LogBase2 value for a non-null input value using the transform: LogBase2(V) = (EltBits ...
This contains common combine transformations that may be used in a combine pass,or by the target else...
This contains common code to allow clients to notify changes to machine instr.
Provides analysis for querying information about KnownBits during GISel passes.
Declares convenience wrapper classes for interpreting MachineInstr instances as specific generic oper...
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
Interface for Targets to specify which operations they can successfully select and how the others sho...
static bool isConstantSplatVector(SDValue N, APInt &SplatValue, unsigned MinSizeInBits)
Implement a low-level type suitable for MachineInstr level instruction selection.
Contains matchers for matching SSA Machine Instructions.
This file declares the MachineIRBuilder class.
Promote Memory to Register
static MCRegister getReg(const MCDisassembler *D, unsigned RC, unsigned RegNo)
MachineInstr unsigned OpIdx
uint64_t IntrinsicInst * II
const SmallVectorImpl< MachineOperand > & Cond
Remove Loads Into Fake Uses
static bool isValid(const char C)
Returns true if C is a valid mangled character: <0-9a-zA-Z_>.
This file implements a set that has insertion order iteration characteristics.
This file implements the SmallBitVector class.
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
This file describes how to lower LLVM code to machine code.
static constexpr roundingMode rmTowardZero
static const fltSemantics & IEEEdouble()
static constexpr roundingMode rmTowardNegative
static constexpr roundingMode rmNearestTiesToEven
static constexpr roundingMode rmTowardPositive
static constexpr roundingMode rmNearestTiesToAway
const fltSemantics & getSemantics() const
opStatus fusedMultiplyAdd(const APFloat &Multiplicand, const APFloat &Addend, roundingMode RM)
APInt bitcastToAPInt() const
Class for arbitrary precision integers.
LLVM_ABI APInt zext(unsigned width) const
Zero extend to a new width.
uint64_t getZExtValue() const
Get zero extended value.
LLVM_ABI APInt zextOrTrunc(unsigned width) const
Zero extend or truncate to width.
LLVM_ABI APInt trunc(unsigned width) const
Truncate to new width.
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
bool isAllOnes() const
Determine if all bits are set. This is true for zero-width values.
bool ugt(const APInt &RHS) const
Unsigned greater than comparison.
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
LLVM_ABI APInt urem(const APInt &RHS) const
Unsigned remainder operation.
unsigned getBitWidth() const
Return the number of bits in the APInt.
bool ult(const APInt &RHS) const
Unsigned less than comparison.
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
bool isNegative() const
Determine sign of this APInt.
int32_t exactLogBase2() const
void ashrInPlace(unsigned ShiftAmt)
Arithmetic right-shift this APInt by ShiftAmt in place.
unsigned countr_zero() const
Count the number of trailing zero bits.
unsigned countl_zero() const
The APInt version of std::countl_zero.
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
LLVM_ABI APInt sextOrTrunc(unsigned width) const
Sign extend or truncate to width.
bool isStrictlyPositive() const
Determine if this APInt Value is positive.
LLVM_ABI APInt multiplicativeInverse() const
bool isMask(unsigned numBits) const
LLVM_ABI APInt sext(unsigned width) const
Sign extend to a new width.
bool isPowerOf2() const
Check if this APInt's value is a power of two greater than zero.
static APInt getLowBitsSet(unsigned numBits, unsigned loBitsSet)
Constructs an APInt value that has the bottom loBitsSet bits set.
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
bool isOne() const
Determine if this is a value of 1.
static APInt getOneBitSet(unsigned numBits, unsigned BitNo)
Return an APInt with exactly one bit set in the result.
int64_t getSExtValue() const
Get sign extended value.
void lshrInPlace(unsigned ShiftAmt)
Logical right-shift this APInt by ShiftAmt in place.
APInt lshr(unsigned shiftAmt) const
Logical right-shift function.
unsigned countr_one() const
Count the number of trailing one bits.
bool uge(const APInt &RHS) const
Unsigned greater or equal comparison.
Represent a constant reference to an array (0 or more elements consecutively in memory),...
size_t size() const
Get the array size.
bool isEquality() const
Determine if this is an equals/not equals predicate.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
@ FCMP_TRUE
1 1 1 1 Always true (always folded)
@ ICMP_SLT
signed less than
@ ICMP_SLE
signed less or equal
@ FCMP_OLT
0 1 0 0 True if ordered and less than
@ FCMP_ULE
1 1 0 1 True if unordered, less than, or equal
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
@ FCMP_OGE
0 0 1 1 True if ordered and greater than or equal
@ ICMP_UGE
unsigned greater or equal
@ ICMP_UGT
unsigned greater than
@ ICMP_SGT
signed greater than
@ FCMP_ULT
1 1 0 0 True if unordered or less than
@ ICMP_ULT
unsigned less than
@ FCMP_UGT
1 0 1 0 True if unordered or greater than
@ FCMP_OLE
0 1 0 1 True if ordered and less than or equal
@ ICMP_SGE
signed greater or equal
@ ICMP_ULE
unsigned less or equal
@ FCMP_UGE
1 0 1 1 True if unordered, greater than, or equal
@ FCMP_FALSE
0 0 0 0 Always false (always folded)
static LLVM_ABI bool isEquality(Predicate pred)
Determine if this is an equals/not equals predicate.
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Predicate getInversePredicate() const
For example, EQ -> NE, UGT -> ULE, SLT -> SGE, OEQ -> UNE, UGT -> OLE, OLT -> UGE,...
static LLVM_ABI bool isOrdered(Predicate predicate)
Determine if the predicate is an ordered operation.
LLVM_ABI void applyCombineBuildVectorOfBitcast(MachineInstr &MI, SmallVector< Register > &Ops) const
LLVM_ABI void applyCombineExtendingLoads(MachineInstr &MI, PreferredTuple &MatchInfo) const
LLVM_ABI bool matchCommuteShift(MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchRepeatedFPDivisor(MachineInstr &MI, SmallVector< MachineInstr * > &MatchInfo) const
LLVM_ABI bool matchFoldC2MinusAPlusC1(const MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchLoadOrCombine(MachineInstr &MI, BuildFnTy &MatchInfo) const
Match expression trees of the form.
LLVM_ABI const RegisterBank * getRegBank(Register Reg) const
Get the register bank of Reg.
LLVM_ABI void applyPtrAddZero(MachineInstr &MI) const
LLVM_ABI bool matchEqualDefs(const MachineOperand &MOP1, const MachineOperand &MOP2) const
Return true if MOP1 and MOP2 are register operands are defined by equivalent instructions.
LLVM_ABI void applyUDivOrURemByConst(MachineInstr &MI) const
LLVM_ABI bool matchConstantFoldBinOp(MachineInstr &MI, APInt &MatchInfo) const
Do constant folding when opportunities are exposed after MIR building.
LLVM_ABI void applyCombineUnmergeWithDeadLanesToTrunc(MachineInstr &MI) const
LLVM_ABI bool matchUnmergeValuesAnyExtBuildVector(const MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchCtls(MachineInstr &CtlzMI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchSelectSameVal(MachineInstr &MI) const
Optimize (cond ? x : x) -> x.
LLVM_ABI bool matchAddEToAddO(MachineInstr &MI, BuildFnTy &MatchInfo) const
Match: (G_*ADDE x, y, 0) -> (G_*ADDO x, y) (G_*SUBE x, y, 0) -> (G_*SUBO x, y)
LLVM_ABI bool matchReassocConstantInnerRHS(GPtrAdd &MI, MachineInstr *RHS, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchAVG(MachineInstr &MI, MachineRegisterInfo &MRI, Register X, Register Y, unsigned TargetOpc) const
LLVM_ABI bool matchBitfieldExtractFromShr(MachineInstr &MI, BuildFnTy &MatchInfo) const
Match: shr (shl x, n), k -> sbfx/ubfx x, pos, width.
LLVM_ABI bool matchFoldAMinusC1PlusC2(const MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchTruncSSatU(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI void applySimplifyURemByPow2(MachineInstr &MI) const
Combine G_UREM x, (known power of 2) to an add and bitmasking.
LLVM_ABI bool matchCombineUnmergeZExtToZExt(MachineInstr &MI) const
Transform X, Y = G_UNMERGE(G_ZEXT(Z)) -> X = G_ZEXT(Z); Y = G_CONSTANT 0.
LLVM_ABI bool matchPtrAddZero(MachineInstr &MI) const
}
const TargetInstrInfo * TII
LLVM_ABI void applyCombineConcatVectors(MachineInstr &MI, SmallVector< Register > &Ops) const
Replace MI with a flattened build_vector with Ops or an implicit_def if Ops is empty.
LLVM_ABI void applyXorOfAndWithSameReg(MachineInstr &MI, std::pair< Register, Register > &MatchInfo) const
LLVM_ABI bool canCombineFMadOrFMA(MachineInstr &MI, bool &AllowFusionGlobally, bool &HasFMAD, bool &Aggressive, bool CanReassociate=false) const
LLVM_ABI bool matchFoldAPlusC1MinusC2(const MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchExtractVecEltBuildVec(MachineInstr &MI, Register &Reg) const
LLVM_ABI void applyCombineUnmergeConstant(MachineInstr &MI, SmallVectorImpl< APInt > &Csts) const
LLVM_ABI bool matchShiftsTooBig(MachineInstr &MI, std::optional< int64_t > &MatchInfo) const
Match shifts greater or equal to the range (the bitwidth of the result datatype, or the effective bit...
LLVM_ABI bool matchCombineFAddFpExtFMulToFMadOrFMA(MachineInstr &MI, BuildFnTy &MatchInfo) const
Transform (fadd (fpext (fmul x, y)), z) -> (fma (fpext x), (fpext y), z) (fadd (fpext (fmul x,...
LLVM_ABI bool matchCombineIndexedLoadStore(MachineInstr &MI, IndexedLoadStoreMatchInfo &MatchInfo) const
LLVM_ABI void applyCombineShuffleConcat(MachineInstr &MI, SmallVector< Register > &Ops) const
Replace MI with a flattened build_vector with Ops or an implicit_def if Ops is empty.
LLVM_ABI void replaceSingleDefInstWithReg(MachineInstr &MI, Register Replacement) const
Delete MI and replace all of its uses with Replacement.
LLVM_ABI void applyCombineShuffleToBuildVector(MachineInstr &MI) const
Replace MI with a build_vector.
LLVM_ABI bool matchCombineExtractedVectorLoad(MachineInstr &MI, BuildFnTy &MatchInfo) const
Combine a G_EXTRACT_VECTOR_ELT of a load into a narrowed load.
LLVM_ABI void replaceRegWith(MachineRegisterInfo &MRI, Register FromReg, Register ToReg) const
MachineRegisterInfo::replaceRegWith() and inform the observer of the changes.
LLVM_ABI void replaceRegOpWith(MachineRegisterInfo &MRI, MachineOperand &FromRegOp, Register ToReg) const
Replace a single register operand with a new register and inform the observer of the changes.
LLVM_ABI void applyCombineMemCpyFamily(MachineInstr &MI, MemCpyFamilyLoweringInfo &MatchInfo) const
LLVM_ABI bool matchReassocCommBinOp(MachineInstr &MI, BuildFnTy &MatchInfo) const
Reassociate commutative binary operations like G_ADD.
LLVM_ABI void applyBuildFnMO(const MachineOperand &MO, BuildFnTy &MatchInfo) const
Use a function which takes in a MachineIRBuilder to perform a combine.
LLVM_ABI bool matchCommuteConstantToRHS(MachineInstr &MI) const
Match constant LHS ops that should be commuted.
LLVM_ABI const DataLayout & getDataLayout() const
LLVM_ABI bool matchBinOpSameVal(MachineInstr &MI) const
Optimize (x op x) -> x.
LLVM_ABI bool matchSimplifyNegMinMax(MachineInstr &MI, BuildFnTy &MatchInfo) const
Tranform (neg (min/max x, (neg x))) into (max/min x, (neg x)).
LLVM_ABI bool matchCombineDivRem(MachineInstr &MI, MachineInstr *&OtherMI) const
Try to combine G_[SU]DIV and G_[SU]REM into a single G_[SU]DIVREM when their source operands are iden...
LLVM_ABI void applyUMulHToLShr(MachineInstr &MI) const
LLVM_ABI void applyNotCmp(MachineInstr &MI, SmallVectorImpl< Register > &RegsToNegate) const
LLVM_ABI bool isLegalOrHasFewerElements(const LegalityQuery &Query) const
LLVM_ABI bool matchShiftImmedChain(MachineInstr &MI, RegisterImmPair &MatchInfo) const
Fold (shift (shift base, x), y) -> (shift base (x+y))
LLVM_ABI void applyCombineI2PToP2I(MachineInstr &MI, Register &Reg) const
LLVM_ABI bool matchTruncLshrBuildVectorFold(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI bool matchAllExplicitUsesAreUndef(MachineInstr &MI) const
Return true if all register explicit use operands on MI are defined by a G_IMPLICIT_DEF.
LLVM_ABI bool isPredecessor(const MachineInstr &DefMI, const MachineInstr &UseMI) const
Returns true if DefMI precedes UseMI or they are the same instruction.
LLVM_ABI bool matchPtrAddImmedChain(MachineInstr &MI, PtrAddChain &MatchInfo) const
LLVM_ABI bool matchTruncSSatS(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI const TargetLowering & getTargetLowering() const
LLVM_ABI bool matchShuffleUndefRHS(MachineInstr &MI, BuildFnTy &MatchInfo) const
Remove references to rhs if it is undef.
LLVM_ABI void applyBuildInstructionSteps(MachineInstr &MI, InstructionStepsMatchInfo &MatchInfo) const
Replace MI with a series of instructions described in MatchInfo.
LLVM_ABI void applySDivByPow2(MachineInstr &MI) const
LLVM_ABI void applySimplifyAddToSub(MachineInstr &MI, std::tuple< Register, Register > &MatchInfo) const
LLVM_ABI void applyUDivByPow2(MachineInstr &MI) const
Given an G_UDIV MI expressing an unsigned divided by a pow2 constant, return expressions that impleme...
LLVM_ABI bool matchOr(MachineInstr &MI, BuildFnTy &MatchInfo) const
Combine ors.
LLVM_ABI bool matchLshrOfTruncOfLshr(MachineInstr &MI, LshrOfTruncOfLshr &MatchInfo, MachineInstr &ShiftMI) const
Fold (lshr (trunc (lshr x, C1)), C2) -> trunc (shift x, (C1 + C2))
LLVM_ABI bool matchSimplifyAddToSub(MachineInstr &MI, std::tuple< Register, Register > &MatchInfo) const
Return true if MI is a G_ADD which can be simplified to a G_SUB.
LLVM_ABI void replaceInstWithConstant(MachineInstr &MI, int64_t C) const
Replace an instruction with a G_CONSTANT with value C.
LLVM_ABI bool matchCombineFSubFpExtFMulToFMadOrFMA(MachineInstr &MI, BuildFnTy &MatchInfo) const
Transform (fsub (fpext (fmul x, y)), z) -> (fma (fpext x), (fpext y), (fneg z)) (fsub (fpext (fmul x,...
LLVM_ABI void applyFsubToFneg(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI bool matchConstantLargerBitWidth(MachineInstr &MI, unsigned ConstIdx) const
Checks if constant at ConstIdx is larger than MI 's bitwidth.
LLVM_ABI void applyCombineCopy(MachineInstr &MI) const
LLVM_ABI bool matchAddSubSameReg(MachineInstr &MI, Register &Src) const
Transform G_ADD(x, G_SUB(y, x)) to y.
LLVM_ABI bool matchCombineShlOfExtend(MachineInstr &MI, RegisterImmPair &MatchData) const
LLVM_ABI void applyCombineAddP2IToPtrAdd(MachineInstr &MI, std::pair< Register, bool > &PtrRegAndCommute) const
LLVM_ABI bool matchCombineFSubFMulToFMadOrFMA(MachineInstr &MI, BuildFnTy &MatchInfo) const
Transform (fsub (fmul x, y), z) -> (fma x, y, -z) (fsub (fmul x, y), z) -> (fmad x,...
LLVM_ABI bool matchCombineFAddFMAFMulToFMadOrFMA(MachineInstr &MI, BuildFnTy &MatchInfo) const
Transform (fadd (fma x, y, (fmul u, v)), z) -> (fma x, y, (fma u, v, z)) (fadd (fmad x,...
LLVM_ABI bool matchSextTruncSextLoad(MachineInstr &MI) const
LLVM_ABI bool matchCombineMergeUnmerge(MachineInstr &MI, Register &MatchInfo) const
Fold away a merge of an unmerge of the corresponding values.
LLVM_ABI bool matchCombineInsertVecElts(MachineInstr &MI, SmallVectorImpl< Register > &MatchInfo) const
LLVM_ABI bool matchCombineBuildUnmerge(MachineInstr &MI, MachineRegisterInfo &MRI, Register &UnmergeSrc) const
LLVM_ABI bool matchDivByPow2(MachineInstr &MI, bool IsSigned) const
Given an G_SDIV MI expressing a signed divided by a pow2 constant, return expressions that implements...
LLVM_ABI bool matchNarrowBinopFeedingAnd(MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchRedundantNegOperands(MachineInstr &MI, BuildFnTy &MatchInfo) const
Transform (fadd x, fneg(y)) -> (fsub x, y) (fadd fneg(x), y) -> (fsub y, x) (fsub x,...
LLVM_ABI bool matchCombineLoadWithAndMask(MachineInstr &MI, BuildFnTy &MatchInfo) const
Match (and (load x), mask) -> zextload x.
LLVM_ABI bool matchCombineFAddFMulToFMadOrFMA(MachineInstr &MI, BuildFnTy &MatchInfo) const
Transform (fadd (fmul x, y), z) -> (fma x, y, z) (fadd (fmul x, y), z) -> (fmad x,...
LLVM_ABI bool matchCombineCopy(MachineInstr &MI) const
LLVM_ABI bool matchExtendThroughPhis(MachineInstr &MI, MachineInstr *&ExtMI) const
LLVM_ABI void applyShiftImmedChain(MachineInstr &MI, RegisterImmPair &MatchInfo) const
LLVM_ABI bool matchXorOfAndWithSameReg(MachineInstr &MI, std::pair< Register, Register > &MatchInfo) const
Fold (xor (and x, y), y) -> (and (not x), y) {.
LLVM_ABI bool matchCombineShuffleVector(MachineInstr &MI, SmallVectorImpl< Register > &Ops) const
Check if the G_SHUFFLE_VECTOR MI can be replaced by a concat_vectors.
LLVM_ABI void applyCombineConstPtrAddToI2P(MachineInstr &MI, APInt &NewCst) const
LLVM_ABI bool matchCombineAddP2IToPtrAdd(MachineInstr &MI, std::pair< Register, bool > &PtrRegAndCommute) const
Transform G_ADD (G_PTRTOINT x), y -> G_PTRTOINT (G_PTR_ADD x, y) Transform G_ADD y,...
LLVM_ABI void replaceInstWithFConstant(MachineInstr &MI, double C) const
Replace an instruction with a G_FCONSTANT with value C.
LLVM_ABI bool matchFunnelShiftToRotate(MachineInstr &MI) const
Match an FSHL or FSHR that can be combined to a ROTR or ROTL rotate.
LLVM_ABI bool matchOrShiftToFunnelShift(MachineInstr &MI, bool AllowScalarConstants, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchRedundantSExtInReg(MachineInstr &MI) const
LLVM_ABI void replaceOpcodeWith(MachineInstr &FromMI, unsigned ToOpcode) const
Replace the opcode in instruction with a new opcode and inform the observer of the changes.
LLVM_ABI void applyFunnelShiftConstantModulo(MachineInstr &MI) const
Replaces the shift amount in MI with ShiftAmt % BW.
LLVM_ABI bool matchFoldC1Minus2MinusC2(const MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI void applyCombineShlOfExtend(MachineInstr &MI, const RegisterImmPair &MatchData) const
LLVM_ABI void applyUseVectorTruncate(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI CombinerHelper(GISelChangeObserver &Observer, MachineIRBuilder &B, bool IsPreLegalize, GISelValueTracking *VT=nullptr, MachineDominatorTree *MDT=nullptr, const LegalizerInfo *LI=nullptr)
LLVM_ABI bool matchShuffleDisjointMask(MachineInstr &MI, BuildFnTy &MatchInfo) const
Turn shuffle a, b, mask -> shuffle undef, b, mask iff mask does not reference a.
LLVM_ABI bool matchCombineMulToShl(MachineInstr &MI, unsigned &ShiftVal) const
Transform a multiply by a power-of-2 value to a left shift.
LLVM_ABI void applyCombineShuffleVector(MachineInstr &MI, ArrayRef< Register > Ops) const
Replace MI with a concat_vectors with Ops.
LLVM_ABI bool matchCombineConstPtrAddToI2P(MachineInstr &MI, APInt &NewCst) const
LLVM_ABI bool matchCombineUnmergeUndef(MachineInstr &MI, std::function< void(MachineIRBuilder &)> &MatchInfo) const
Transform G_UNMERGE G_IMPLICIT_DEF -> G_IMPLICIT_DEF, G_IMPLICIT_DEF, ...
LLVM_ABI void applyFoldBinOpIntoSelect(MachineInstr &MI, const unsigned &SelectOpNo) const
SelectOperand is the operand in binary operator MI that is the select to fold.
LLVM_ABI bool matchFoldAMinusC1MinusC2(const MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI void applyCombineIndexedLoadStore(MachineInstr &MI, IndexedLoadStoreMatchInfo &MatchInfo) const
LLVM_ABI bool matchMulOBy2(MachineInstr &MI, BuildFnTy &MatchInfo) const
Match: (G_UMULO x, 2) -> (G_UADDO x, x) (G_SMULO x, 2) -> (G_SADDO x, x)
LLVM_ABI bool matchCombineShuffleConcat(MachineInstr &MI, SmallVector< Register > &Ops) const
LLVM_ABI void applySextInRegOfLoad(MachineInstr &MI, std::tuple< Register, unsigned > &MatchInfo) const
LLVM_ABI bool tryCombineCopy(MachineInstr &MI) const
If MI is COPY, try to combine it.
LLVM_ABI bool matchTruncUSatU(MachineInstr &MI, MachineInstr &MinMI) const
LLVM_ABI bool matchICmpToLHSKnownBits(MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchReassocPtrAdd(MachineInstr &MI, BuildFnTy &MatchInfo) const
Reassociate pointer calculations with G_ADD involved, to allow better addressing mode usage.
LLVM_ABI bool isPreLegalize() const
LLVM_ABI bool matchUndefShuffleVectorMask(MachineInstr &MI) const
Return true if a G_SHUFFLE_VECTOR instruction MI has an undef mask.
LLVM_ABI bool matchAnyExplicitUseIsUndef(MachineInstr &MI) const
Return true if any explicit use operand on MI is defined by a G_IMPLICIT_DEF.
LLVM_ABI bool matchCombineI2PToP2I(MachineInstr &MI, Register &Reg) const
Transform IntToPtr(PtrToInt(x)) to x if cast is in the same address space.
LLVM_ABI bool matchCombineSubToAdd(MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchShiftOfShiftedLogic(MachineInstr &MI, ShiftOfShiftedLogic &MatchInfo) const
If we have a shift-by-constant of a bitwise logic op that itself has a shift-by-constant operand with...
LLVM_ABI bool matchCombineConcatVectors(MachineInstr &MI, SmallVector< Register > &Ops) const
If MI is G_CONCAT_VECTORS, try to combine it.
LLVM_ABI bool matchInsertExtractVecEltOutOfBounds(MachineInstr &MI) const
Return true if a G_{EXTRACT,INSERT}_VECTOR_ELT has an out of range index.
LLVM_ABI bool matchExtractAllEltsFromBuildVector(MachineInstr &MI, SmallVectorImpl< std::pair< Register, MachineInstr * > > &MatchInfo) const
LLVM_ABI LLVMContext & getContext() const
LLVM_ABI void applyPtrAddImmedChain(MachineInstr &MI, PtrAddChain &MatchInfo) const
LLVM_ABI bool isConstantLegalOrBeforeLegalizer(const LLT Ty) const
LLVM_ABI bool matchNotCmp(MachineInstr &MI, SmallVectorImpl< Register > &RegsToNegate) const
Combine inverting a result of a compare into the opposite cond code.
LLVM_ABI bool matchSextInRegOfLoad(MachineInstr &MI, std::tuple< Register, unsigned > &MatchInfo) const
Match sext_inreg(load p), imm -> sextload p.
LLVM_ABI bool matchSelectIMinMax(const MachineOperand &MO, BuildFnTy &MatchInfo) const
Combine select to integer min/max.
LLVM_ABI bool matchConstantFoldUnaryIntOp(MachineInstr &MI, BuildFnTy &MatchInfo) const
Constant fold a unary integer op (G_CTLZ, G_CTTZ, G_CTPOP and their _ZERO_POISON variants,...
LLVM_ABI void applyCombineConstantFoldFpUnary(MachineInstr &MI, const ConstantFP *Cst) const
Transform fp_instr(cst) to constant result of the fp operation.
LLVM_ABI bool isLegal(const LegalityQuery &Query) const
LLVM_ABI bool matchICmpToTrueFalseKnownBits(MachineInstr &MI, int64_t &MatchInfo) const
LLVM_ABI bool matchOperandIsKnownToBeAPowerOfTwo(const MachineOperand &MO, bool OrNegative=false) const
Check if operand MO is known to be a power of 2.
LLVM_ABI bool tryReassocBinOp(unsigned Opc, Register DstReg, Register Op0, Register Op1, BuildFnTy &MatchInfo) const
Try to reassociate to reassociate operands of a commutative binop.
LLVM_ABI void eraseInst(MachineInstr &MI) const
Erase MI.
LLVM_ABI bool matchConstantFoldFPBinOp(MachineInstr &MI, ConstantFP *&MatchInfo) const
Do constant FP folding when opportunities are exposed after MIR building.
LLVM_ABI void applyBuildFnNoErase(MachineInstr &MI, BuildFnTy &MatchInfo) const
Use a function which takes in a MachineIRBuilder to perform a combine.
LLVM_ABI bool matchUseVectorTruncate(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI bool matchUndefStore(MachineInstr &MI) const
Return true if a G_STORE instruction MI is storing an undef value.
MachineRegisterInfo & MRI
LLVM_ABI void applyCombineP2IToI2P(MachineInstr &MI, Register &Reg) const
Transform PtrToInt(IntToPtr(x)) to x.
LLVM_ABI void applyExtendThroughPhis(MachineInstr &MI, MachineInstr *&ExtMI) const
LLVM_ABI bool matchConstantFPOp(const MachineOperand &MOP, double C) const
Return true if MOP is defined by a G_FCONSTANT or splat with a value exactly equal to C.
LLVM_ABI MachineInstr * buildUDivOrURemUsingMul(MachineInstr &MI) const
Given an G_UDIV MI or G_UREM MI expressing a divide by constant, return an expression that implements...
LLVM_ABI void applyExtractVecEltBuildVec(MachineInstr &MI, Register &Reg) const
LLVM_ABI bool matchFoldBinOpIntoSelect(MachineInstr &MI, unsigned &SelectOpNo) const
Push a binary operator through a select on constants.
LLVM_ABI bool tryCombineShiftToUnmerge(MachineInstr &MI, unsigned TargetShiftAmount) const
LLVM_ABI bool tryCombineExtendingLoads(MachineInstr &MI) const
If MI is extend that consumes the result of a load, try to combine it.
LLVM_ABI bool isLegalOrBeforeLegalizer(const LegalityQuery &Query) const
LLVM_ABI bool matchBuildVectorIdentityFold(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI bool matchBitfieldExtractFromShrAnd(MachineInstr &MI, BuildFnTy &MatchInfo) const
Match: shr (and x, n), k -> ubfx x, pos, width.
LLVM_ABI void applyTruncSSatS(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI bool matchConstantFoldCastOp(MachineInstr &MI, APInt &MatchInfo) const
Do constant folding when opportunities are exposed after MIR building.
LLVM_ABI void applyRotateOutOfRange(MachineInstr &MI) const
LLVM_ABI bool matchReassocFoldConstantsInSubTree(GPtrAdd &MI, MachineInstr *LHS, MachineInstr *RHS, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchHoistLogicOpWithSameOpcodeHands(MachineInstr &MI, InstructionStepsMatchInfo &MatchInfo) const
Match (logic_op (op x...), (op y...)) -> (op (logic_op x, y))
LLVM_ABI bool matchBitfieldExtractFromAnd(MachineInstr &MI, BuildFnTy &MatchInfo) const
Match: and (lshr x, cst), mask -> ubfx x, cst, width.
LLVM_ABI bool matchBitfieldExtractFromSExtInReg(MachineInstr &MI, BuildFnTy &MatchInfo) const
Form a G_SBFX from a G_SEXT_INREG fed by a right shift.
LLVM_ABI bool matchUndefSelectCmp(MachineInstr &MI) const
Return true if a G_SELECT instruction MI has an undef comparison.
LLVM_ABI bool matchAndOrDisjointMask(MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI void replaceInstWithUndef(MachineInstr &MI) const
Replace an instruction with a G_IMPLICIT_DEF.
LLVM_ABI bool matchRedundantBinOpInEquality(MachineInstr &MI, BuildFnTy &MatchInfo) const
Transform: (X + Y) == X -> Y == 0 (X - Y) == X -> Y == 0 (X ^ Y) == X -> Y == 0 (X + Y) !...
LLVM_ABI bool matchOptBrCondByInvertingCond(MachineInstr &MI, MachineInstr *&BrCond) const
If a brcond's true block is not the fallthrough, make it so by inverting the condition and swapping o...
LLVM_ABI bool matchAddOverflow(MachineInstr &MI, BuildFnTy &MatchInfo) const
Combine addos.
LLVM_ABI void applyAshShlToSextInreg(MachineInstr &MI, std::tuple< Register, int64_t > &MatchInfo) const
LLVM_ABI bool matchSelect(MachineInstr &MI, BuildFnTy &MatchInfo) const
Combine selects.
LLVM_ABI bool matchCombineExtendingLoads(MachineInstr &MI, PreferredTuple &MatchInfo) const
LLVM_ABI bool matchCombineUnmergeWithDeadLanesToTrunc(MachineInstr &MI) const
Transform X, Y<dead> = G_UNMERGE Z -> X = G_TRUNC Z.
LLVM_ABI bool matchFsubToFneg(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI bool matchRotateOutOfRange(MachineInstr &MI) const
LLVM_ABI void applyExpandFPowI(MachineInstr &MI, int64_t Exponent) const
Expands FPOWI into a series of multiplications and a division if the exponent is negative.
LLVM_ABI void setRegBank(Register Reg, const RegisterBank *RegBank) const
Set the register bank of Reg.
LLVM_ABI bool matchConstantSelectCmp(MachineInstr &MI, unsigned &OpIdx) const
Return true if a G_SELECT instruction MI has a constant comparison.
LLVM_ABI bool matchCommuteFPConstantToRHS(MachineInstr &MI) const
Match constant LHS FP ops that should be commuted.
LLVM_ABI void applyCombineDivRem(MachineInstr &MI, MachineInstr *&OtherMI) const
LLVM_ABI bool matchCombineFMinMaxNaN(MachineInstr &MI, unsigned &Info) const
LLVM_ABI bool matchRedundantOr(MachineInstr &MI, Register &Replacement) const
LLVM_ABI void applyTruncSSatU(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI void applySimplifySRemByPow2(MachineInstr &MI) const
Combine G_SREM x, (+/-2^k) to a bias-and-mask sequence.
LLVM_ABI bool matchCombineFSubFpExtFNegFMulToFMadOrFMA(MachineInstr &MI, BuildFnTy &MatchInfo) const
Transform (fsub (fpext (fneg (fmul x, y))), z) -> (fneg (fma (fpext x), (fpext y),...
LLVM_ABI bool matchTruncBuildVectorFold(MachineInstr &MI, Register &MatchInfo) const
LLVM_ABI void applyCombineTruncOfShift(MachineInstr &MI, std::pair< MachineInstr *, LLT > &MatchInfo) const
LLVM_ABI bool matchConstantOp(const MachineOperand &MOP, int64_t C) const
Return true if MOP is defined by a G_CONSTANT or splat with a value equal to C.
LLVM_ABI void applyCombineMulToShl(MachineInstr &MI, unsigned &ShiftVal) const
LLVM_ABI void applyCombineBuildUnmerge(MachineInstr &MI, MachineRegisterInfo &MRI, MachineIRBuilder &B, Register &UnmergeSrc) const
LLVM_ABI bool matchUMulHToLShr(MachineInstr &MI) const
MachineDominatorTree * MDT
LLVM_ABI void applyFunnelShiftToRotate(MachineInstr &MI) const
LLVM_ABI bool matchSimplifySelectToMinMax(MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI void applyRepeatedFPDivisor(SmallVector< MachineInstr * > &MatchInfo) const
LLVM_ABI bool matchTruncUSatUToFPTOUISat(MachineInstr &MI, MachineInstr &SrcMI) const
const RegisterBankInfo * RBI
LLVM_ABI bool matchMulOBy0(MachineInstr &MI, BuildFnTy &MatchInfo) const
Match: (G_*MULO x, 0) -> 0 + no carry out.
LLVM_ABI bool matchBinopWithNeg(MachineInstr &MI, BuildFnTy &MatchInfo) const
Fold a bitwiseop (~b +/- c) -> a bitwiseop ~(b -/+ c)
LLVM_ABI bool matchCombineUnmergeConstant(MachineInstr &MI, SmallVectorImpl< APInt > &Csts) const
Transform G_UNMERGE Constant -> Constant1, Constant2, ...
LLVM_ABI void applyShiftOfShiftedLogic(MachineInstr &MI, ShiftOfShiftedLogic &MatchInfo) const
const TargetRegisterInfo * TRI
LLVM_ABI bool matchRedundantAnd(MachineInstr &MI, Register &Replacement) const
LLVM_ABI bool dominates(const MachineInstr &DefMI, const MachineInstr &UseMI) const
Returns true if DefMI dominates UseMI.
GISelChangeObserver & Observer
LLVM_ABI void applyBuildFn(MachineInstr &MI, BuildFnTy &MatchInfo) const
Use a function which takes in a MachineIRBuilder to perform a combine.
LLVM_ABI bool matchCombineTruncOfShift(MachineInstr &MI, std::pair< MachineInstr *, LLT > &MatchInfo) const
Transform trunc (shl x, K) to shl (trunc x), K if K < VT.getScalarSizeInBits().
LLVM_ABI bool matchCombineShiftToUnmerge(MachineInstr &MI, unsigned TargetShiftSize, unsigned &ShiftVal) const
Reduce a shift by a constant to an unmerge and a shift on a half sized type.
LLVM_ABI bool matchUDivOrURemByConst(MachineInstr &MI) const
Combine G_UDIV or G_UREM by constant into a multiply by magic constant.
LLVM_ABI bool matchAnd(MachineInstr &MI, BuildFnTy &MatchInfo) const
Combine ands.
LLVM_ABI bool matchSuboCarryOut(const MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchConstantFoldFMA(MachineInstr &MI, ConstantFP *&MatchInfo) const
Constant fold G_FMA/G_FMAD.
LLVM_ABI bool matchCombineFSubFNegFMulToFMadOrFMA(MachineInstr &MI, BuildFnTy &MatchInfo) const
Transform (fsub (fneg (fmul, x, y)), z) -> (fma (fneg x), y, (fneg z)) (fsub (fneg (fmul,...
LLVM_ABI bool matchCombineZextTrunc(MachineInstr &MI, Register &Reg) const
Transform zext(trunc(x)) to x.
LLVM_ABI bool matchOperandIsUndef(MachineInstr &MI, unsigned OpIdx) const
Check if operand OpIdx is undef.
LLVM_ABI void applyLshrOfTruncOfLshr(MachineInstr &MI, LshrOfTruncOfLshr &MatchInfo) const
LLVM_ABI bool tryCombineMemCpyFamily(MachineInstr &MI, unsigned MaxLen=0) const
Optimize memcpy intrinsics et al, e.g.
LLVM_ABI bool matchFreezeOfSingleMaybePoisonOperand(MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI void applySDivOrSRemByConst(MachineInstr &MI) const
LLVM_ABI bool matchCombineMemCpyFamily(MachineInstr &MI, MemCpyFamilyLoweringInfo &MatchInfo, unsigned MaxLen=0) const
LLVM_ABI MachineInstr * buildSDivOrSRemUsingMul(MachineInstr &MI) const
Given an G_SDIV MI or G_SREM MI expressing a signed divide by constant, return an expression that imp...
LLVM_ABI bool isLegalOrHasWidenScalar(const LegalityQuery &Query) const
LLVM_ABI bool matchSubAddSameReg(MachineInstr &MI, BuildFnTy &MatchInfo) const
Transform: (x + y) - y -> x (x + y) - x -> y x - (y + x) -> 0 - y x - (x + z) -> 0 - z.
LLVM_ABI bool matchReassocConstantInnerLHS(GPtrAdd &MI, MachineInstr *LHS, MachineInstr *RHS, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchOverlappingAnd(MachineInstr &MI, BuildFnTy &MatchInfo) const
Fold and(and(x, C1), C2) -> C1&C2 ? and(x, C1&C2) : 0.
LLVM_ABI bool matchCombineAnyExtTrunc(MachineInstr &MI, Register &Reg) const
Transform anyext(trunc(x)) to x.
LLVM_ABI void applyExtractAllEltsFromBuildVector(MachineInstr &MI, SmallVectorImpl< std::pair< Register, MachineInstr * > > &MatchInfo) const
MachineIRBuilder & Builder
LLVM_ABI void applyCommuteBinOpOperands(MachineInstr &MI) const
LLVM_ABI void replaceSingleDefInstWithOperand(MachineInstr &MI, unsigned OpIdx) const
Delete MI and replace all of its uses with its OpIdx-th operand.
LLVM_ABI void applySextTruncSextLoad(MachineInstr &MI) const
LLVM_ABI const MachineFunction & getMachineFunction() const
LLVM_ABI bool matchCombineBuildVectorOfBitcast(MachineInstr &MI, SmallVector< Register > &Ops) const
Combine G_BUILD_VECTOR(G_UNMERGE(G_BITCAST), Undef) to G_BITCAST(G_BUILD_VECTOR(.....
LLVM_ABI bool matchCombineFAddFpExtFMulToFMadOrFMAAggressive(MachineInstr &MI, BuildFnTy &MatchInfo) const
LLVM_ABI bool matchSDivOrSRemByConst(MachineInstr &MI) const
Combine G_SDIV or G_SREM by constant into a multiply by magic constant.
LLVM_ABI void applyOptBrCondByInvertingCond(MachineInstr &MI, MachineInstr *&BrCond) const
LLVM_ABI void applyCombineShiftToUnmerge(MachineInstr &MI, const unsigned &ShiftVal) const
LLVM_ABI bool matchFPowIExpansion(MachineInstr &MI, int64_t Exponent) const
Match FPOWI if it's safe to extend it into a series of multiplications.
LLVM_ABI void applyCombineInsertVecElts(MachineInstr &MI, SmallVectorImpl< Register > &MatchInfo) const
LLVM_ABI bool matchCombineUnmergeMergeToPlainValues(MachineInstr &MI, SmallVectorImpl< Register > &Operands) const
Transform <ty,...> G_UNMERGE(G_MERGE ty X, Y, Z) -> ty X, Y, Z.
LLVM_ABI void applyCombineUnmergeMergeToPlainValues(MachineInstr &MI, SmallVectorImpl< Register > &Operands) const
LLVM_ABI bool matchAshrShlToSextInreg(MachineInstr &MI, std::tuple< Register, int64_t > &MatchInfo) const
Match ashr (shl x, C), C -> sext_inreg (C)
LLVM_ABI void applyCombineUnmergeZExtToZExt(MachineInstr &MI) const
ConstantFP - Floating Point Values [float, double].
const APFloat & getValue() const
const APFloat & getValueAPF() const
const APInt & getValue() const
Return the constant as an APInt value reference.
This class represents a range of values.
LLVM_ABI std::optional< ConstantRange > exactUnionWith(const ConstantRange &CR) const
Union the two ranges and return the result if it can be represented exactly, otherwise return std::nu...
LLVM_ABI ConstantRange subtract(const APInt &CI) const
Subtract the specified constant from the endpoints of this constant range.
static LLVM_ABI ConstantRange fromKnownBits(const KnownBits &Known, bool IsSigned)
Initialize a range based on a known bits constraint.
const APInt & getLower() const
Return the lower value for this range.
LLVM_ABI OverflowResult unsignedSubMayOverflow(const ConstantRange &Other) const
Return whether unsigned sub of the two ranges always/never overflows.
LLVM_ABI OverflowResult unsignedAddMayOverflow(const ConstantRange &Other) const
Return whether unsigned add of the two ranges always/never overflows.
LLVM_ABI bool isWrappedSet() const
Return true if this set wraps around the unsigned domain.
const APInt & getUpper() const
Return the upper value for this range.
static LLVM_ABI ConstantRange makeExactICmpRegion(CmpInst::Predicate Pred, const APInt &Other)
Produce the exact range such that all values in the returned range satisfy the given predicate with a...
LLVM_ABI OverflowResult signedAddMayOverflow(const ConstantRange &Other) const
Return whether signed add of the two ranges always/never overflows.
@ NeverOverflows
Never overflows.
@ AlwaysOverflowsHigh
Always overflows in the direction of signed/unsigned max value.
@ AlwaysOverflowsLow
Always overflows in the direction of signed/unsigned min value.
@ MayOverflow
May or may not overflow.
LLVM_ABI OverflowResult signedSubMayOverflow(const ConstantRange &Other) const
Return whether signed sub of the two ranges always/never overflows.
This is an important base class in LLVM.
A parsed version of the target data layout string in and methods for querying it.
ValueT lookup(const_arg_type_t< KeyT > Val) const
Return the entry for the specified key, or a default constructed value if no such entry exists.
iterator find(const_arg_type_t< KeyT > Val)
std::pair< iterator, bool > try_emplace(KeyT &&Key, Ts &&...Args)
LLVMContext & getContext() const
getContext - Return a reference to the LLVMContext associated with this function.
Represents overflowing add operations.
Represents an integer addition.
Represents a logical and.
CmpInst::Predicate getCond() const
Register getLHSReg() const
Register getRHSReg() const
Represents any generic load, including sign/zero extending variants.
Register getDstReg() const
Get the definition register of the loaded value.
Register getCarryOutReg() const
Register getRHSReg() const
Register getLHSReg() const
Register getLHSReg() const
Register getRHSReg() const
Represents a G_BUILD_VECTOR.
Abstract class that contains various methods for clients to notify about changes.
Simple wrapper observer that takes several observers, and calls each one for each event.
Represents any type of generic load or store.
Register getPointerReg() const
Get the source register of the pointer value.
Represents a logical binary operation.
MachineMemOperand & getMMO() const
Get the MachineMemOperand on this instruction.
bool isAtomic() const
Returns true if the attached MachineMemOperand has the atomic flag set.
LocationSize getMemSizeInBits() const
Returns the size in bits of the memory access.
bool isSimple() const
Returns true if the memory operation is neither atomic or volatile.
Register getSourceReg(unsigned I) const
Returns the I'th source register.
unsigned getNumSources() const
Returns the number of source registers.
Represents a G_MERGE_VALUES.
Register getCondReg() const
Represents overflowing sub operations.
Represents an integer subtraction.
Represents a G_UNMERGE_VALUES.
unsigned getNumDefs() const
Returns the number of def registers.
Register getSourceReg() const
Get the unmerge source register.
Register getReg(unsigned Idx) const
Access the Idx'th operand as a register and return it.
static LLVM_ABI bool compare(const APInt &LHS, const APInt &RHS, ICmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
constexpr bool isScalableVector() const
Returns true if the LLT is a scalable vector.
constexpr unsigned getScalarSizeInBits() const
constexpr bool isScalar() const
constexpr LLT changeElementType(LLT NewEltTy) const
If this type is a vector, return a vector with the same number of elements but the new element type.
static constexpr LLT vector(ElementCount EC, unsigned ScalarSizeInBits)
Get a low-level vector of some number of elements and element width.
LLT getScalarType() const
static constexpr LLT scalar(unsigned SizeInBits)
Get a low-level scalar or aggregate "bag of bits".
constexpr bool isValid() const
constexpr uint16_t getNumElements() const
Returns the number of elements in a vector LLT.
constexpr bool isVector() const
constexpr bool isByteSized() const
constexpr TypeSize getSizeInBits() const
Returns the total size of the type. Must only be called on sized types.
constexpr bool isPointer() const
constexpr ElementCount getElementCount() const
static constexpr LLT fixed_vector(unsigned NumElements, unsigned ScalarSizeInBits)
Get a low-level fixed-width vector of some number of elements and element width.
constexpr bool isPointerOrPointerVector() const
constexpr bool isFixedVector() const
Returns true if the LLT is a fixed vector.
static LLT integer(unsigned SizeInBits)
constexpr TypeSize getSizeInBytes() const
Returns the total size of the type in bytes, i.e.
LLT getElementType() const
Returns the vector's element type. Only valid for vector types.
LLT changeElementSize(unsigned NewEltSize) const
If this type is a vector, return a vector with the same number of elements but the new element size.
This is an important class for using LLVM in a threaded context.
LLVM_ABI LegalizeResult lowerMemCpyFamily(MachineInstr &MI, Register Dst, Register Src, uint64_t KnownLen, Align Alignment, bool DstAlignCanChange, ArrayRef< LLT > MemOps)
@ Legalized
Instruction has been legalized and the MachineFunction changed.
LLVM_ABI Register getVectorElementPointer(Register VecPtr, LLT VecTy, Register Index)
Get a pointer to vector element Index located in memory for a vector of type VecTy starting at a base...
TypeSize getValue() const
const MCInstrDesc & get(unsigned Opcode) const
Return the machine instruction descriptor that corresponds to the specified instruction opcode.
LLVM_ABI iterator getFirstNonPHI()
Returns a pointer to the first instruction in this block that is not a PHINode instruction.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
MachineInstrBundleIterator< MachineInstr > iterator
DominatorTree Class - Concrete subclass of DominatorTreeBase that is used to compute a normal dominat...
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
const DataLayout & getDataLayout() const
Return the DataLayout attached to the Module associated to this MF.
Function & getFunction()
Return the LLVM function that this machine code represents.
Helper class to build MachineInstr.
const TargetInstrInfo & getTII()
MachineInstrBuilder buildSub(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_SUB Op0, Op1.
MachineInstrBuilder buildCTLZ(const DstOp &Dst, const SrcOp &Src0)
Build and insert Res = G_CTLZ Op0, Src0.
MachineFunction & getMF()
Getter for the function we currently build.
MachineRegisterInfo * getMRI()
Getter for MRI.
virtual MachineInstrBuilder buildConstant(const DstOp &Res, const ConstantInt &Val)
Build and insert Res = G_CONSTANT Val.
Register getReg(unsigned Idx) const
Get the register for the operand index.
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
bool mayLoadOrStore(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read or modify memory.
const MachineBasicBlock * getParent() const
LLVM_ABI bool isDereferenceableInvariantLoad() const
Return true if this load instruction never traps and points to a memory location whose value doesn't ...
bool getFlag(MIFlag Flag) const
Return whether an MI flag is set.
unsigned getNumOperands() const
Retuns the total number of operands.
LLVM_ABI void setDesc(const MCInstrDesc &TID)
Replace the instruction descriptor (thus opcode) of the current instruction with a new one.
mop_range uses()
Returns all operands which may be register uses.
MachineOperand * findRegisterUseOperand(Register Reg, const TargetRegisterInfo *TRI, bool isKill=false)
Wrapper for findRegisterUseOperandIdx, it returns a pointer to the MachineOperand rather than an inde...
const MachineOperand & getOperand(unsigned i) const
uint32_t getFlags() const
Return the MI flags bitvector.
LLVM_ABI int findRegisterDefOperandIdx(Register Reg, const TargetRegisterInfo *TRI, bool isDead=false, bool Overlap=false) const
Returns the operand index that is a def of the specified register or -1 if it is not found.
LLVM_ABI MachineInstrBundleIterator< MachineInstr > eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
A description of a memory reference used in the backend.
LLT getMemoryType() const
Return the memory type of the memory reference.
unsigned getAddrSpace() const
const MachinePointerInfo & getPointerInfo() const
LLVM_ABI Align getAlign() const
Return the minimum known alignment in bytes of the actual memory reference.
MachineOperand class - Representation of each machine instruction operand.
const ConstantInt * getCImm() const
bool isReg() const
isReg - Tests if this is a MO_Register operand.
MachineBasicBlock * getMBB() const
LLVM_ABI void setReg(Register Reg)
Change the register this operand corresponds to.
MachineInstr * getParent()
getParent - Return the instruction that this operand belongs to.
void setMBB(MachineBasicBlock *MBB)
void setPredicate(unsigned Predicate)
Register getReg() const
getReg - Returns the register number.
const ConstantFP * getFPImm() const
unsigned getPredicate() const
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLVM_ABI bool hasOneNonDBGUse(Register RegNo) const
hasOneNonDBGUse - Return true if there is exactly one non-Debug use of the specified register.
LLVM_ABI MachineInstr * getVRegDef(Register Reg) const
getVRegDef - Return the machine instr that defines the specified virtual register or null if none is ...
bool use_nodbg_empty(Register RegNo) const
use_nodbg_empty - Return true if there are no non-Debug instructions using the specified register.
LLT getType(Register Reg) const
Get the low-level type of Reg or LLT{} if Reg is not a generic (target independent) virtual register.
use_instr_nodbg_iterator use_instr_nodbg_begin(Register RegNo) const
iterator_range< use_instr_nodbg_iterator > use_nodbg_instructions(Register Reg) const
static use_instr_nodbg_iterator use_instr_nodbg_end()
Represent a mutable reference to an array (0 or more elements consecutively in memory),...
This class implements the register bank concept.
Wrapper class representing virtual and physical registers.
constexpr bool isValid() const
size_type size() const
Determine the number of elements in the SetVector.
size_type count(const_arg_type key) const
Count the number of elements of a given key in the SetVector.
bool insert(const value_type &X)
Insert a new element into the SetVector.
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
bool all() const
Returns true if all bits are set.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
A SetVector that performs no allocations if smaller than a certain size.
std::pair< const_iterator, bool > insert(const T &V)
insert - Insert an element into the set if it isn't already there.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
reference emplace_back(ArgTypes &&... Args)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
virtual bool isZExtFree(Type *FromTy, Type *ToTy) const
Return true if any actual instruction that defines a value of type FromTy implicitly zero-extends the...
virtual bool isTruncateFree(Type *FromTy, Type *ToTy) const
Return true if it's free to truncate a value of type FromTy to type ToTy.
virtual LLVM_READONLY LLT getPreferredShiftAmountTy(LLT ShiftValueTy) const
Return the preferred type to use for a shift opcode, given the shifted amount type is ShiftValueTy.
bool isBeneficialToExpandPowI(int64_t Exponent, bool OptForSize) const
Return true if it is beneficial to expand an @llvm.powi.
virtual bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM, Type *Ty, unsigned AddrSpace, Instruction *I=nullptr) const
Return true if the addressing mode represented by AM is legal for this target, for a load/store of th...
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
virtual unsigned combineRepeatedFPDivisors() const
Indicate whether this target prefers to combine FDIVs with the same divisor.
virtual const TargetLowering * getTargetLowering() const
The instances of the Type class are immutable: once they are created, they are never changed.
A Use represents the edge between a Value definition and its users.
constexpr bool isKnownMultipleOf(ScalarTy RHS) const
This function tells the caller whether the element count is known at compile time to be a multiple of...
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
self_iterator getIterator()
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ Fast
Attempts to make calls as fast as possible (e.g.
@ C
The default llvm calling convention, compatible with C.
@ FewerElements
The (vector) operation should be implemented by splitting it into sub-vectors where the operation is ...
@ Legal
The operation is expected to be selectable directly by the target, and no transformation is necessary...
@ WidenScalar
The operation should be implemented in terms of a wider scalar base-type.
@ Custom
The target wants to do something special with this combination of operand and type.
operand_type_match m_Reg()
SpecificConstantMatch m_SpecificICst(const APInt &RequestedValue)
Matches a constant equal to RequestedValue.
BinaryOp_match< LHS, RHS, TargetOpcode::G_BUILD_VECTOR, false > m_GBuildVector(const LHS &L, const RHS &R)
GCstAndRegMatch m_GCst(std::optional< ValueAndVReg > &ValReg)
operand_type_match m_Pred()
BinaryOp_match< LHS, RHS, TargetOpcode::G_UMIN, true > m_GUMin(const LHS &L, const RHS &R)
UnaryOp_match< SrcTy, TargetOpcode::G_ZEXT > m_GZExt(const SrcTy &Src)
BinaryOp_match< LHS, RHS, TargetOpcode::G_XOR, true > m_GXor(const LHS &L, const RHS &R)
UnaryOp_match< SrcTy, TargetOpcode::G_SEXT > m_GSExt(const SrcTy &Src)
UnaryOp_match< SrcTy, TargetOpcode::G_FPEXT > m_GFPExt(const SrcTy &Src)
ConstantMatch< APInt > m_ICst(APInt &Cst)
UnaryOp_match< SrcTy, TargetOpcode::G_INTTOPTR > m_GIntToPtr(const SrcTy &Src)
BinaryOp_match< LHS, RHS, TargetOpcode::G_ADD, true > m_GAdd(const LHS &L, const RHS &R)
BinaryOp_match< LHS, RHS, TargetOpcode::G_OR, true > m_GOr(const LHS &L, const RHS &R)
BinaryOp_match< SpecificConstantMatch, SrcTy, TargetOpcode::G_SUB > m_Neg(const SrcTy &&Src)
Matches a register negated by a G_SUB.
ICstOrSplatMatch< APInt > m_ICstOrSplat(APInt &Cst)
ImplicitDefMatch m_GImplicitDef()
OneNonDBGUse_match< SubPat > m_OneNonDBGUse(const SubPat &SP)
CheckType m_SpecificType(LLT Ty)
deferred_ty< Register > m_DeferredReg(Register &R)
Similar to m_SpecificReg/Type, but the specific value to match originated from an earlier sub-pattern...
BinaryOp_match< LHS, RHS, TargetOpcode::G_UMAX, true > m_GUMax(const LHS &L, const RHS &R)
BinaryOp_match< SrcTy, SpecificConstantMatch, TargetOpcode::G_XOR, true > m_Not(const SrcTy &&Src)
Matches a register not-ed by a G_XOR.
BinaryOp_match< LHS, RHS, TargetOpcode::G_FADD, true > m_GFAdd(const LHS &L, const RHS &R)
UnaryOp_match< SrcTy, TargetOpcode::G_PTRTOINT > m_GPtrToInt(const SrcTy &Src)
BinaryOp_match< LHS, RHS, TargetOpcode::G_FSUB, false > m_GFSub(const LHS &L, const RHS &R)
BinaryOp_match< LHS, RHS, TargetOpcode::G_SUB > m_GSub(const LHS &L, const RHS &R)
BinaryOp_match< LHS, RHS, TargetOpcode::G_ASHR, false > m_GAShr(const LHS &L, const RHS &R)
bool mi_match(Reg R, const MachineRegisterInfo &MRI, Pattern &&P)
BinaryOp_match< LHS, RHS, TargetOpcode::G_PTR_ADD, false > m_GPtrAdd(const LHS &L, const RHS &R)
BinaryOp_match< LHS, RHS, TargetOpcode::G_SHL, false > m_GShl(const LHS &L, const RHS &R)
Or< Preds... > m_any_of(Preds &&... preds)
SpecificConstantOrSplatMatch m_SpecificICstOrSplat(const APInt &RequestedValue)
Matches a RequestedValue constant or a constant splat of RequestedValue.
BinaryOp_match< LHS, RHS, TargetOpcode::G_AND, true > m_GAnd(const LHS &L, const RHS &R)
UnaryOp_match< SrcTy, TargetOpcode::G_BITCAST > m_GBitcast(const SrcTy &Src)
BinaryOp_match< LHS, RHS, TargetOpcode::G_BUILD_VECTOR_TRUNC, false > m_GBuildVectorTrunc(const LHS &L, const RHS &R)
bind_ty< MachineInstr * > m_MInstr(MachineInstr *&MI)
UnaryOp_match< SrcTy, TargetOpcode::G_FNEG > m_GFNeg(const SrcTy &Src)
CompareOp_match< Pred, LHS, RHS, TargetOpcode::G_ICMP, true > m_c_GICmp(const Pred &P, const LHS &L, const RHS &R)
G_ICMP matcher that also matches commuted compares.
TernaryOp_match< Src0Ty, Src1Ty, Src2Ty, TargetOpcode::G_INSERT_VECTOR_ELT > m_GInsertVecElt(const Src0Ty &Src0, const Src1Ty &Src1, const Src2Ty &Src2)
GFCstOrSplatGFCstMatch m_GFCstOrSplat(std::optional< FPValueAndVReg > &FPValReg)
And< Preds... > m_all_of(Preds &&... preds)
BinaryOp_match< LHS, RHS, TargetOpcode::G_SMIN, true > m_GSMin(const LHS &L, const RHS &R)
BinaryOp_match< LHS, RHS, TargetOpcode::G_LSHR, false > m_GLShr(const LHS &L, const RHS &R)
UnaryOp_match< SrcTy, TargetOpcode::G_ANYEXT > m_GAnyExt(const SrcTy &Src)
OneUse_match< SubPat > m_OneUse(const SubPat &SP)
UnaryOp_match< SrcTy, TargetOpcode::G_TRUNC > m_GTrunc(const SrcTy &Src)
BinaryOp_match< LHS, RHS, TargetOpcode::G_SMAX, true > m_GSMax(const LHS &L, const RHS &R)
CompareOp_match< Pred, LHS, RHS, TargetOpcode::G_FCMP > m_GFCmp(const Pred &P, const LHS &L, const RHS &R)
auto m_BinOp()
Match an arbitrary binary operation and ignore it.
Not(const Pred &P) -> Not< Pred >
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
FunctionAddr VTableAddr Value
LLVM_ABI bool isBuildVectorAllZeros(const MachineInstr &MI, const MachineRegisterInfo &MRI, bool AllowUndef=false)
Return true if the specified instruction is a G_BUILD_VECTOR or G_BUILD_VECTOR_TRUNC where all of the...
LLVM_ABI Type * getTypeForLLT(LLT Ty, LLVMContext &C)
Get the type back from LLT.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI MachineInstr * getOpcodeDef(unsigned Opcode, Register Reg, const MachineRegisterInfo &MRI)
See if Reg is defined by an single def instruction that is Opcode.
static double log2(double V)
LLVM_ABI const ConstantFP * getConstantFPVRegVal(Register VReg, const MachineRegisterInfo &MRI)
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
LLVM_ABI std::optional< APInt > getIConstantVRegVal(Register VReg, const MachineRegisterInfo &MRI)
If VReg is defined by a G_CONSTANT, return the corresponding value.
LLVM_ABI std::optional< APInt > getIConstantSplatVal(const Register Reg, const MachineRegisterInfo &MRI)
LLVM_ABI bool isAllOnesOrAllOnesSplat(const MachineInstr &MI, const MachineRegisterInfo &MRI, bool AllowUndefs=false)
Return true if the value is a constant -1 integer or a splatted vector of a constant -1 integer (with...
@ Undef
Value of the register doesn't matter.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
int countr_one(T Value)
Count the number of ones from the least significant bit to the first zero bit.
std::function< void(MachineIRBuilder &)> BuildFnTy
LLVM_ABI const llvm::fltSemantics & getFltSemanticForLLT(LLT Ty)
Get the appropriate floating point arithmetic semantic based on the bit size of the given scalar LLT.
LLVM_ABI std::optional< APFloat > ConstantFoldFPBinOp(unsigned Opcode, const Register Op1, const Register Op2, const MachineRegisterInfo &MRI)
LLVM_ABI MVT getMVTForLLT(LLT Ty)
Get a rough equivalent of an MVT for a given LLT.
LLVM_ABI std::optional< APInt > isConstantOrConstantSplatVector(MachineInstr &MI, const MachineRegisterInfo &MRI)
Determines if MI defines a constant integer or a splat vector of constant integers.
LLVM_ABI bool isNullOrNullSplat(const MachineInstr &MI, const MachineRegisterInfo &MRI, bool AllowUndefs=false)
Return true if the value is a constant 0 integer or a splatted vector of a constant 0 integer (with n...
LLVM_ABI MachineInstr * getDefIgnoringCopies(Register Reg, const MachineRegisterInfo &MRI)
Find the def instruction for Reg, folding away any trivial copies.
LLVM_ABI bool matchUnaryPredicate(const MachineRegisterInfo &MRI, Register Reg, std::function< bool(const Constant *ConstVal)> Match, bool AllowUndefs=false)
Attempt to match a unary predicate against a scalar/splat constant or every element of a constant G_B...
LLVM_ABI bool isConstTrueVal(const TargetLowering &TLI, int64_t Val, bool IsVector, bool IsFP)
Returns true if given the TargetLowering's boolean contents information, the value Val contains a tru...
LLVM_ABI std::optional< APInt > ConstantFoldBinOp(unsigned Opcode, const Register Op1, const Register Op2, const MachineRegisterInfo &MRI)
constexpr bool has_single_bit(T Value) noexcept
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI const APInt & getIConstantFromReg(Register VReg, const MachineRegisterInfo &MRI)
VReg is defined by a G_CONSTANT, return the corresponding value.
LLVM_ABI bool isConstantOrConstantVector(const MachineInstr &MI, const MachineRegisterInfo &MRI, bool AllowFP=true, bool AllowOpaqueConstants=true)
Return true if the specified instruction is known to be a constant, or a vector of constants.
SmallVector< std::function< void(MachineInstrBuilder &)>, 4 > OperandBuildSteps
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
LLVM_ABI bool canReplaceReg(Register DstReg, Register SrcReg, MachineRegisterInfo &MRI)
Check if DstReg can be replaced with SrcReg depending on the register constraints.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
std::tuple< Register, Register, uint64_t, Align, bool, std::vector< LLT > > MemCpyFamilyLoweringInfo
constexpr bool isMask_64(uint64_t Value)
Return true if the argument is a non-empty sequence of ones starting at the least significant bit wit...
LLVM_ABI bool canCreateUndefOrPoison(const Operator *Op, bool ConsiderFlagsAndMetadata=true)
canCreateUndefOrPoison returns true if Op can create undef or poison from non-undef & non-poison oper...
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
auto instructionsWithoutDebug(IterT It, IterT End, bool SkipPseudoOp=true)
Construct a range iterator which begins at It and moves forwards until End is reached,...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
LLVM_ABI std::optional< FPValueAndVReg > getFConstantSplat(Register VReg, const MachineRegisterInfo &MRI, bool AllowUndef=true)
Returns a floating point scalar constant of a build vector splat if it exists.
LLVM_ABI EVT getApproximateEVTForLLT(LLT Ty, LLVMContext &Ctx)
LLVM_ABI std::optional< APInt > ConstantFoldCastOp(unsigned Opcode, LLT DstTy, const Register Op0, const MachineRegisterInfo &MRI)
LLVM_ABI bool canLowerMemCpyFamily(const MachineInstr &MI, const MachineRegisterInfo &MRI, unsigned MaxLen, Register &Dst, Register &Src, uint64_t &KnownLen, Align &Alignment, bool &DstAlignCanChange, std::vector< LLT > &MemOps)
Matcher for memcpy-like instructions.
LLVM_ABI unsigned getInverseGMinMaxOpcode(unsigned MinMaxOpc)
Returns the inverse opcode of MinMaxOpc, which is a generic min/max opcode like G_SMIN.
@ Xor
Bitwise or logical XOR of integers.
@ And
Bitwise or logical AND of integers.
@ Sub
Subtraction of integers.
DWARFExpression::Operation Op
LLVM_ABI bool isGuaranteedNotToBeUndefOrPoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Return true if this function can prove that V does not have undef bits and is never poison.
LLVM_ABI std::optional< FPValueAndVReg > getFConstantVRegValWithLookThrough(Register VReg, const MachineRegisterInfo &MRI, bool LookThroughInstrs=true)
If VReg is defined by a statically evaluable chain of instructions rooted on a G_FCONSTANT returns it...
LLVM_ABI std::optional< APFloat > isConstantOrConstantSplatVectorFP(MachineInstr &MI, const MachineRegisterInfo &MRI)
Determines if MI defines a float constant integer or a splat vector of float constant integers.
constexpr unsigned BitWidth
LLVM_ABI int64_t getICmpTrueVal(const TargetLowering &TLI, bool IsVector, bool IsFP)
Returns an integer representing true, as defined by the TargetBooleanContents.
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
LLVM_ABI std::optional< ValueAndVReg > getIConstantVRegValWithLookThrough(Register VReg, const MachineRegisterInfo &MRI, bool LookThroughInstrs=true)
If VReg is defined by a statically evaluable chain of instructions rooted on a G_CONSTANT returns its...
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
iterator_range< pointer_iterator< WrappedIteratorT > > make_pointer_range(RangeT &&Range)
LLVM_ABI std::optional< DefinitionAndSourceRegister > getDefSrcRegIgnoringCopies(Register Reg, const MachineRegisterInfo &MRI)
Find the def instruction for Reg, and underlying value Register folding away any copies.
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
LLVM_ABI SmallVector< APInt > ConstantFoldUnaryIntOp(unsigned Opcode, LLT DstTy, Register Src, const MachineRegisterInfo &MRI)
Tries to constant fold a unary integer operation (G_CTLZ, G_CTTZ, G_CTPOP and their _ZERO_POISON vari...
LLVM_ABI bool isKnownToBeAPowerOfTwo(const Value *V, const DataLayout &DL, bool OrZero=false, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Return true if the given value is known to have exactly one bit set when defined.
LLVM_ABI Register getSrcRegIgnoringCopies(Register Reg, const MachineRegisterInfo &MRI)
Find the source register for Reg, folding away any trivial copies.
constexpr T maskTrailingOnes(unsigned N)
Create a bitmask with the N right-most bits set to 1, and all other bits set to 0.
unsigned getFCmpCode(CmpInst::Predicate CC)
Similar to getICmpCode but for FCmpInst.
LLVM_ABI std::optional< int64_t > getIConstantSplatSExtVal(const Register Reg, const MachineRegisterInfo &MRI)
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
This struct is a compact representation of a valid (non-zero power of two) alignment.
Simple struct used to hold a Register value and the instruction which defines it.
SmallVector< InstructionBuildSteps, 2 > InstrsToBuild
Describes instructions to be built during a combine.
bool isNonNegative() const
Returns true if this value is known to be non-negative.
unsigned countMinLeadingOnes() const
Returns the minimum number of leading one bits.
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
bool isUnknown() const
Returns true if we don't know any bits.
unsigned getBitWidth() const
Get the bit width of this value.
unsigned countMinLeadingZeros() const
Returns the minimum number of leading zero bits.
APInt getMaxValue() const
Return the maximal unsigned value possible given these KnownBits.
bool isNegative() const
Returns true if this value is known to be negative.
The LegalityQuery object bundles together all the information that's needed to decide whether a given...
This class contains a discriminated union of information about pointers in memory operands,...
LLVM_ABI unsigned getAddrSpace() const
Return the LLVM IR address space number that this pointer points into.
MachinePointerInfo getWithOffset(int64_t O) const
const RegisterBank * Bank
Register LogicNonShiftReg
Magic data for optimising signed division by a constant.
unsigned ShiftAmount
shift amount
static LLVM_ABI SignedDivisionByConstantInfo get(const APInt &D)
Calculate the magic numbers required to implement a signed integer division by a constant as a sequen...
This represents an addressing mode of: BaseGV + BaseOffs + BaseReg + Scale*ScaleReg + ScalableOffset*...
Magic data for optimising unsigned division by a constant.
unsigned PreShift
pre-shift amount
unsigned PostShift
post-shift amount
static LLVM_ABI UnsignedDivisionByConstantInfo get(const APInt &D, unsigned LeadingZeros=0, bool AllowEvenDivisorOptimization=true, bool AllowWidenOptimization=false)
Calculate the magic numbers required to implement an unsigned integer division by a constant as a seq...