53#define DEBUG_TYPE "x86-instr-info"
55#define GET_INSTRINFO_CTOR_DTOR
56#include "X86GenInstrInfo.inc"
62 cl::desc(
"Disable fusing of spill code into instructions"),
66 cl::desc(
"Print instructions that the allocator wants to"
67 " fuse, but the X86 backend currently can't"),
71 cl::desc(
"Re-materialize load from stub in PIC mode"),
75 cl::desc(
"Clearance between two register writes "
76 "for inserting XOR to avoid partial "
80 "undef-reg-clearance",
81 cl::desc(
"How many idle instructions we would like before "
82 "certain undef register reads"),
86void X86InstrInfo::anchor() {}
90 (STI.isTarget64BitLP64() ?
X86::ADJCALLSTACKDOWN64
91 :
X86::ADJCALLSTACKDOWN32),
92 (STI.isTarget64BitLP64() ?
X86::ADJCALLSTACKUP64
93 :
X86::ADJCALLSTACKUP32),
95 Subtarget(STI), RI(STI.getTargetTriple()) {}
98 unsigned OpNum)
const {
102 if (!RC || !Subtarget.hasEGPR())
114 unsigned &SubIdx)
const {
115 switch (
MI.getOpcode()) {
118 case X86::MOVSX16rr8:
119 case X86::MOVZX16rr8:
120 case X86::MOVSX32rr8:
121 case X86::MOVZX32rr8:
122 case X86::MOVSX64rr8:
123 if (!Subtarget.is64Bit())
128 case X86::MOVSX32rr16:
129 case X86::MOVZX32rr16:
130 case X86::MOVSX64rr16:
131 case X86::MOVSX64rr32: {
132 if (
MI.getOperand(0).getSubReg() ||
MI.getOperand(1).getSubReg())
135 SrcReg =
MI.getOperand(1).getReg();
136 DstReg =
MI.getOperand(0).getReg();
137 switch (
MI.getOpcode()) {
140 case X86::MOVSX16rr8:
141 case X86::MOVZX16rr8:
142 case X86::MOVSX32rr8:
143 case X86::MOVZX32rr8:
144 case X86::MOVSX64rr8:
145 SubIdx = X86::sub_8bit;
147 case X86::MOVSX32rr16:
148 case X86::MOVZX32rr16:
149 case X86::MOVSX64rr16:
150 SubIdx = X86::sub_16bit;
152 case X86::MOVSX64rr32:
153 SubIdx = X86::sub_32bit;
163 if (
MI.mayLoad() ||
MI.mayStore())
168 if (
MI.isCopyLike() ||
MI.isInsertSubreg())
171 unsigned Opcode =
MI.getOpcode();
182 if (isBSF(Opcode) || isBSR(Opcode) || isLZCNT(Opcode) || isPOPCNT(Opcode) ||
188 if (isBLCFILL(Opcode) || isBLCI(Opcode) || isBLCIC(Opcode) ||
189 isBLCMSK(Opcode) || isBLCS(Opcode) || isBLSFILL(Opcode) ||
190 isBLSI(Opcode) || isBLSIC(Opcode) || isBLSMSK(Opcode) || isBLSR(Opcode) ||
195 if (isBEXTR(Opcode) || isBZHI(Opcode))
198 if (isROL(Opcode) || isROR(Opcode) || isSAR(Opcode) || isSHL(Opcode) ||
199 isSHR(Opcode) || isSHLD(Opcode) || isSHRD(Opcode))
202 if (isADC(Opcode) || isADD(Opcode) || isAND(Opcode) || isOR(Opcode) ||
203 isSBB(Opcode) || isSUB(Opcode) || isXOR(Opcode))
209 if (isDEC(Opcode) || isINC(Opcode) || isNEG(Opcode))
217 if (isMOVSX(Opcode) || isMOVZX(Opcode) || isMOVSXD(Opcode) || isMOV(Opcode))
220 if (isRORX(Opcode) || isSARX(Opcode) || isSHLX(Opcode) || isSHRX(Opcode))
230 switch (
MI.getOpcode()) {
243 case X86::IMUL64rmi32:
258 case X86::POPCNT16rm:
259 case X86::POPCNT32rm:
260 case X86::POPCNT64rm:
268 case X86::BLCFILL32rm:
269 case X86::BLCFILL64rm:
274 case X86::BLCMSK32rm:
275 case X86::BLCMSK64rm:
278 case X86::BLSFILL32rm:
279 case X86::BLSFILL64rm:
284 case X86::BLSMSK32rm:
285 case X86::BLSMSK64rm:
295 case X86::BEXTRI32mi:
296 case X86::BEXTRI64mi:
349 case X86::CVTTSD2SI64rm:
350 case X86::VCVTTSD2SI64rm:
351 case X86::VCVTTSD2SI64Zrm:
352 case X86::CVTTSD2SIrm:
353 case X86::VCVTTSD2SIrm:
354 case X86::VCVTTSD2SIZrm:
355 case X86::CVTTSS2SI64rm:
356 case X86::VCVTTSS2SI64rm:
357 case X86::VCVTTSS2SI64Zrm:
358 case X86::CVTTSS2SIrm:
359 case X86::VCVTTSS2SIrm:
360 case X86::VCVTTSS2SIZrm:
361 case X86::CVTSI2SDrm:
362 case X86::VCVTSI2SDrm:
363 case X86::VCVTSI2SDZrm:
364 case X86::CVTSI2SSrm:
365 case X86::VCVTSI2SSrm:
366 case X86::VCVTSI2SSZrm:
367 case X86::CVTSI642SDrm:
368 case X86::VCVTSI642SDrm:
369 case X86::VCVTSI642SDZrm:
370 case X86::CVTSI642SSrm:
371 case X86::VCVTSI642SSrm:
372 case X86::VCVTSI642SSZrm:
373 case X86::CVTSS2SDrm:
374 case X86::VCVTSS2SDrm:
375 case X86::VCVTSS2SDZrm:
376 case X86::CVTSD2SSrm:
377 case X86::VCVTSD2SSrm:
378 case X86::VCVTSD2SSZrm:
380 case X86::VCVTTSD2USI64Zrm:
381 case X86::VCVTTSD2USIZrm:
382 case X86::VCVTTSS2USI64Zrm:
383 case X86::VCVTTSS2USIZrm:
384 case X86::VCVTUSI2SDZrm:
385 case X86::VCVTUSI642SDZrm:
386 case X86::VCVTUSI2SSZrm:
387 case X86::VCVTUSI642SSZrm:
391 case X86::MOV8rm_NOREX:
395 case X86::MOVSX16rm8:
396 case X86::MOVSX32rm16:
397 case X86::MOVSX32rm8:
398 case X86::MOVSX32rm8_NOREX:
399 case X86::MOVSX64rm16:
400 case X86::MOVSX64rm32:
401 case X86::MOVSX64rm8:
402 case X86::MOVZX16rm8:
403 case X86::MOVZX32rm16:
404 case X86::MOVZX32rm8:
405 case X86::MOVZX32rm8_NOREX:
406 case X86::MOVZX64rm16:
407 case X86::MOVZX64rm8:
416 if (isFrameInstr(
MI)) {
419 if (!isFrameSetup(
MI))
430 for (
auto E =
MBB->end();
I != E; ++
I) {
431 if (
I->getOpcode() == getCallFrameDestroyOpcode() ||
I->isCall())
437 if (
I->getOpcode() != getCallFrameDestroyOpcode())
440 return -(
I->getOperand(1).
getImm());
445 switch (
MI.getOpcode()) {
464 int &FrameIndex)
const {
484 case X86::KMOVBkm_EVEX:
489 case X86::KMOVWkm_EVEX:
491 case X86::VMOVSHZrm_alt:
496 case X86::MOVSSrm_alt:
498 case X86::VMOVSSrm_alt:
500 case X86::VMOVSSZrm_alt:
502 case X86::KMOVDkm_EVEX:
508 case X86::MOVSDrm_alt:
510 case X86::VMOVSDrm_alt:
512 case X86::VMOVSDZrm_alt:
513 case X86::MMX_MOVD64rm:
514 case X86::MMX_MOVQ64rm:
516 case X86::KMOVQkm_EVEX:
531 case X86::VMOVAPSZ128rm:
532 case X86::VMOVUPSZ128rm:
533 case X86::VMOVAPSZ128rm_NOVLX:
534 case X86::VMOVUPSZ128rm_NOVLX:
535 case X86::VMOVAPDZ128rm:
536 case X86::VMOVUPDZ128rm:
537 case X86::VMOVDQU8Z128rm:
538 case X86::VMOVDQU16Z128rm:
539 case X86::VMOVDQA32Z128rm:
540 case X86::VMOVDQU32Z128rm:
541 case X86::VMOVDQA64Z128rm:
542 case X86::VMOVDQU64Z128rm:
545 case X86::VMOVAPSYrm:
546 case X86::VMOVUPSYrm:
547 case X86::VMOVAPDYrm:
548 case X86::VMOVUPDYrm:
549 case X86::VMOVDQAYrm:
550 case X86::VMOVDQUYrm:
551 case X86::VMOVAPSZ256rm:
552 case X86::VMOVUPSZ256rm:
553 case X86::VMOVAPSZ256rm_NOVLX:
554 case X86::VMOVUPSZ256rm_NOVLX:
555 case X86::VMOVAPDZ256rm:
556 case X86::VMOVUPDZ256rm:
557 case X86::VMOVDQU8Z256rm:
558 case X86::VMOVDQU16Z256rm:
559 case X86::VMOVDQA32Z256rm:
560 case X86::VMOVDQU32Z256rm:
561 case X86::VMOVDQA64Z256rm:
562 case X86::VMOVDQU64Z256rm:
565 case X86::VMOVAPSZrm:
566 case X86::VMOVUPSZrm:
567 case X86::VMOVAPDZrm:
568 case X86::VMOVUPDZrm:
569 case X86::VMOVDQU8Zrm:
570 case X86::VMOVDQU16Zrm:
571 case X86::VMOVDQA32Zrm:
572 case X86::VMOVDQU32Zrm:
573 case X86::VMOVDQA64Zrm:
574 case X86::VMOVDQU64Zrm:
586 case X86::KMOVBmk_EVEX:
591 case X86::KMOVWmk_EVEX:
600 case X86::KMOVDmk_EVEX:
608 case X86::MMX_MOVD64mr:
609 case X86::MMX_MOVQ64mr:
610 case X86::MMX_MOVNTQmr:
612 case X86::KMOVQmk_EVEX:
627 case X86::VMOVUPSZ128mr:
628 case X86::VMOVAPSZ128mr:
629 case X86::VMOVUPSZ128mr_NOVLX:
630 case X86::VMOVAPSZ128mr_NOVLX:
631 case X86::VMOVUPDZ128mr:
632 case X86::VMOVAPDZ128mr:
633 case X86::VMOVDQA32Z128mr:
634 case X86::VMOVDQU32Z128mr:
635 case X86::VMOVDQA64Z128mr:
636 case X86::VMOVDQU64Z128mr:
637 case X86::VMOVDQU8Z128mr:
638 case X86::VMOVDQU16Z128mr:
641 case X86::VMOVUPSYmr:
642 case X86::VMOVAPSYmr:
643 case X86::VMOVUPDYmr:
644 case X86::VMOVAPDYmr:
645 case X86::VMOVDQUYmr:
646 case X86::VMOVDQAYmr:
647 case X86::VMOVUPSZ256mr:
648 case X86::VMOVAPSZ256mr:
649 case X86::VMOVUPSZ256mr_NOVLX:
650 case X86::VMOVAPSZ256mr_NOVLX:
651 case X86::VMOVUPDZ256mr:
652 case X86::VMOVAPDZ256mr:
653 case X86::VMOVDQU8Z256mr:
654 case X86::VMOVDQU16Z256mr:
655 case X86::VMOVDQA32Z256mr:
656 case X86::VMOVDQU32Z256mr:
657 case X86::VMOVDQA64Z256mr:
658 case X86::VMOVDQU64Z256mr:
661 case X86::VMOVUPSZmr:
662 case X86::VMOVAPSZmr:
663 case X86::VMOVUPDZmr:
664 case X86::VMOVAPDZmr:
665 case X86::VMOVDQU8Zmr:
666 case X86::VMOVDQU16Zmr:
667 case X86::VMOVDQA32Zmr:
668 case X86::VMOVDQU32Zmr:
669 case X86::VMOVDQA64Zmr:
670 case X86::VMOVDQU64Zmr:
678 int &FrameIndex)
const {
687 if (
MI.getOperand(0).getSubReg() == 0 && isFrameOperand(
MI, 1, FrameIndex))
688 return MI.getOperand(0).getReg();
693 int &FrameIndex)
const {
704 return MI.getOperand(0).getReg();
711 int &FrameIndex)
const {
721 isFrameOperand(
MI, 0, FrameIndex))
727 int &FrameIndex)
const {
747 if (!BaseReg.isVirtual())
749 bool isPICBase =
false;
751 if (
DefMI.getOpcode() != X86::MOVPC32r)
753 assert(!isPICBase &&
"More than one PIC base?");
761 switch (
MI.getOpcode()) {
767 case X86::IMPLICIT_DEF:
770 case X86::LOAD_STACK_GUARD:
777 case X86::AVX1_SETALLONES:
778 case X86::AVX2_SETALLONES:
779 case X86::AVX512_128_SET0:
780 case X86::AVX512_256_SET0:
781 case X86::AVX512_512_SET0:
782 case X86::AVX512_128_SETALLONES:
783 case X86::AVX512_256_SETALLONES:
784 case X86::AVX512_512_SETALLONES:
785 case X86::AVX512_FsFLD0SD:
786 case X86::AVX512_FsFLD0SH:
787 case X86::AVX512_FsFLD0SS:
788 case X86::AVX512_FsFLD0F128:
793 case X86::FsFLD0F128:
803 case X86::MOV32ImmSExti8:
808 case X86::MOV64ImmSExti8:
810 case X86::V_SETALLONES:
816 case X86::PTILEZEROV:
820 case X86::MOV8rm_NOREX:
825 case X86::MOVSSrm_alt:
827 case X86::MOVSDrm_alt:
835 case X86::VMOVSSrm_alt:
837 case X86::VMOVSDrm_alt:
844 case X86::VMOVAPSYrm:
845 case X86::VMOVUPSYrm:
846 case X86::VMOVAPDYrm:
847 case X86::VMOVUPDYrm:
848 case X86::VMOVDQAYrm:
849 case X86::VMOVDQUYrm:
850 case X86::MMX_MOVD64rm:
851 case X86::MMX_MOVQ64rm:
852 case X86::VBROADCASTSSrm:
853 case X86::VBROADCASTSSYrm:
854 case X86::VBROADCASTSDYrm:
856 case X86::VPBROADCASTBZ128rm:
857 case X86::VPBROADCASTBZ256rm:
858 case X86::VPBROADCASTBZrm:
859 case X86::VBROADCASTF32X2Z256rm:
860 case X86::VBROADCASTF32X2Zrm:
861 case X86::VBROADCASTI32X2Z128rm:
862 case X86::VBROADCASTI32X2Z256rm:
863 case X86::VBROADCASTI32X2Zrm:
864 case X86::VPBROADCASTWZ128rm:
865 case X86::VPBROADCASTWZ256rm:
866 case X86::VPBROADCASTWZrm:
867 case X86::VPBROADCASTDZ128rm:
868 case X86::VPBROADCASTDZ256rm:
869 case X86::VPBROADCASTDZrm:
870 case X86::VBROADCASTSSZ128rm:
871 case X86::VBROADCASTSSZ256rm:
872 case X86::VBROADCASTSSZrm:
873 case X86::VPBROADCASTQZ128rm:
874 case X86::VPBROADCASTQZ256rm:
875 case X86::VPBROADCASTQZrm:
876 case X86::VBROADCASTSDZ256rm:
877 case X86::VBROADCASTSDZrm:
879 case X86::VMOVSSZrm_alt:
881 case X86::VMOVSDZrm_alt:
883 case X86::VMOVSHZrm_alt:
884 case X86::VMOVAPDZ128rm:
885 case X86::VMOVAPDZ256rm:
886 case X86::VMOVAPDZrm:
887 case X86::VMOVAPSZ128rm:
888 case X86::VMOVAPSZ256rm:
889 case X86::VMOVAPSZ128rm_NOVLX:
890 case X86::VMOVAPSZ256rm_NOVLX:
891 case X86::VMOVAPSZrm:
892 case X86::VMOVDQA32Z128rm:
893 case X86::VMOVDQA32Z256rm:
894 case X86::VMOVDQA32Zrm:
895 case X86::VMOVDQA64Z128rm:
896 case X86::VMOVDQA64Z256rm:
897 case X86::VMOVDQA64Zrm:
898 case X86::VMOVDQU16Z128rm:
899 case X86::VMOVDQU16Z256rm:
900 case X86::VMOVDQU16Zrm:
901 case X86::VMOVDQU32Z128rm:
902 case X86::VMOVDQU32Z256rm:
903 case X86::VMOVDQU32Zrm:
904 case X86::VMOVDQU64Z128rm:
905 case X86::VMOVDQU64Z256rm:
906 case X86::VMOVDQU64Zrm:
907 case X86::VMOVDQU8Z128rm:
908 case X86::VMOVDQU8Z256rm:
909 case X86::VMOVDQU8Zrm:
910 case X86::VMOVUPDZ128rm:
911 case X86::VMOVUPDZ256rm:
912 case X86::VMOVUPDZrm:
913 case X86::VMOVUPSZ128rm:
914 case X86::VMOVUPSZ256rm:
915 case X86::VMOVUPSZ128rm_NOVLX:
916 case X86::VMOVUPSZ256rm_NOVLX:
917 case X86::VMOVUPSZrm: {
923 MI.isDereferenceableInvariantLoad()) {
925 if (BaseReg == 0 || BaseReg == X86::RIP)
968 if (ClobbersEFLAGS &&
MBB.computeRegisterLiveness(&
TRI, X86::EFLAGS,
I) !=
1003 if (MO.isReg() && MO.isDef() && MO.getReg() == X86::EFLAGS &&
1013 unsigned ShiftAmtOperandIdx) {
1015 unsigned ShiftCountMask = (
MI.getDesc().TSFlags &
X86II::REX_W) ? 63 : 31;
1016 unsigned Imm =
MI.getOperand(ShiftAmtOperandIdx).getImm();
1017 return Imm & ShiftCountMask;
1028 return ShAmt < 4 && ShAmt > 0;
1035 bool &NoSignFlag,
bool &ClearsOverflowFlag) {
1036 if (!(CmpValDefInstr.
getOpcode() == X86::SUBREG_TO_REG &&
1037 CmpInstr.
getOpcode() == X86::TEST64rr) &&
1038 !(CmpValDefInstr.
getOpcode() == X86::COPY &&
1046 "CmpInstr is an analyzable TEST16rr/TEST64rr, and "
1047 "`X86InstrInfo::analyzeCompare` requires two reg operands are the"
1056 "Caller guarantees that TEST64rr is a user of SUBREG_TO_REG or TEST16rr "
1057 "is a user of COPY sub16bit.");
1059 if (CmpInstr.
getOpcode() == X86::TEST16rr) {
1068 if (!((VregDefInstr->
getOpcode() == X86::AND32ri ||
1069 VregDefInstr->
getOpcode() == X86::AND64ri32) &&
1074 if (CmpInstr.
getOpcode() == X86::TEST64rr) {
1083 assert(VregDefInstr &&
"Must have a definition (SSA)");
1093 if (X86::isAND(VregDefInstr->
getOpcode()) &&
1114 if (Instr.modifiesRegister(X86::EFLAGS,
TRI))
1118 *AndInstr = VregDefInstr;
1139 ClearsOverflowFlag =
true;
1147 unsigned &NewSrcSubReg,
bool &isKill,
1153 RC =
Opc != X86::LEA32r ? &X86::GR64RegClass : &X86::GR32RegClass;
1155 RC =
Opc != X86::LEA32r ? &X86::GR64_NOSPRegClass : &X86::GR32_NOSPRegClass;
1158 unsigned SubReg = Src.getSubReg();
1159 isKill =
MI.killsRegister(SrcReg,
nullptr);
1161 NewSrcSubReg = X86::NoSubRegister;
1165 if (
Opc != X86::LEA64_32r) {
1167 NewSrcSubReg = SubReg;
1168 assert(!Src.isUndef() &&
"Undef op doesn't need optimization");
1183 assert(!SubReg &&
"no superregister for source");
1185 assert(!Src.isUndef() &&
"Undef op doesn't need optimization");
1190 NewSrcSubReg = X86::NoSubRegister;
1216MachineInstr *X86InstrInfo::convertToThreeAddressWithLEA(
unsigned MIOpc,
1220 bool Is8BitOp)
const {
1225 RegInfo.getTargetRegisterInfo()->getRegSizeInBits(
1226 *RegInfo.getRegClass(
MI.getOperand(0).getReg())) == 16) &&
1227 "Unexpected type for LEA transform");
1236 if (!Subtarget.is64Bit())
1239 unsigned Opcode = X86::LEA64_32r;
1240 Register InRegLEA = RegInfo.createVirtualRegister(&X86::GR64_NOSPRegClass);
1241 Register OutRegLEA = RegInfo.createVirtualRegister(&X86::GR32RegClass);
1254 unsigned SrcSubReg =
MI.getOperand(1).getSubReg();
1256 unsigned Src2SubReg;
1257 bool IsDead =
MI.getOperand(0).isDead();
1258 bool IsKill =
MI.getOperand(1).isKill();
1259 unsigned SubReg = Is8BitOp ? X86::sub_8bit : X86::sub_16bit;
1260 assert(!
MI.getOperand(1).isUndef() &&
"Undef op doesn't need optimization");
1272#define CASE_NF(OP) \
1280 unsigned ShAmt =
MI.getOperand(2).getImm();
1298 case X86::ADD8ri_DB:
1299 case X86::ADD16ri_DB:
1304 case X86::ADD8rr_DB:
1305 case X86::ADD16rr_DB: {
1306 Src2 =
MI.getOperand(2).getReg();
1307 Src2SubReg =
MI.getOperand(2).getSubReg();
1308 bool IsKill2 =
MI.getOperand(2).isKill();
1309 assert(!
MI.getOperand(2).isUndef() &&
"Undef op doesn't need optimization");
1313 addRegReg(MIB, InRegLEA,
true, X86::NoSubRegister, InRegLEA,
false,
1314 X86::NoSubRegister);
1316 if (Subtarget.is64Bit())
1322 ImpDef2 =
BuildMI(
MBB, &*MIB,
MI.getDebugLoc(),
get(X86::IMPLICIT_DEF),
1324 InsMI2 =
BuildMI(
MBB, &*MIB,
MI.getDebugLoc(),
get(TargetOpcode::COPY))
1327 addRegReg(MIB, InRegLEA,
true, X86::NoSubRegister, InRegLEA2,
true,
1328 X86::NoSubRegister);
1330 if (LV && IsKill2 && InsMI2)
1336 MachineInstr *NewMI = MIB;
1337 MachineInstr *ExtMI =
1385 LiveRange::Segment *DestSeg =
1426 if (
MI.getNumOperands() > 2)
1427 if (
MI.getOperand(2).isReg() &&
MI.getOperand(2).isUndef())
1432 unsigned SrcSubReg, SrcSubReg2;
1433 bool Is64Bit = Subtarget.is64Bit();
1435 bool Is8BitOp =
false;
1436 unsigned NumRegOperands = 2;
1437 unsigned MIOpc =
MI.getOpcode();
1442 assert(
MI.getNumOperands() >= 3 &&
"Unknown shift instruction!");
1449 Src.getReg(), &X86::GR64_NOSPRegClass))
1452 NewMI =
BuildMI(MF,
MI.getDebugLoc(),
get(X86::LEA64r))
1462 assert(
MI.getNumOperands() >= 3 &&
"Unknown shift instruction!");
1467 unsigned Opc = Is64Bit ? X86::LEA64_32r : X86::LEA32r;
1473 isKill, ImplicitOp, LV, LIS))
1484 if (ImplicitOp.
getReg() != 0)
1485 MIB.
add(ImplicitOp);
1489 if (LV && SrcReg != Src.getReg())
1497 assert(
MI.getNumOperands() >= 3 &&
"Unknown shift instruction!");
1501 return convertToThreeAddressWithLEA(MIOpc,
MI, LV, LIS, Is8BitOp);
1505 assert(
MI.getNumOperands() >= 2 &&
"Unknown inc instruction!");
1506 unsigned Opc = (MIOpc == X86::INC64r || MIOpc == X86::INC64r_NF)
1508 : (Is64Bit ? X86::LEA64_32r : X86::LEA32r);
1512 isKill, ImplicitOp, LV, LIS))
1518 if (ImplicitOp.
getReg() != 0)
1519 MIB.
add(ImplicitOp);
1524 if (LV && SrcReg != Src.getReg())
1530 assert(
MI.getNumOperands() >= 2 &&
"Unknown dec instruction!");
1531 unsigned Opc = (MIOpc == X86::DEC64r || MIOpc == X86::DEC64r_NF)
1533 : (Is64Bit ? X86::LEA64_32r : X86::LEA32r);
1538 isKill, ImplicitOp, LV, LIS))
1544 if (ImplicitOp.
getReg() != 0)
1545 MIB.
add(ImplicitOp);
1550 if (LV && SrcReg != Src.getReg())
1560 return convertToThreeAddressWithLEA(MIOpc,
MI, LV, LIS, Is8BitOp);
1563 case X86::ADD64rr_DB:
1564 case X86::ADD32rr_DB: {
1565 assert(
MI.getNumOperands() >= 3 &&
"Unknown add instruction!");
1567 if (MIOpc == X86::ADD64rr || MIOpc == X86::ADD64rr_NF ||
1568 MIOpc == X86::ADD64rr_DB)
1571 Opc = Is64Bit ? X86::LEA64_32r : X86::LEA32r;
1577 isKill2, ImplicitOp2, LV, LIS))
1582 if (Src.getReg() == Src2.
getReg()) {
1587 SrcSubReg = SrcSubReg2;
1590 isKill, ImplicitOp, LV, LIS))
1595 if (ImplicitOp.
getReg() != 0)
1596 MIB.
add(ImplicitOp);
1597 if (ImplicitOp2.
getReg() != 0)
1598 MIB.
add(ImplicitOp2);
1601 addRegReg(MIB, SrcReg, isKill, SrcSubReg, SrcReg2, isKill2, SrcSubReg2);
1605 if (SrcReg2 != Src2.
getReg())
1607 if (SrcReg != SrcReg2 && SrcReg != Src.getReg())
1614 case X86::ADD8rr_DB:
1618 case X86::ADD16rr_DB:
1619 return convertToThreeAddressWithLEA(MIOpc,
MI, LV, LIS, Is8BitOp);
1621 case X86::ADD64ri32_DB:
1622 assert(
MI.getNumOperands() >= 3 &&
"Unknown add instruction!");
1624 BuildMI(MF,
MI.getDebugLoc(),
get(X86::LEA64r)).add(Dest).add(Src),
1628 case X86::ADD32ri_DB: {
1629 assert(
MI.getNumOperands() >= 3 &&
"Unknown add instruction!");
1630 unsigned Opc = Is64Bit ? X86::LEA64_32r : X86::LEA32r;
1635 isKill, ImplicitOp, LV, LIS))
1642 if (ImplicitOp.
getReg() != 0)
1643 MIB.
add(ImplicitOp);
1648 if (LV && SrcReg != Src.getReg())
1653 case X86::ADD8ri_DB:
1657 case X86::ADD16ri_DB:
1658 return convertToThreeAddressWithLEA(MIOpc,
MI, LV, LIS, Is8BitOp);
1664 if (!
MI.getOperand(2).isImm())
1666 int64_t Imm =
MI.getOperand(2).getImm();
1670 assert(
MI.getNumOperands() >= 3 &&
"Unknown add instruction!");
1671 unsigned Opc = Is64Bit ? X86::LEA64_32r : X86::LEA32r;
1676 isKill, ImplicitOp, LV, LIS))
1683 if (ImplicitOp.
getReg() != 0)
1684 MIB.
add(ImplicitOp);
1689 if (LV && SrcReg != Src.getReg())
1695 if (!
MI.getOperand(2).isImm())
1697 int64_t Imm =
MI.getOperand(2).getImm();
1701 assert(
MI.getNumOperands() >= 3 &&
"Unknown sub instruction!");
1709 case X86::VMOVDQU8Z128rmk:
1710 case X86::VMOVDQU8Z256rmk:
1711 case X86::VMOVDQU8Zrmk:
1712 case X86::VMOVDQU16Z128rmk:
1713 case X86::VMOVDQU16Z256rmk:
1714 case X86::VMOVDQU16Zrmk:
1715 case X86::VMOVDQU32Z128rmk:
1716 case X86::VMOVDQA32Z128rmk:
1717 case X86::VMOVDQU32Z256rmk:
1718 case X86::VMOVDQA32Z256rmk:
1719 case X86::VMOVDQU32Zrmk:
1720 case X86::VMOVDQA32Zrmk:
1721 case X86::VMOVDQU64Z128rmk:
1722 case X86::VMOVDQA64Z128rmk:
1723 case X86::VMOVDQU64Z256rmk:
1724 case X86::VMOVDQA64Z256rmk:
1725 case X86::VMOVDQU64Zrmk:
1726 case X86::VMOVDQA64Zrmk:
1727 case X86::VMOVUPDZ128rmk:
1728 case X86::VMOVAPDZ128rmk:
1729 case X86::VMOVUPDZ256rmk:
1730 case X86::VMOVAPDZ256rmk:
1731 case X86::VMOVUPDZrmk:
1732 case X86::VMOVAPDZrmk:
1733 case X86::VMOVUPSZ128rmk:
1734 case X86::VMOVAPSZ128rmk:
1735 case X86::VMOVUPSZ256rmk:
1736 case X86::VMOVAPSZ256rmk:
1737 case X86::VMOVUPSZrmk:
1738 case X86::VMOVAPSZrmk:
1739 case X86::VBROADCASTSDZ256rmk:
1740 case X86::VBROADCASTSDZrmk:
1741 case X86::VBROADCASTSSZ128rmk:
1742 case X86::VBROADCASTSSZ256rmk:
1743 case X86::VBROADCASTSSZrmk:
1744 case X86::VPBROADCASTDZ128rmk:
1745 case X86::VPBROADCASTDZ256rmk:
1746 case X86::VPBROADCASTDZrmk:
1747 case X86::VPBROADCASTQZ128rmk:
1748 case X86::VPBROADCASTQZ256rmk:
1749 case X86::VPBROADCASTQZrmk: {
1754 case X86::VMOVDQU8Z128rmk:
1755 Opc = X86::VPBLENDMBZ128rmk;
1757 case X86::VMOVDQU8Z256rmk:
1758 Opc = X86::VPBLENDMBZ256rmk;
1760 case X86::VMOVDQU8Zrmk:
1761 Opc = X86::VPBLENDMBZrmk;
1763 case X86::VMOVDQU16Z128rmk:
1764 Opc = X86::VPBLENDMWZ128rmk;
1766 case X86::VMOVDQU16Z256rmk:
1767 Opc = X86::VPBLENDMWZ256rmk;
1769 case X86::VMOVDQU16Zrmk:
1770 Opc = X86::VPBLENDMWZrmk;
1772 case X86::VMOVDQU32Z128rmk:
1773 Opc = X86::VPBLENDMDZ128rmk;
1775 case X86::VMOVDQU32Z256rmk:
1776 Opc = X86::VPBLENDMDZ256rmk;
1778 case X86::VMOVDQU32Zrmk:
1779 Opc = X86::VPBLENDMDZrmk;
1781 case X86::VMOVDQU64Z128rmk:
1782 Opc = X86::VPBLENDMQZ128rmk;
1784 case X86::VMOVDQU64Z256rmk:
1785 Opc = X86::VPBLENDMQZ256rmk;
1787 case X86::VMOVDQU64Zrmk:
1788 Opc = X86::VPBLENDMQZrmk;
1790 case X86::VMOVUPDZ128rmk:
1791 Opc = X86::VBLENDMPDZ128rmk;
1793 case X86::VMOVUPDZ256rmk:
1794 Opc = X86::VBLENDMPDZ256rmk;
1796 case X86::VMOVUPDZrmk:
1797 Opc = X86::VBLENDMPDZrmk;
1799 case X86::VMOVUPSZ128rmk:
1800 Opc = X86::VBLENDMPSZ128rmk;
1802 case X86::VMOVUPSZ256rmk:
1803 Opc = X86::VBLENDMPSZ256rmk;
1805 case X86::VMOVUPSZrmk:
1806 Opc = X86::VBLENDMPSZrmk;
1808 case X86::VMOVDQA32Z128rmk:
1809 Opc = X86::VPBLENDMDZ128rmk;
1811 case X86::VMOVDQA32Z256rmk:
1812 Opc = X86::VPBLENDMDZ256rmk;
1814 case X86::VMOVDQA32Zrmk:
1815 Opc = X86::VPBLENDMDZrmk;
1817 case X86::VMOVDQA64Z128rmk:
1818 Opc = X86::VPBLENDMQZ128rmk;
1820 case X86::VMOVDQA64Z256rmk:
1821 Opc = X86::VPBLENDMQZ256rmk;
1823 case X86::VMOVDQA64Zrmk:
1824 Opc = X86::VPBLENDMQZrmk;
1826 case X86::VMOVAPDZ128rmk:
1827 Opc = X86::VBLENDMPDZ128rmk;
1829 case X86::VMOVAPDZ256rmk:
1830 Opc = X86::VBLENDMPDZ256rmk;
1832 case X86::VMOVAPDZrmk:
1833 Opc = X86::VBLENDMPDZrmk;
1835 case X86::VMOVAPSZ128rmk:
1836 Opc = X86::VBLENDMPSZ128rmk;
1838 case X86::VMOVAPSZ256rmk:
1839 Opc = X86::VBLENDMPSZ256rmk;
1841 case X86::VMOVAPSZrmk:
1842 Opc = X86::VBLENDMPSZrmk;
1844 case X86::VBROADCASTSDZ256rmk:
1845 Opc = X86::VBLENDMPDZ256rmbk;
1847 case X86::VBROADCASTSDZrmk:
1848 Opc = X86::VBLENDMPDZrmbk;
1850 case X86::VBROADCASTSSZ128rmk:
1851 Opc = X86::VBLENDMPSZ128rmbk;
1853 case X86::VBROADCASTSSZ256rmk:
1854 Opc = X86::VBLENDMPSZ256rmbk;
1856 case X86::VBROADCASTSSZrmk:
1857 Opc = X86::VBLENDMPSZrmbk;
1859 case X86::VPBROADCASTDZ128rmk:
1860 Opc = X86::VPBLENDMDZ128rmbk;
1862 case X86::VPBROADCASTDZ256rmk:
1863 Opc = X86::VPBLENDMDZ256rmbk;
1865 case X86::VPBROADCASTDZrmk:
1866 Opc = X86::VPBLENDMDZrmbk;
1868 case X86::VPBROADCASTQZ128rmk:
1869 Opc = X86::VPBLENDMQZ128rmbk;
1871 case X86::VPBROADCASTQZ256rmk:
1872 Opc = X86::VPBLENDMQZ256rmbk;
1874 case X86::VPBROADCASTQZrmk:
1875 Opc = X86::VPBLENDMQZrmbk;
1881 .
add(
MI.getOperand(2))
1883 .
add(
MI.getOperand(3))
1884 .
add(
MI.getOperand(4))
1885 .
add(
MI.getOperand(5))
1886 .
add(
MI.getOperand(6))
1887 .
add(
MI.getOperand(7));
1892 case X86::VMOVDQU8Z128rrk:
1893 case X86::VMOVDQU8Z256rrk:
1894 case X86::VMOVDQU8Zrrk:
1895 case X86::VMOVDQU16Z128rrk:
1896 case X86::VMOVDQU16Z256rrk:
1897 case X86::VMOVDQU16Zrrk:
1898 case X86::VMOVDQU32Z128rrk:
1899 case X86::VMOVDQA32Z128rrk:
1900 case X86::VMOVDQU32Z256rrk:
1901 case X86::VMOVDQA32Z256rrk:
1902 case X86::VMOVDQU32Zrrk:
1903 case X86::VMOVDQA32Zrrk:
1904 case X86::VMOVDQU64Z128rrk:
1905 case X86::VMOVDQA64Z128rrk:
1906 case X86::VMOVDQU64Z256rrk:
1907 case X86::VMOVDQA64Z256rrk:
1908 case X86::VMOVDQU64Zrrk:
1909 case X86::VMOVDQA64Zrrk:
1910 case X86::VMOVUPDZ128rrk:
1911 case X86::VMOVAPDZ128rrk:
1912 case X86::VMOVUPDZ256rrk:
1913 case X86::VMOVAPDZ256rrk:
1914 case X86::VMOVUPDZrrk:
1915 case X86::VMOVAPDZrrk:
1916 case X86::VMOVUPSZ128rrk:
1917 case X86::VMOVAPSZ128rrk:
1918 case X86::VMOVUPSZ256rrk:
1919 case X86::VMOVAPSZ256rrk:
1920 case X86::VMOVUPSZrrk:
1921 case X86::VMOVAPSZrrk: {
1926 case X86::VMOVDQU8Z128rrk:
1927 Opc = X86::VPBLENDMBZ128rrk;
1929 case X86::VMOVDQU8Z256rrk:
1930 Opc = X86::VPBLENDMBZ256rrk;
1932 case X86::VMOVDQU8Zrrk:
1933 Opc = X86::VPBLENDMBZrrk;
1935 case X86::VMOVDQU16Z128rrk:
1936 Opc = X86::VPBLENDMWZ128rrk;
1938 case X86::VMOVDQU16Z256rrk:
1939 Opc = X86::VPBLENDMWZ256rrk;
1941 case X86::VMOVDQU16Zrrk:
1942 Opc = X86::VPBLENDMWZrrk;
1944 case X86::VMOVDQU32Z128rrk:
1945 Opc = X86::VPBLENDMDZ128rrk;
1947 case X86::VMOVDQU32Z256rrk:
1948 Opc = X86::VPBLENDMDZ256rrk;
1950 case X86::VMOVDQU32Zrrk:
1951 Opc = X86::VPBLENDMDZrrk;
1953 case X86::VMOVDQU64Z128rrk:
1954 Opc = X86::VPBLENDMQZ128rrk;
1956 case X86::VMOVDQU64Z256rrk:
1957 Opc = X86::VPBLENDMQZ256rrk;
1959 case X86::VMOVDQU64Zrrk:
1960 Opc = X86::VPBLENDMQZrrk;
1962 case X86::VMOVUPDZ128rrk:
1963 Opc = X86::VBLENDMPDZ128rrk;
1965 case X86::VMOVUPDZ256rrk:
1966 Opc = X86::VBLENDMPDZ256rrk;
1968 case X86::VMOVUPDZrrk:
1969 Opc = X86::VBLENDMPDZrrk;
1971 case X86::VMOVUPSZ128rrk:
1972 Opc = X86::VBLENDMPSZ128rrk;
1974 case X86::VMOVUPSZ256rrk:
1975 Opc = X86::VBLENDMPSZ256rrk;
1977 case X86::VMOVUPSZrrk:
1978 Opc = X86::VBLENDMPSZrrk;
1980 case X86::VMOVDQA32Z128rrk:
1981 Opc = X86::VPBLENDMDZ128rrk;
1983 case X86::VMOVDQA32Z256rrk:
1984 Opc = X86::VPBLENDMDZ256rrk;
1986 case X86::VMOVDQA32Zrrk:
1987 Opc = X86::VPBLENDMDZrrk;
1989 case X86::VMOVDQA64Z128rrk:
1990 Opc = X86::VPBLENDMQZ128rrk;
1992 case X86::VMOVDQA64Z256rrk:
1993 Opc = X86::VPBLENDMQZ256rrk;
1995 case X86::VMOVDQA64Zrrk:
1996 Opc = X86::VPBLENDMQZrrk;
1998 case X86::VMOVAPDZ128rrk:
1999 Opc = X86::VBLENDMPDZ128rrk;
2001 case X86::VMOVAPDZ256rrk:
2002 Opc = X86::VBLENDMPDZ256rrk;
2004 case X86::VMOVAPDZrrk:
2005 Opc = X86::VBLENDMPDZrrk;
2007 case X86::VMOVAPSZ128rrk:
2008 Opc = X86::VBLENDMPSZ128rrk;
2010 case X86::VMOVAPSZ256rrk:
2011 Opc = X86::VBLENDMPSZ256rrk;
2013 case X86::VMOVAPSZrrk:
2014 Opc = X86::VBLENDMPSZrrk;
2020 .
add(
MI.getOperand(2))
2022 .
add(
MI.getOperand(3));
2033 for (
unsigned I = 0;
I < NumRegOperands; ++
I) {
2035 if (
Op.isReg() && (
Op.isDead() ||
Op.isKill()))
2041 MBB.insert(
MI.getIterator(), NewMI);
2062 unsigned SrcOpIdx2) {
2064 if (SrcOpIdx1 > SrcOpIdx2)
2067 unsigned Op1 = 1, Op2 = 2, Op3 = 3;
2073 if (SrcOpIdx1 == Op1 && SrcOpIdx2 == Op2)
2075 if (SrcOpIdx1 == Op1 && SrcOpIdx2 == Op3)
2077 if (SrcOpIdx1 == Op2 && SrcOpIdx2 == Op3)
2086 unsigned Opc =
MI.getOpcode();
2095 "Intrinsic instructions can't commute operand 1");
2100 assert(Case < 3 &&
"Unexpected case number!");
2105 const unsigned Form132Index = 0;
2106 const unsigned Form213Index = 1;
2107 const unsigned Form231Index = 2;
2108 static const unsigned FormMapping[][3] = {
2113 {Form231Index, Form213Index, Form132Index},
2118 {Form132Index, Form231Index, Form213Index},
2123 {Form213Index, Form132Index, Form231Index}};
2125 unsigned FMAForms[3];
2131 for (
unsigned FormIndex = 0; FormIndex < 3; FormIndex++)
2132 if (
Opc == FMAForms[FormIndex])
2133 return FMAForms[FormMapping[Case][FormIndex]];
2139 unsigned SrcOpIdx2) {
2143 assert(Case < 3 &&
"Unexpected case value!");
2146 static const uint8_t SwapMasks[3][4] = {
2147 {0x04, 0x10, 0x08, 0x20},
2148 {0x02, 0x10, 0x08, 0x40},
2149 {0x02, 0x04, 0x20, 0x40},
2152 uint8_t Imm =
MI.getOperand(
MI.getNumOperands() - 1).getImm();
2154 uint8_t NewImm = Imm & ~(SwapMasks[Case][0] | SwapMasks[Case][1] |
2155 SwapMasks[Case][2] | SwapMasks[Case][3]);
2157 if (Imm & SwapMasks[Case][0])
2158 NewImm |= SwapMasks[Case][1];
2159 if (Imm & SwapMasks[Case][1])
2160 NewImm |= SwapMasks[Case][0];
2161 if (Imm & SwapMasks[Case][2])
2162 NewImm |= SwapMasks[Case][3];
2163 if (Imm & SwapMasks[Case][3])
2164 NewImm |= SwapMasks[Case][2];
2165 MI.getOperand(
MI.getNumOperands() - 1).setImm(NewImm);
2171#define VPERM_CASES(Suffix) \
2172 case X86::VPERMI2##Suffix##Z128rr: \
2173 case X86::VPERMT2##Suffix##Z128rr: \
2174 case X86::VPERMI2##Suffix##Z256rr: \
2175 case X86::VPERMT2##Suffix##Z256rr: \
2176 case X86::VPERMI2##Suffix##Zrr: \
2177 case X86::VPERMT2##Suffix##Zrr: \
2178 case X86::VPERMI2##Suffix##Z128rm: \
2179 case X86::VPERMT2##Suffix##Z128rm: \
2180 case X86::VPERMI2##Suffix##Z256rm: \
2181 case X86::VPERMT2##Suffix##Z256rm: \
2182 case X86::VPERMI2##Suffix##Zrm: \
2183 case X86::VPERMT2##Suffix##Zrm: \
2184 case X86::VPERMI2##Suffix##Z128rrkz: \
2185 case X86::VPERMT2##Suffix##Z128rrkz: \
2186 case X86::VPERMI2##Suffix##Z256rrkz: \
2187 case X86::VPERMT2##Suffix##Z256rrkz: \
2188 case X86::VPERMI2##Suffix##Zrrkz: \
2189 case X86::VPERMT2##Suffix##Zrrkz: \
2190 case X86::VPERMI2##Suffix##Z128rmkz: \
2191 case X86::VPERMT2##Suffix##Z128rmkz: \
2192 case X86::VPERMI2##Suffix##Z256rmkz: \
2193 case X86::VPERMT2##Suffix##Z256rmkz: \
2194 case X86::VPERMI2##Suffix##Zrmkz: \
2195 case X86::VPERMT2##Suffix##Zrmkz:
2197#define VPERM_CASES_BROADCAST(Suffix) \
2198 VPERM_CASES(Suffix) \
2199 case X86::VPERMI2##Suffix##Z128rmb: \
2200 case X86::VPERMT2##Suffix##Z128rmb: \
2201 case X86::VPERMI2##Suffix##Z256rmb: \
2202 case X86::VPERMT2##Suffix##Z256rmb: \
2203 case X86::VPERMI2##Suffix##Zrmb: \
2204 case X86::VPERMT2##Suffix##Zrmb: \
2205 case X86::VPERMI2##Suffix##Z128rmbkz: \
2206 case X86::VPERMT2##Suffix##Z128rmbkz: \
2207 case X86::VPERMI2##Suffix##Z256rmbkz: \
2208 case X86::VPERMT2##Suffix##Z256rmbkz: \
2209 case X86::VPERMI2##Suffix##Zrmbkz: \
2210 case X86::VPERMT2##Suffix##Zrmbkz:
2223#undef VPERM_CASES_BROADCAST
2230#define VPERM_CASES(Orig, New) \
2231 case X86::Orig##Z128rr: \
2232 return X86::New##Z128rr; \
2233 case X86::Orig##Z128rrkz: \
2234 return X86::New##Z128rrkz; \
2235 case X86::Orig##Z128rm: \
2236 return X86::New##Z128rm; \
2237 case X86::Orig##Z128rmkz: \
2238 return X86::New##Z128rmkz; \
2239 case X86::Orig##Z256rr: \
2240 return X86::New##Z256rr; \
2241 case X86::Orig##Z256rrkz: \
2242 return X86::New##Z256rrkz; \
2243 case X86::Orig##Z256rm: \
2244 return X86::New##Z256rm; \
2245 case X86::Orig##Z256rmkz: \
2246 return X86::New##Z256rmkz; \
2247 case X86::Orig##Zrr: \
2248 return X86::New##Zrr; \
2249 case X86::Orig##Zrrkz: \
2250 return X86::New##Zrrkz; \
2251 case X86::Orig##Zrm: \
2252 return X86::New##Zrm; \
2253 case X86::Orig##Zrmkz: \
2254 return X86::New##Zrmkz;
2256#define VPERM_CASES_BROADCAST(Orig, New) \
2257 VPERM_CASES(Orig, New) \
2258 case X86::Orig##Z128rmb: \
2259 return X86::New##Z128rmb; \
2260 case X86::Orig##Z128rmbkz: \
2261 return X86::New##Z128rmbkz; \
2262 case X86::Orig##Z256rmb: \
2263 return X86::New##Z256rmb; \
2264 case X86::Orig##Z256rmbkz: \
2265 return X86::New##Z256rmbkz; \
2266 case X86::Orig##Zrmb: \
2267 return X86::New##Zrmb; \
2268 case X86::Orig##Zrmbkz: \
2269 return X86::New##Zrmbkz;
2287#undef VPERM_CASES_BROADCAST
2293 unsigned OpIdx2)
const {
2295 return std::exchange(NewMI,
false)
2296 ?
MI.getParent()->getParent()->CloneMachineInstr(&
MI)
2300 unsigned Opc =
MI.getOpcode();
2302#define CASE_ND(OP) \
2318#define FROM_TO_SIZE(A, B, S) \
2324 Opc = X86::B##_ND; \
2332 Opc = X86::A##_ND; \
2341 WorkingMI = CloneIfNew(
MI);
2350 WorkingMI = CloneIfNew(
MI);
2352 get(X86::PFSUBRrr ==
Opc ? X86::PFSUBrr : X86::PFSUBRrr));
2354 case X86::BLENDPDrri:
2355 case X86::BLENDPSrri:
2356 case X86::PBLENDWrri:
2357 case X86::VBLENDPDrri:
2358 case X86::VBLENDPSrri:
2359 case X86::VBLENDPDYrri:
2360 case X86::VBLENDPSYrri:
2361 case X86::VPBLENDDrri:
2362 case X86::VPBLENDWrri:
2363 case X86::VPBLENDDYrri:
2364 case X86::VPBLENDWYrri: {
2369 case X86::BLENDPDrri:
2370 Mask = (int8_t)0x03;
2372 case X86::BLENDPSrri:
2373 Mask = (int8_t)0x0F;
2375 case X86::PBLENDWrri:
2376 Mask = (int8_t)0xFF;
2378 case X86::VBLENDPDrri:
2379 Mask = (int8_t)0x03;
2381 case X86::VBLENDPSrri:
2382 Mask = (int8_t)0x0F;
2384 case X86::VBLENDPDYrri:
2385 Mask = (int8_t)0x0F;
2387 case X86::VBLENDPSYrri:
2388 Mask = (int8_t)0xFF;
2390 case X86::VPBLENDDrri:
2391 Mask = (int8_t)0x0F;
2393 case X86::VPBLENDWrri:
2394 Mask = (int8_t)0xFF;
2396 case X86::VPBLENDDYrri:
2397 Mask = (int8_t)0xFF;
2399 case X86::VPBLENDWYrri:
2400 Mask = (int8_t)0xFF;
2406 int8_t Imm =
MI.getOperand(3).getImm() & Mask;
2407 WorkingMI = CloneIfNew(
MI);
2411 case X86::INSERTPSrri:
2412 case X86::VINSERTPSrri:
2413 case X86::VINSERTPSZrri: {
2414 unsigned Imm =
MI.getOperand(
MI.getNumOperands() - 1).getImm();
2415 unsigned ZMask = Imm & 15;
2416 unsigned DstIdx = (Imm >> 4) & 3;
2417 unsigned SrcIdx = (Imm >> 6) & 3;
2421 if (DstIdx == SrcIdx && (ZMask & (1 << DstIdx)) == 0 &&
2424 assert(AltIdx < 4 &&
"Illegal insertion index");
2425 unsigned AltImm = (AltIdx << 6) | (AltIdx << 4) | ZMask;
2426 WorkingMI = CloneIfNew(
MI);
2435 case X86::VMOVSSrr: {
2437 if (Subtarget.hasSSE41()) {
2443 Opc = X86::BLENDPDrri;
2447 Opc = X86::BLENDPSrri;
2451 Opc = X86::VBLENDPDrri;
2455 Opc = X86::VBLENDPSrri;
2460 WorkingMI = CloneIfNew(
MI);
2466 assert(
Opc == X86::MOVSDrr &&
"Only MOVSD can commute to SHUFPD");
2467 WorkingMI = CloneIfNew(
MI);
2472 case X86::SHUFPDrri: {
2474 assert(
MI.getOperand(3).getImm() == 0x02 &&
"Unexpected immediate!");
2475 WorkingMI = CloneIfNew(
MI);
2480 case X86::PCLMULQDQrri:
2481 case X86::VPCLMULQDQrri:
2482 case X86::VPCLMULQDQYrri:
2483 case X86::VPCLMULQDQZrri:
2484 case X86::VPCLMULQDQZ128rri:
2485 case X86::VPCLMULQDQZ256rri: {
2488 unsigned Imm =
MI.getOperand(3).getImm();
2489 unsigned Src1Hi = Imm & 0x01;
2490 unsigned Src2Hi = Imm & 0x10;
2491 WorkingMI = CloneIfNew(
MI);
2495 case X86::VPCMPBZ128rri:
2496 case X86::VPCMPUBZ128rri:
2497 case X86::VPCMPBZ256rri:
2498 case X86::VPCMPUBZ256rri:
2499 case X86::VPCMPBZrri:
2500 case X86::VPCMPUBZrri:
2501 case X86::VPCMPDZ128rri:
2502 case X86::VPCMPUDZ128rri:
2503 case X86::VPCMPDZ256rri:
2504 case X86::VPCMPUDZ256rri:
2505 case X86::VPCMPDZrri:
2506 case X86::VPCMPUDZrri:
2507 case X86::VPCMPQZ128rri:
2508 case X86::VPCMPUQZ128rri:
2509 case X86::VPCMPQZ256rri:
2510 case X86::VPCMPUQZ256rri:
2511 case X86::VPCMPQZrri:
2512 case X86::VPCMPUQZrri:
2513 case X86::VPCMPWZ128rri:
2514 case X86::VPCMPUWZ128rri:
2515 case X86::VPCMPWZ256rri:
2516 case X86::VPCMPUWZ256rri:
2517 case X86::VPCMPWZrri:
2518 case X86::VPCMPUWZrri:
2519 case X86::VPCMPBZ128rrik:
2520 case X86::VPCMPUBZ128rrik:
2521 case X86::VPCMPBZ256rrik:
2522 case X86::VPCMPUBZ256rrik:
2523 case X86::VPCMPBZrrik:
2524 case X86::VPCMPUBZrrik:
2525 case X86::VPCMPDZ128rrik:
2526 case X86::VPCMPUDZ128rrik:
2527 case X86::VPCMPDZ256rrik:
2528 case X86::VPCMPUDZ256rrik:
2529 case X86::VPCMPDZrrik:
2530 case X86::VPCMPUDZrrik:
2531 case X86::VPCMPQZ128rrik:
2532 case X86::VPCMPUQZ128rrik:
2533 case X86::VPCMPQZ256rrik:
2534 case X86::VPCMPUQZ256rrik:
2535 case X86::VPCMPQZrrik:
2536 case X86::VPCMPUQZrrik:
2537 case X86::VPCMPWZ128rrik:
2538 case X86::VPCMPUWZ128rrik:
2539 case X86::VPCMPWZ256rrik:
2540 case X86::VPCMPUWZ256rrik:
2541 case X86::VPCMPWZrrik:
2542 case X86::VPCMPUWZrrik:
2543 WorkingMI = CloneIfNew(
MI);
2547 MI.getOperand(
MI.getNumOperands() - 1).getImm() & 0x7));
2550 case X86::VPCOMUBri:
2552 case X86::VPCOMUDri:
2554 case X86::VPCOMUQri:
2556 case X86::VPCOMUWri:
2557 WorkingMI = CloneIfNew(
MI);
2562 case X86::VCMPSDZrri:
2563 case X86::VCMPSSZrri:
2564 case X86::VCMPPDZrri:
2565 case X86::VCMPPSZrri:
2566 case X86::VCMPSHZrri:
2567 case X86::VCMPPHZrri:
2568 case X86::VCMPPHZ128rri:
2569 case X86::VCMPPHZ256rri:
2570 case X86::VCMPPDZ128rri:
2571 case X86::VCMPPSZ128rri:
2572 case X86::VCMPPDZ256rri:
2573 case X86::VCMPPSZ256rri:
2574 case X86::VCMPPDZrrik:
2575 case X86::VCMPPSZrrik:
2576 case X86::VCMPPHZrrik:
2577 case X86::VCMPPDZ128rrik:
2578 case X86::VCMPPSZ128rrik:
2579 case X86::VCMPPHZ128rrik:
2580 case X86::VCMPPDZ256rrik:
2581 case X86::VCMPPSZ256rrik:
2582 case X86::VCMPPHZ256rrik:
2583 WorkingMI = CloneIfNew(
MI);
2586 MI.getOperand(
MI.getNumExplicitOperands() - 1).getImm() & 0x1f));
2588 case X86::VPERM2F128rri:
2589 case X86::VPERM2I128rri:
2593 WorkingMI = CloneIfNew(
MI);
2596 case X86::MOVHLPSrr:
2597 case X86::UNPCKHPDrr:
2598 case X86::VMOVHLPSrr:
2599 case X86::VUNPCKHPDrr:
2600 case X86::VMOVHLPSZrr:
2601 case X86::VUNPCKHPDZ128rr:
2602 assert(Subtarget.hasSSE2() &&
"Commuting MOVHLP/UNPCKHPD requires SSE2!");
2607 case X86::MOVHLPSrr:
2608 Opc = X86::UNPCKHPDrr;
2610 case X86::UNPCKHPDrr:
2611 Opc = X86::MOVHLPSrr;
2613 case X86::VMOVHLPSrr:
2614 Opc = X86::VUNPCKHPDrr;
2616 case X86::VUNPCKHPDrr:
2617 Opc = X86::VMOVHLPSrr;
2619 case X86::VMOVHLPSZrr:
2620 Opc = X86::VUNPCKHPDZ128rr;
2622 case X86::VUNPCKHPDZ128rr:
2623 Opc = X86::VMOVHLPSZrr;
2626 WorkingMI = CloneIfNew(
MI);
2632 WorkingMI = CloneIfNew(
MI);
2633 unsigned OpNo =
MI.getDesc().getNumOperands() - 1;
2638 case X86::VPTERNLOGDZrri:
2639 case X86::VPTERNLOGDZrmi:
2640 case X86::VPTERNLOGDZ128rri:
2641 case X86::VPTERNLOGDZ128rmi:
2642 case X86::VPTERNLOGDZ256rri:
2643 case X86::VPTERNLOGDZ256rmi:
2644 case X86::VPTERNLOGQZrri:
2645 case X86::VPTERNLOGQZrmi:
2646 case X86::VPTERNLOGQZ128rri:
2647 case X86::VPTERNLOGQZ128rmi:
2648 case X86::VPTERNLOGQZ256rri:
2649 case X86::VPTERNLOGQZ256rmi:
2650 case X86::VPTERNLOGDZrrik:
2651 case X86::VPTERNLOGDZ128rrik:
2652 case X86::VPTERNLOGDZ256rrik:
2653 case X86::VPTERNLOGQZrrik:
2654 case X86::VPTERNLOGQZ128rrik:
2655 case X86::VPTERNLOGQZ256rrik:
2656 case X86::VPTERNLOGDZrrikz:
2657 case X86::VPTERNLOGDZrmikz:
2658 case X86::VPTERNLOGDZ128rrikz:
2659 case X86::VPTERNLOGDZ128rmikz:
2660 case X86::VPTERNLOGDZ256rrikz:
2661 case X86::VPTERNLOGDZ256rmikz:
2662 case X86::VPTERNLOGQZrrikz:
2663 case X86::VPTERNLOGQZrmikz:
2664 case X86::VPTERNLOGQZ128rrikz:
2665 case X86::VPTERNLOGQZ128rmikz:
2666 case X86::VPTERNLOGQZ256rrikz:
2667 case X86::VPTERNLOGQZ256rmikz:
2668 case X86::VPTERNLOGDZ128rmbi:
2669 case X86::VPTERNLOGDZ256rmbi:
2670 case X86::VPTERNLOGDZrmbi:
2671 case X86::VPTERNLOGQZ128rmbi:
2672 case X86::VPTERNLOGQZ256rmbi:
2673 case X86::VPTERNLOGQZrmbi:
2674 case X86::VPTERNLOGDZ128rmbikz:
2675 case X86::VPTERNLOGDZ256rmbikz:
2676 case X86::VPTERNLOGDZrmbikz:
2677 case X86::VPTERNLOGQZ128rmbikz:
2678 case X86::VPTERNLOGQZ256rmbikz:
2679 case X86::VPTERNLOGQZrmbikz: {
2680 WorkingMI = CloneIfNew(
MI);
2686 WorkingMI = CloneIfNew(
MI);
2692 WorkingMI = CloneIfNew(
MI);
2701bool X86InstrInfo::findThreeSrcCommutedOpIndices(
const MachineInstr &
MI,
2702 unsigned &SrcOpIdx1,
2703 unsigned &SrcOpIdx2,
2704 bool IsIntrinsic)
const {
2707 unsigned FirstCommutableVecOp = 1;
2708 unsigned LastCommutableVecOp = 3;
2709 unsigned KMaskOp = -1U;
2732 FirstCommutableVecOp = 3;
2734 LastCommutableVecOp++;
2735 }
else if (IsIntrinsic) {
2738 FirstCommutableVecOp = 2;
2741 if (
isMem(
MI, LastCommutableVecOp))
2742 LastCommutableVecOp--;
2747 if (SrcOpIdx1 != CommuteAnyOperandIndex &&
2748 (SrcOpIdx1 < FirstCommutableVecOp || SrcOpIdx1 > LastCommutableVecOp ||
2749 SrcOpIdx1 == KMaskOp))
2751 if (SrcOpIdx2 != CommuteAnyOperandIndex &&
2752 (SrcOpIdx2 < FirstCommutableVecOp || SrcOpIdx2 > LastCommutableVecOp ||
2753 SrcOpIdx2 == KMaskOp))
2758 if (SrcOpIdx1 == CommuteAnyOperandIndex ||
2759 SrcOpIdx2 == CommuteAnyOperandIndex) {
2760 unsigned CommutableOpIdx2 = SrcOpIdx2;
2764 if (SrcOpIdx1 == SrcOpIdx2)
2767 CommutableOpIdx2 = LastCommutableVecOp;
2768 else if (SrcOpIdx2 == CommuteAnyOperandIndex)
2770 CommutableOpIdx2 = SrcOpIdx1;
2774 Register Op2Reg =
MI.getOperand(CommutableOpIdx2).getReg();
2776 unsigned CommutableOpIdx1;
2777 for (CommutableOpIdx1 = LastCommutableVecOp;
2778 CommutableOpIdx1 >= FirstCommutableVecOp; CommutableOpIdx1--) {
2780 if (CommutableOpIdx1 == KMaskOp)
2786 if (Op2Reg !=
MI.getOperand(CommutableOpIdx1).getReg())
2791 if (CommutableOpIdx1 < FirstCommutableVecOp)
2796 if (!fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, CommutableOpIdx1,
2805 unsigned &SrcOpIdx1,
2806 unsigned &SrcOpIdx2)
const {
2808 if (!
Desc.isCommutable())
2811 switch (
MI.getOpcode()) {
2816 case X86::VCMPSDrri:
2817 case X86::VCMPSSrri:
2818 case X86::VCMPPDrri:
2819 case X86::VCMPPSrri:
2820 case X86::VCMPPDYrri:
2821 case X86::VCMPPSYrri:
2822 case X86::VCMPSDZrri:
2823 case X86::VCMPSSZrri:
2824 case X86::VCMPPDZrri:
2825 case X86::VCMPPSZrri:
2826 case X86::VCMPSHZrri:
2827 case X86::VCMPPHZrri:
2828 case X86::VCMPPHZ128rri:
2829 case X86::VCMPPHZ256rri:
2830 case X86::VCMPPDZ128rri:
2831 case X86::VCMPPSZ128rri:
2832 case X86::VCMPPDZ256rri:
2833 case X86::VCMPPSZ256rri:
2834 case X86::VCMPPDZrrik:
2835 case X86::VCMPPSZrrik:
2836 case X86::VCMPPHZrrik:
2837 case X86::VCMPPDZ128rrik:
2838 case X86::VCMPPSZ128rrik:
2839 case X86::VCMPPHZ128rrik:
2840 case X86::VCMPPDZ256rrik:
2841 case X86::VCMPPSZ256rrik:
2842 case X86::VCMPPHZ256rrik: {
2847 unsigned Imm =
MI.getOperand(3 + OpOffset).getImm() & 0x7;
2864 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 1 + OpOffset,
2871 if (Subtarget.hasSSE41())
2874 case X86::SHUFPDrri:
2876 if (
MI.getOperand(3).getImm() == 0x02)
2879 case X86::MOVHLPSrr:
2880 case X86::UNPCKHPDrr:
2881 case X86::VMOVHLPSrr:
2882 case X86::VUNPCKHPDrr:
2883 case X86::VMOVHLPSZrr:
2884 case X86::VUNPCKHPDZ128rr:
2885 if (Subtarget.hasSSE2())
2888 case X86::VPTERNLOGDZrri:
2889 case X86::VPTERNLOGDZrmi:
2890 case X86::VPTERNLOGDZ128rri:
2891 case X86::VPTERNLOGDZ128rmi:
2892 case X86::VPTERNLOGDZ256rri:
2893 case X86::VPTERNLOGDZ256rmi:
2894 case X86::VPTERNLOGQZrri:
2895 case X86::VPTERNLOGQZrmi:
2896 case X86::VPTERNLOGQZ128rri:
2897 case X86::VPTERNLOGQZ128rmi:
2898 case X86::VPTERNLOGQZ256rri:
2899 case X86::VPTERNLOGQZ256rmi:
2900 case X86::VPTERNLOGDZrrik:
2901 case X86::VPTERNLOGDZ128rrik:
2902 case X86::VPTERNLOGDZ256rrik:
2903 case X86::VPTERNLOGQZrrik:
2904 case X86::VPTERNLOGQZ128rrik:
2905 case X86::VPTERNLOGQZ256rrik:
2906 case X86::VPTERNLOGDZrrikz:
2907 case X86::VPTERNLOGDZrmikz:
2908 case X86::VPTERNLOGDZ128rrikz:
2909 case X86::VPTERNLOGDZ128rmikz:
2910 case X86::VPTERNLOGDZ256rrikz:
2911 case X86::VPTERNLOGDZ256rmikz:
2912 case X86::VPTERNLOGQZrrikz:
2913 case X86::VPTERNLOGQZrmikz:
2914 case X86::VPTERNLOGQZ128rrikz:
2915 case X86::VPTERNLOGQZ128rmikz:
2916 case X86::VPTERNLOGQZ256rrikz:
2917 case X86::VPTERNLOGQZ256rmikz:
2918 case X86::VPTERNLOGDZ128rmbi:
2919 case X86::VPTERNLOGDZ256rmbi:
2920 case X86::VPTERNLOGDZrmbi:
2921 case X86::VPTERNLOGQZ128rmbi:
2922 case X86::VPTERNLOGQZ256rmbi:
2923 case X86::VPTERNLOGQZrmbi:
2924 case X86::VPTERNLOGDZ128rmbikz:
2925 case X86::VPTERNLOGDZ256rmbikz:
2926 case X86::VPTERNLOGDZrmbikz:
2927 case X86::VPTERNLOGQZ128rmbikz:
2928 case X86::VPTERNLOGQZ256rmbikz:
2929 case X86::VPTERNLOGQZrmbikz:
2930 return findThreeSrcCommutedOpIndices(
MI, SrcOpIdx1, SrcOpIdx2);
2931 case X86::VPDPWSSDYrr:
2932 case X86::VPDPWSSDrr:
2933 case X86::VPDPWSSDSYrr:
2934 case X86::VPDPWSSDSrr:
2935 case X86::VPDPWUUDrr:
2936 case X86::VPDPWUUDYrr:
2937 case X86::VPDPWUUDSrr:
2938 case X86::VPDPWUUDSYrr:
2939 case X86::VPDPBSSDSrr:
2940 case X86::VPDPBSSDSYrr:
2941 case X86::VPDPBSSDrr:
2942 case X86::VPDPBSSDYrr:
2943 case X86::VPDPBUUDSrr:
2944 case X86::VPDPBUUDSYrr:
2945 case X86::VPDPBUUDrr:
2946 case X86::VPDPBUUDYrr:
2947 case X86::VPDPBSSDSZ128rr:
2948 case X86::VPDPBSSDSZ128rrk:
2949 case X86::VPDPBSSDSZ128rrkz:
2950 case X86::VPDPBSSDSZ256rr:
2951 case X86::VPDPBSSDSZ256rrk:
2952 case X86::VPDPBSSDSZ256rrkz:
2953 case X86::VPDPBSSDSZrr:
2954 case X86::VPDPBSSDSZrrk:
2955 case X86::VPDPBSSDSZrrkz:
2956 case X86::VPDPBSSDZ128rr:
2957 case X86::VPDPBSSDZ128rrk:
2958 case X86::VPDPBSSDZ128rrkz:
2959 case X86::VPDPBSSDZ256rr:
2960 case X86::VPDPBSSDZ256rrk:
2961 case X86::VPDPBSSDZ256rrkz:
2962 case X86::VPDPBSSDZrr:
2963 case X86::VPDPBSSDZrrk:
2964 case X86::VPDPBSSDZrrkz:
2965 case X86::VPDPBUUDSZ128rr:
2966 case X86::VPDPBUUDSZ128rrk:
2967 case X86::VPDPBUUDSZ128rrkz:
2968 case X86::VPDPBUUDSZ256rr:
2969 case X86::VPDPBUUDSZ256rrk:
2970 case X86::VPDPBUUDSZ256rrkz:
2971 case X86::VPDPBUUDSZrr:
2972 case X86::VPDPBUUDSZrrk:
2973 case X86::VPDPBUUDSZrrkz:
2974 case X86::VPDPBUUDZ128rr:
2975 case X86::VPDPBUUDZ128rrk:
2976 case X86::VPDPBUUDZ128rrkz:
2977 case X86::VPDPBUUDZ256rr:
2978 case X86::VPDPBUUDZ256rrk:
2979 case X86::VPDPBUUDZ256rrkz:
2980 case X86::VPDPBUUDZrr:
2981 case X86::VPDPBUUDZrrk:
2982 case X86::VPDPBUUDZrrkz:
2983 case X86::VPDPWSSDZ128rr:
2984 case X86::VPDPWSSDZ128rrk:
2985 case X86::VPDPWSSDZ128rrkz:
2986 case X86::VPDPWSSDZ256rr:
2987 case X86::VPDPWSSDZ256rrk:
2988 case X86::VPDPWSSDZ256rrkz:
2989 case X86::VPDPWSSDZrr:
2990 case X86::VPDPWSSDZrrk:
2991 case X86::VPDPWSSDZrrkz:
2992 case X86::VPDPWSSDSZ128rr:
2993 case X86::VPDPWSSDSZ128rrk:
2994 case X86::VPDPWSSDSZ128rrkz:
2995 case X86::VPDPWSSDSZ256rr:
2996 case X86::VPDPWSSDSZ256rrk:
2997 case X86::VPDPWSSDSZ256rrkz:
2998 case X86::VPDPWSSDSZrr:
2999 case X86::VPDPWSSDSZrrk:
3000 case X86::VPDPWSSDSZrrkz:
3001 case X86::VPDPWUUDZ128rr:
3002 case X86::VPDPWUUDZ128rrk:
3003 case X86::VPDPWUUDZ128rrkz:
3004 case X86::VPDPWUUDZ256rr:
3005 case X86::VPDPWUUDZ256rrk:
3006 case X86::VPDPWUUDZ256rrkz:
3007 case X86::VPDPWUUDZrr:
3008 case X86::VPDPWUUDZrrk:
3009 case X86::VPDPWUUDZrrkz:
3010 case X86::VPDPWUUDSZ128rr:
3011 case X86::VPDPWUUDSZ128rrk:
3012 case X86::VPDPWUUDSZ128rrkz:
3013 case X86::VPDPWUUDSZ256rr:
3014 case X86::VPDPWUUDSZ256rrk:
3015 case X86::VPDPWUUDSZ256rrkz:
3016 case X86::VPDPWUUDSZrr:
3017 case X86::VPDPWUUDSZrrk:
3018 case X86::VPDPWUUDSZrrkz:
3019 case X86::VPMADD52HUQrr:
3020 case X86::VPMADD52HUQYrr:
3021 case X86::VPMADD52HUQZ128r:
3022 case X86::VPMADD52HUQZ128rk:
3023 case X86::VPMADD52HUQZ128rkz:
3024 case X86::VPMADD52HUQZ256r:
3025 case X86::VPMADD52HUQZ256rk:
3026 case X86::VPMADD52HUQZ256rkz:
3027 case X86::VPMADD52HUQZr:
3028 case X86::VPMADD52HUQZrk:
3029 case X86::VPMADD52HUQZrkz:
3030 case X86::VPMADD52LUQrr:
3031 case X86::VPMADD52LUQYrr:
3032 case X86::VPMADD52LUQZ128r:
3033 case X86::VPMADD52LUQZ128rk:
3034 case X86::VPMADD52LUQZ128rkz:
3035 case X86::VPMADD52LUQZ256r:
3036 case X86::VPMADD52LUQZ256rk:
3037 case X86::VPMADD52LUQZ256rkz:
3038 case X86::VPMADD52LUQZr:
3039 case X86::VPMADD52LUQZrk:
3040 case X86::VPMADD52LUQZrkz:
3041 case X86::VFMADDCPHZr:
3042 case X86::VFMADDCPHZrk:
3043 case X86::VFMADDCPHZrkz:
3044 case X86::VFMADDCPHZ128r:
3045 case X86::VFMADDCPHZ128rk:
3046 case X86::VFMADDCPHZ128rkz:
3047 case X86::VFMADDCPHZ256r:
3048 case X86::VFMADDCPHZ256rk:
3049 case X86::VFMADDCPHZ256rkz:
3050 case X86::VFMADDCSHZr:
3051 case X86::VFMADDCSHZrk:
3052 case X86::VFMADDCSHZrkz: {
3053 unsigned CommutableOpIdx1 = 2;
3054 unsigned CommutableOpIdx2 = 3;
3060 if (!fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, CommutableOpIdx1,
3063 if (!
MI.getOperand(SrcOpIdx1).isReg() || !
MI.getOperand(SrcOpIdx2).isReg())
3073 return findThreeSrcCommutedOpIndices(
MI, SrcOpIdx1, SrcOpIdx2,
3080 unsigned CommutableOpIdx1 =
Desc.getNumDefs() + 1;
3081 unsigned CommutableOpIdx2 =
Desc.getNumDefs() + 2;
3084 if ((
MI.getDesc().getOperandConstraint(
Desc.getNumDefs(),
3099 if (!fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, CommutableOpIdx1,
3103 if (!
MI.getOperand(SrcOpIdx1).isReg() ||
3104 !
MI.getOperand(SrcOpIdx2).isReg())
3116 unsigned Opcode =
MI->getOpcode();
3117 if (Opcode != X86::LEA32r && Opcode != X86::LEA64r &&
3118 Opcode != X86::LEA64_32r)
3140 unsigned Opcode =
MI.getOpcode();
3141 if (Opcode != X86::ADD32rr && Opcode != X86::ADD64rr)
3168 unsigned Opcode =
MCID.getOpcode();
3169 if (!(X86::isJCC(Opcode) || X86::isSETCC(Opcode) || X86::isSETZUCC(Opcode) ||
3170 X86::isCMOVCC(Opcode) || X86::isCFCMOVCC(Opcode) ||
3171 X86::isCCMPCC(Opcode) || X86::isCTESTCC(Opcode)))
3174 unsigned NumUses =
MCID.getNumOperands() -
MCID.getNumDefs();
3183 CondNo +=
MCID.getNumDefs();
3193 return X86::isSETCC(
MI.getOpcode()) || X86::isSETZUCC(
MI.getOpcode())
3209 return X86::isCCMPCC(
MI.getOpcode()) || X86::isCTESTCC(
MI.getOpcode())
3240 enum { CF = 1, ZF = 2, SF = 4, OF = 8, PF = CF };
3271#define GET_X86_NF_TRANSFORM_TABLE
3272#define GET_X86_ND2NONND_TABLE
3273#include "X86GenInstrMapping.inc"
3278 return (
I == Table.
end() ||
I->OldOpc !=
Opc) ? 0U :
I->NewOpc;
3281#if defined(EXPENSIVE_CHECKS) && !defined(NDEBUG)
3283 static std::atomic<bool> NFTableChecked(
false);
3284 if (!NFTableChecked.load(std::memory_order_relaxed)) {
3286 "X86NFTransformTable is not sorted!");
3287 NFTableChecked.store(
true, std::memory_order_relaxed);
3294#if defined(EXPENSIVE_CHECKS) && !defined(NDEBUG)
3296 static std::atomic<bool> NDTableChecked(
false);
3297 if (!NDTableChecked.load(std::memory_order_relaxed)) {
3299 "X86ND2NonNDTableis not sorted!");
3300 NDTableChecked.store(
true, std::memory_order_relaxed);
3380std::pair<X86::CondCode, bool>
3383 bool NeedSwap =
false;
3384 switch (Predicate) {
3463 return std::make_pair(CC, NeedSwap);
3472#define GET_ND_IF_ENABLED(OPC) (HasNDD ? OPC##_ND : OPC)
3487 return X86::MOV32ri;
3490 return X86::MOV32ri64;
3492 return X86::MOV64ri32;
3493 return X86::MOV64ri;
3577 switch (Imm & 0x3) {
3595 if (Info.RegClass == X86::VR128RegClassID ||
3596 Info.RegClass == X86::VR128XRegClassID)
3598 if (Info.RegClass == X86::VR256RegClassID ||
3599 Info.RegClass == X86::VR256XRegClassID)
3601 if (Info.RegClass == X86::VR512RegClassID)
3608 return (
Reg == X86::FPCW ||
Reg == X86::FPSW ||
3609 (
Reg >= X86::ST0 &&
Reg <= X86::ST7));
3617 if (
MI.isCall() ||
MI.isInlineAsm())
3641#ifdef EXPENSIVE_CHECKS
3643 "Got false negative from X86II::getMemoryOperandNo()!");
3653#ifdef EXPENSIVE_CHECKS
3655 "Expected no operands to have OPERAND_MEMORY type!");
3664 if (IsMemOp(
Desc.operands()[
I])) {
3665#ifdef EXPENSIVE_CHECKS
3669 "Expected all five operands in the memory reference to have "
3670 "OPERAND_MEMORY type!");
3682 "Unexpected number of operands!");
3685 if (!Index.isReg() || Index.getReg() != X86::NoRegister)
3693 MI.getParent()->getParent()->getConstantPool()->getConstants();
3705 switch (
MI.getOpcode()) {
3706 case X86::TCRETURNdi:
3707 case X86::TCRETURNri:
3708 case X86::TCRETURNmi:
3709 case X86::TCRETURNdi64:
3710 case X86::TCRETURNri64:
3711 case X86::TCRETURNri64_ImpCall:
3712 case X86::TCRETURNmi64:
3731 if (Symbol ==
"__x86_indirect_thunk_r11")
3736 if (TailCall.
getOpcode() != X86::TCRETURNdi &&
3737 TailCall.
getOpcode() != X86::TCRETURNdi64) {
3742 if (Subtarget.isTargetWin64() && MF->
hasWinCFI()) {
3769 while (
I !=
MBB.begin()) {
3771 if (
I->isDebugInstr())
3774 assert(0 &&
"Can't find the branch to replace!");
3778 if (CC != BranchCond[0].
getImm())
3784 unsigned Opc = TailCall.
getOpcode() == X86::TCRETURNdi ? X86::TCRETURNdicc
3785 : X86::TCRETURNdi64cc;
3798 LiveRegs.stepForward(*MIB, Clobbers);
3799 for (
const auto &
C : Clobbers) {
3804 I->eraseFromParent();
3818 if (Succ->isEHPad() || (Succ ==
TBB && FallthroughBB))
3821 if (FallthroughBB && FallthroughBB !=
TBB)
3823 FallthroughBB = Succ;
3825 return FallthroughBB;
3828bool X86InstrInfo::analyzeBranchImpl(
3839 if (
I->isDebugInstr())
3844 if (!isUnpredicatedTerminator(*
I))
3853 if (
I->getOpcode() == X86::JMP_1) {
3857 TBB =
I->getOperand(0).getMBB();
3872 UnCondBrIter =
MBB.
end();
3877 TBB =
I->getOperand(0).getMBB();
3888 if (
I->findRegisterUseOperand(X86::EFLAGS,
nullptr)->isUndef())
3894 TBB =
I->getOperand(0).getMBB();
3909 if (OldBranchCode == BranchCode &&
TBB == NewTBB)
3915 if (
TBB == NewTBB &&
3948 Cond[0].setImm(BranchCode);
3959 bool AllowModify)
const {
3961 return analyzeBranchImpl(
MBB,
TBB, FBB,
Cond, CondBranches, AllowModify);
3967 assert(MemRefBegin >= 0 &&
"instr should have memory operand");
3979 if (!
Reg.isVirtual())
3984 unsigned Opcode =
MI->getOpcode();
3985 if (Opcode != X86::LEA64r && Opcode != X86::LEA32r)
3991 unsigned Opcode =
MI.getOpcode();
3994 if (Opcode == X86::JMP64m || Opcode == X86::JMP32m) {
4002 if (Opcode == X86::JMP64r || Opcode == X86::JMP32r) {
4004 if (!Reg.isVirtual())
4011 if (
Add->getOpcode() != X86::ADD64rr &&
Add->getOpcode() != X86::ADD32rr)
4024 MachineBranchPredicate &MBP,
4025 bool AllowModify)
const {
4026 using namespace std::placeholders;
4030 if (analyzeBranchImpl(
MBB, MBP.TrueDest, MBP.FalseDest,
Cond, CondBranches,
4034 if (
Cond.size() != 1)
4037 assert(MBP.TrueDest &&
"expected!");
4040 MBP.FalseDest =
MBB.getNextNode();
4045 bool SingleUseCondition =
true;
4048 if (
MI.modifiesRegister(X86::EFLAGS,
TRI)) {
4053 if (
MI.readsRegister(X86::EFLAGS,
TRI))
4054 SingleUseCondition =
false;
4060 if (SingleUseCondition) {
4061 for (
auto *Succ :
MBB.successors())
4062 if (Succ->isLiveIn(X86::EFLAGS))
4063 SingleUseCondition =
false;
4066 MBP.ConditionDef = ConditionDef;
4067 MBP.SingleUseCondition = SingleUseCondition;
4074 const unsigned TestOpcode =
4075 Subtarget.is64Bit() ? X86::TEST64rr : X86::TEST32rr;
4077 if (ConditionDef->
getOpcode() == TestOpcode &&
4084 ? MachineBranchPredicate::PRED_NE
4085 : MachineBranchPredicate::PRED_EQ;
4093 int *BytesRemoved)
const {
4094 assert(!BytesRemoved &&
"code size not handled");
4099 while (
I !=
MBB.begin()) {
4101 if (
I->isDebugInstr())
4103 if (
I->getOpcode() != X86::JMP_1 &&
4107 I->eraseFromParent();
4121 assert(
TBB &&
"insertBranch must not be told to insert a fallthrough");
4123 "X86 branch conditions have one component!");
4124 assert(!BytesAdded &&
"code size not handled");
4128 assert(!FBB &&
"Unconditional branch with multiple successors!");
4134 bool FallThru = FBB ==
nullptr;
4149 if (FBB ==
nullptr) {
4151 assert(FBB &&
"MBB cannot be the last block in function when the false "
4152 "body is a fall-through.");
4176 Register FalseReg,
int &CondCycles,
4177 int &TrueCycles,
int &FalseCycles)
const {
4179 if (!Subtarget.canUseCMOV())
4181 if (
Cond.size() != 1)
4195 if (X86::GR16RegClass.hasSubClassEq(RC) ||
4196 X86::GR32RegClass.hasSubClassEq(RC) ||
4197 X86::GR64RegClass.hasSubClassEq(RC)) {
4218 assert(
Cond.size() == 1 &&
"Invalid Cond array");
4221 false , Subtarget.hasNDD());
4230 return X86::GR8_ABCD_HRegClass.contains(
Reg);
4236 bool HasAVX = Subtarget.
hasAVX();
4238 bool HasEGPR = Subtarget.hasEGPR();
4245 if (X86::VK16RegClass.
contains(SrcReg)) {
4246 if (X86::GR64RegClass.
contains(DestReg)) {
4247 assert(Subtarget.hasBWI());
4248 return HasEGPR ? X86::KMOVQrk_EVEX : X86::KMOVQrk;
4250 if (X86::GR32RegClass.
contains(DestReg))
4251 return Subtarget.hasBWI() ? (HasEGPR ? X86::KMOVDrk_EVEX : X86::KMOVDrk)
4252 : (HasEGPR ? X86::KMOVWrk_EVEX : X86::KMOVWrk);
4260 if (X86::VK16RegClass.
contains(DestReg)) {
4261 if (X86::GR64RegClass.
contains(SrcReg)) {
4262 assert(Subtarget.hasBWI());
4263 return HasEGPR ? X86::KMOVQkr_EVEX : X86::KMOVQkr;
4265 if (X86::GR32RegClass.
contains(SrcReg))
4266 return Subtarget.hasBWI() ? (HasEGPR ? X86::KMOVDkr_EVEX : X86::KMOVDkr)
4267 : (HasEGPR ? X86::KMOVWkr_EVEX : X86::KMOVWkr);
4275 if (X86::GR64RegClass.
contains(DestReg)) {
4276 if (X86::VR128XRegClass.
contains(SrcReg))
4278 return HasAVX512 ? X86::VMOVPQIto64Zrr
4279 : HasAVX ? X86::VMOVPQIto64rr
4280 : X86::MOVPQIto64rr;
4281 if (X86::VR64RegClass.
contains(SrcReg))
4283 return X86::MMX_MOVD64from64rr;
4284 }
else if (X86::GR64RegClass.
contains(SrcReg)) {
4286 if (X86::VR128XRegClass.
contains(DestReg))
4287 return HasAVX512 ? X86::VMOV64toPQIZrr
4288 : HasAVX ? X86::VMOV64toPQIrr
4289 : X86::MOV64toPQIrr;
4291 if (X86::VR64RegClass.
contains(DestReg))
4292 return X86::MMX_MOVD64to64rr;
4298 if (X86::GR32RegClass.
contains(DestReg) &&
4299 X86::VR128XRegClass.
contains(SrcReg))
4301 return HasAVX512 ? X86::VMOVPDI2DIZrr
4302 : HasAVX ? X86::VMOVPDI2DIrr
4305 if (X86::VR128XRegClass.
contains(DestReg) &&
4306 X86::GR32RegClass.
contains(SrcReg))
4308 return HasAVX512 ? X86::VMOVDI2PDIZrr
4309 : HasAVX ? X86::VMOVDI2PDIrr
4319 bool RenamableDest,
bool RenamableSrc)
const {
4321 bool HasAVX = Subtarget.hasAVX();
4322 bool HasVLX = Subtarget.hasVLX();
4323 bool HasEGPR = Subtarget.hasEGPR();
4325 if (X86::GR64RegClass.
contains(DestReg, SrcReg))
4327 else if (X86::GR32RegClass.
contains(DestReg, SrcReg))
4329 else if (X86::GR16RegClass.
contains(DestReg, SrcReg))
4331 else if (X86::GR8RegClass.
contains(DestReg, SrcReg)) {
4334 if ((
isHReg(DestReg) ||
isHReg(SrcReg)) && Subtarget.is64Bit()) {
4335 Opc = X86::MOV8rr_NOREX;
4338 "8-bit H register can not be copied outside GR8_NOREX");
4341 }
else if (X86::VR64RegClass.
contains(DestReg, SrcReg))
4342 Opc = X86::MMX_MOVQ64rr;
4343 else if (X86::VR128XRegClass.
contains(DestReg, SrcReg)) {
4345 Opc = X86::VMOVAPSZ128rr;
4346 else if (X86::VR128RegClass.
contains(DestReg, SrcReg))
4347 Opc = HasAVX ? X86::VMOVAPSrr : X86::MOVAPSrr;
4351 Opc = X86::VMOVAPSZrr;
4354 TRI->getMatchingSuperReg(DestReg, X86::sub_xmm, &X86::VR512RegClass);
4356 TRI->getMatchingSuperReg(SrcReg, X86::sub_xmm, &X86::VR512RegClass);
4358 }
else if (X86::VR256XRegClass.
contains(DestReg, SrcReg)) {
4360 Opc = X86::VMOVAPSZ256rr;
4361 else if (X86::VR256RegClass.
contains(DestReg, SrcReg))
4362 Opc = X86::VMOVAPSYrr;
4366 Opc = X86::VMOVAPSZrr;
4369 TRI->getMatchingSuperReg(DestReg, X86::sub_ymm, &X86::VR512RegClass);
4371 TRI->getMatchingSuperReg(SrcReg, X86::sub_ymm, &X86::VR512RegClass);
4373 }
else if (X86::VR512RegClass.
contains(DestReg, SrcReg))
4374 Opc = X86::VMOVAPSZrr;
4377 else if (X86::VK16RegClass.
contains(DestReg, SrcReg))
4378 Opc = Subtarget.hasBWI() ? (HasEGPR ? X86::KMOVQkk_EVEX : X86::KMOVQkk)
4379 : (HasEGPR ? X86::KMOVWkk_EVEX : X86::KMOVWkk);
4390 if (SrcReg == X86::EFLAGS || DestReg == X86::EFLAGS) {
4398 LLVM_DEBUG(
dbgs() <<
"Cannot copy " << RI.getName(SrcReg) <<
" to "
4399 << RI.getName(DestReg) <<
'\n');
4403std::optional<DestSourcePair>
4405 if (
MI.isMoveReg()) {
4409 if (
MI.getOperand(0).isUndef() &&
MI.getOperand(0).getSubReg())
4410 return std::nullopt;
4414 return std::nullopt;
4419 return Load ? X86::VMOVSHZrm_alt : X86::VMOVSHZmr;
4421 return X86::MOVSHPrm;
4422 return X86::MOVSHPmr;
4427 bool IsStackAligned,
4429 bool HasAVX = STI.
hasAVX();
4431 bool HasVLX = STI.hasVLX();
4432 bool HasEGPR = STI.hasEGPR();
4434 assert(RC !=
nullptr &&
"Invalid target register class");
4439 assert(X86::GR8RegClass.hasSubClassEq(RC) &&
"Unknown 1-byte regclass");
4443 if (
isHReg(
Reg) || X86::GR8_ABCD_HRegClass.hasSubClassEq(RC))
4444 return Load ? X86::MOV8rm_NOREX : X86::MOV8mr_NOREX;
4445 return Load ? X86::MOV8rm : X86::MOV8mr;
4447 if (X86::VK16RegClass.hasSubClassEq(RC))
4448 return Load ? (HasEGPR ? X86::KMOVWkm_EVEX : X86::KMOVWkm)
4449 : (HasEGPR ? X86::KMOVWmk_EVEX : X86::KMOVWmk);
4450 assert(X86::GR16RegClass.hasSubClassEq(RC) &&
"Unknown 2-byte regclass");
4451 return Load ? X86::MOV16rm : X86::MOV16mr;
4453 if (X86::GR32RegClass.hasSubClassEq(RC))
4454 return Load ? X86::MOV32rm : X86::MOV32mr;
4455 if (X86::FR32XRegClass.hasSubClassEq(RC))
4456 return Load ? (HasAVX512 ? X86::VMOVSSZrm_alt
4457 : HasAVX ? X86::VMOVSSrm_alt
4459 : (HasAVX512 ? X86::VMOVSSZmr
4460 : HasAVX ? X86::VMOVSSmr
4462 if (X86::RFP32RegClass.hasSubClassEq(RC))
4463 return Load ? X86::LD_Fp32m : X86::ST_Fp32m;
4464 if (X86::VK32RegClass.hasSubClassEq(RC)) {
4465 assert(STI.hasBWI() &&
"KMOVD requires BWI");
4466 return Load ? (HasEGPR ? X86::KMOVDkm_EVEX : X86::KMOVDkm)
4467 : (HasEGPR ? X86::KMOVDmk_EVEX : X86::KMOVDmk);
4471 if (X86::VK1PAIRRegClass.hasSubClassEq(RC) ||
4472 X86::VK2PAIRRegClass.hasSubClassEq(RC) ||
4473 X86::VK4PAIRRegClass.hasSubClassEq(RC) ||
4474 X86::VK8PAIRRegClass.hasSubClassEq(RC) ||
4475 X86::VK16PAIRRegClass.hasSubClassEq(RC))
4476 return Load ? X86::MASKPAIR16LOAD : X86::MASKPAIR16STORE;
4477 if (X86::FR16RegClass.hasSubClassEq(RC) ||
4478 X86::FR16XRegClass.hasSubClassEq(RC))
4482 if (X86::GR64RegClass.hasSubClassEq(RC))
4483 return Load ? X86::MOV64rm : X86::MOV64mr;
4484 if (X86::FR64XRegClass.hasSubClassEq(RC))
4485 return Load ? (HasAVX512 ? X86::VMOVSDZrm_alt
4486 : HasAVX ? X86::VMOVSDrm_alt
4488 : (HasAVX512 ? X86::VMOVSDZmr
4489 : HasAVX ? X86::VMOVSDmr
4491 if (X86::VR64RegClass.hasSubClassEq(RC))
4492 return Load ? X86::MMX_MOVQ64rm : X86::MMX_MOVQ64mr;
4493 if (X86::RFP64RegClass.hasSubClassEq(RC))
4494 return Load ? X86::LD_Fp64m : X86::ST_Fp64m;
4495 if (X86::VK64RegClass.hasSubClassEq(RC)) {
4496 assert(STI.hasBWI() &&
"KMOVQ requires BWI");
4497 return Load ? (HasEGPR ? X86::KMOVQkm_EVEX : X86::KMOVQkm)
4498 : (HasEGPR ? X86::KMOVQmk_EVEX : X86::KMOVQmk);
4502 assert(X86::RFP80RegClass.hasSubClassEq(RC) &&
"Unknown 10-byte regclass");
4503 return Load ? X86::LD_Fp80m : X86::ST_FpP80m;
4505 if (X86::VR128XRegClass.hasSubClassEq(RC)) {
4508 return Load ? (HasVLX ? X86::VMOVAPSZ128rm
4509 : HasAVX512 ? X86::VMOVAPSZ128rm_NOVLX
4510 : HasAVX ? X86::VMOVAPSrm
4512 : (HasVLX ? X86::VMOVAPSZ128mr
4513 : HasAVX512 ? X86::VMOVAPSZ128mr_NOVLX
4514 : HasAVX ? X86::VMOVAPSmr
4517 return Load ? (HasVLX ? X86::VMOVUPSZ128rm
4518 : HasAVX512 ? X86::VMOVUPSZ128rm_NOVLX
4519 : HasAVX ? X86::VMOVUPSrm
4521 : (HasVLX ? X86::VMOVUPSZ128mr
4522 : HasAVX512 ? X86::VMOVUPSZ128mr_NOVLX
4523 : HasAVX ? X86::VMOVUPSmr
4529 assert(X86::VR256XRegClass.hasSubClassEq(RC) &&
"Unknown 32-byte regclass");
4532 return Load ? (HasVLX ? X86::VMOVAPSZ256rm
4533 : HasAVX512 ? X86::VMOVAPSZ256rm_NOVLX
4535 : (HasVLX ? X86::VMOVAPSZ256mr
4536 : HasAVX512 ? X86::VMOVAPSZ256mr_NOVLX
4539 return Load ? (HasVLX ? X86::VMOVUPSZ256rm
4540 : HasAVX512 ? X86::VMOVUPSZ256rm_NOVLX
4542 : (HasVLX ? X86::VMOVUPSZ256mr
4543 : HasAVX512 ? X86::VMOVUPSZ256mr_NOVLX
4546 assert(X86::VR512RegClass.hasSubClassEq(RC) &&
"Unknown 64-byte regclass");
4549 return Load ? X86::VMOVAPSZrm : X86::VMOVAPSZmr;
4551 return Load ? X86::VMOVUPSZrm : X86::VMOVUPSZmr;
4553 assert(X86::TILERegClass.hasSubClassEq(RC) &&
"Unknown 1024-byte regclass");
4554 assert(STI.hasAMXTILE() &&
"Using 8*1024-bit register requires AMX-TILE");
4555#define GET_EGPR_IF_ENABLED(OPC) (STI.hasEGPR() ? OPC##_EVEX : OPC)
4558#undef GET_EGPR_IF_ENABLED
4562std::optional<ExtAddrMode>
4567 if (MemRefBegin < 0)
4568 return std::nullopt;
4573 if (!BaseOp.isReg())
4574 return std::nullopt;
4578 if (!DispMO.
isImm())
4579 return std::nullopt;
4605 ErrInfo =
"Scale factor in address must be 1, 2, 4 or 8";
4610 ErrInfo =
"Displacement in address must fit into 32-bit signed "
4620 int64_t &ImmVal)
const {
4626 if (
MI.isSubregToReg()) {
4630 unsigned SubIdx =
MI.getOperand(2).getImm();
4631 MovReg =
MI.getOperand(1).getReg();
4632 if (SubIdx != X86::sub_32bit)
4640 if (MovMI->
getOpcode() == X86::MOV32r0 &&
4646 if (MovMI->
getOpcode() != X86::MOV32ri &&
4660 if (!
MI->modifiesRegister(NullValueReg,
TRI))
4662 switch (
MI->getOpcode()) {
4669 assert(
MI->getOperand(0).isDef() &&
MI->getOperand(1).isUse() &&
4670 "expected for shift opcode!");
4671 return MI->getOperand(0).getReg() == NullValueReg &&
4672 MI->getOperand(1).getReg() == NullValueReg;
4677 return TRI->isSubRegisterEq(NullValueReg, MO.getReg());
4691 if (MemRefBegin < 0)
4698 if (!BaseOp->
isReg())
4711 if (!DispMO.
isImm())
4716 if (!BaseOp->
isReg())
4719 OffsetIsScalable =
false;
4723 Width = !
MemOp.memoperands_empty() ?
MemOp.memoperands().front()->getSize()
4731 bool IsStackAligned,
4746 case X86::TILELOADD:
4747 case X86::TILESTORED:
4748 case X86::TILELOADD_EVEX:
4749 case X86::TILESTORED_EVEX:
4757 bool isKill)
const {
4761 case X86::TILESTORED:
4762 case X86::TILESTORED_EVEX: {
4765 Register VirtReg = RegInfo.createVirtualRegister(&X86::GR64_NOSPRegClass);
4775 case X86::TILELOADD:
4776 case X86::TILELOADD_EVEX: {
4779 Register VirtReg = RegInfo.createVirtualRegister(&X86::GR64_NOSPRegClass);
4799 "Stack slot too small for store");
4801 unsigned Alignment = std::max<uint32_t>(RI.getSpillSize(*RC), 16);
4803 (Subtarget.getFrameLowering()->
getStackAlign() >= Alignment) ||
4824 "Load size exceeds stack slot");
4825 unsigned Alignment = std::max<uint32_t>(RI.getSpillSize(*RC), 16);
4827 (Subtarget.getFrameLowering()->
getStackAlign() >= Alignment) ||
4839 Register &SrcReg2, int64_t &CmpMask,
4840 int64_t &CmpValue)
const {
4841 switch (
MI.getOpcode()) {
4844 case X86::CMP64ri32:
4848 SrcReg =
MI.getOperand(0).getReg();
4850 if (
MI.getOperand(1).isImm()) {
4852 CmpValue =
MI.getOperand(1).getImm();
4854 CmpMask = CmpValue = 0;
4862 SrcReg =
MI.getOperand(1).getReg();
4871 SrcReg =
MI.getOperand(1).getReg();
4872 SrcReg2 =
MI.getOperand(2).getReg();
4880 SrcReg =
MI.getOperand(1).getReg();
4882 if (
MI.getOperand(2).isImm()) {
4884 CmpValue =
MI.getOperand(2).getImm();
4886 CmpMask = CmpValue = 0;
4893 SrcReg =
MI.getOperand(0).getReg();
4894 SrcReg2 =
MI.getOperand(1).getReg();
4902 SrcReg =
MI.getOperand(0).getReg();
4903 if (
MI.getOperand(1).getReg() != SrcReg)
4910 case X86::TEST64ri32:
4914 SrcReg =
MI.getOperand(0).getReg();
4924bool X86InstrInfo::isRedundantFlagInstr(
const MachineInstr &FlagI,
4926 int64_t ImmMask, int64_t ImmValue,
4928 int64_t *ImmDelta)
const {
4943 OIMask != ImmMask || OIValue != ImmValue)
4945 if (SrcReg == OISrcReg && SrcReg2 == OISrcReg2) {
4949 if (SrcReg == OISrcReg2 && SrcReg2 == OISrcReg) {
4955 case X86::CMP64ri32:
4959 case X86::TEST64ri32:
4970 case X86::TEST8rr: {
4977 SrcReg == OISrcReg && ImmMask == OIMask) {
4978 if (OIValue == ImmValue) {
4981 }
else if (
static_cast<uint64_t
>(ImmValue) ==
4982 static_cast<uint64_t
>(OIValue) - 1) {
4985 }
else if (
static_cast<uint64_t
>(ImmValue) ==
4986 static_cast<uint64_t
>(OIValue) + 1) {
5004 bool &ClearsOverflowFlag) {
5006 ClearsOverflowFlag =
false;
5012 if (
MI.getOpcode() == X86::ADD64rm ||
MI.getOpcode() == X86::ADD32rm) {
5013 unsigned Flags =
MI.getOperand(5).getTargetFlags();
5019 switch (
MI.getOpcode()) {
5115 case X86::LZCNT16rr:
5116 case X86::LZCNT16rm:
5117 case X86::LZCNT32rr:
5118 case X86::LZCNT32rm:
5119 case X86::LZCNT64rr:
5120 case X86::LZCNT64rm:
5121 case X86::POPCNT16rr:
5122 case X86::POPCNT16rm:
5123 case X86::POPCNT32rr:
5124 case X86::POPCNT32rm:
5125 case X86::POPCNT64rr:
5126 case X86::POPCNT64rm:
5127 case X86::TZCNT16rr:
5128 case X86::TZCNT16rm:
5129 case X86::TZCNT32rr:
5130 case X86::TZCNT32rm:
5131 case X86::TZCNT64rr:
5132 case X86::TZCNT64rm:
5178 case X86::BLSMSK32rr:
5179 case X86::BLSMSK32rm:
5180 case X86::BLSMSK64rr:
5181 case X86::BLSMSK64rm:
5186 case X86::BLCFILL32rr:
5187 case X86::BLCFILL32rm:
5188 case X86::BLCFILL64rr:
5189 case X86::BLCFILL64rm:
5194 case X86::BLCIC32rr:
5195 case X86::BLCIC32rm:
5196 case X86::BLCIC64rr:
5197 case X86::BLCIC64rm:
5198 case X86::BLCMSK32rr:
5199 case X86::BLCMSK32rm:
5200 case X86::BLCMSK64rr:
5201 case X86::BLCMSK64rm:
5206 case X86::BLSFILL32rr:
5207 case X86::BLSFILL32rm:
5208 case X86::BLSFILL64rr:
5209 case X86::BLSFILL64rm:
5210 case X86::BLSIC32rr:
5211 case X86::BLSIC32rm:
5212 case X86::BLSIC64rr:
5213 case X86::BLSIC64rm:
5218 case X86::T1MSKC32rr:
5219 case X86::T1MSKC32rm:
5220 case X86::T1MSKC64rr:
5221 case X86::T1MSKC64rm:
5222 case X86::TZMSK32rr:
5223 case X86::TZMSK32rm:
5224 case X86::TZMSK64rr:
5225 case X86::TZMSK64rm:
5229 ClearsOverflowFlag =
true;
5231 case X86::BEXTR32rr:
5232 case X86::BEXTR64rr:
5233 case X86::BEXTR32rm:
5234 case X86::BEXTR64rm:
5235 case X86::BEXTRI32ri:
5236 case X86::BEXTRI32mi:
5237 case X86::BEXTRI64ri:
5238 case X86::BEXTRI64mi:
5249 switch (
MI.getOpcode()) {
5257 case X86::LZCNT16rr:
5258 case X86::LZCNT32rr:
5259 case X86::LZCNT64rr:
5261 case X86::POPCNT16rr:
5262 case X86::POPCNT32rr:
5263 case X86::POPCNT64rr:
5265 case X86::TZCNT16rr:
5266 case X86::TZCNT32rr:
5267 case X86::TZCNT64rr:
5281 case X86::BLSMSK32rr:
5282 case X86::BLSMSK64rr:
5314 unsigned NewOpcode = 0;
5315#define FROM_TO(A, B) \
5316 CASE_ND(A) NewOpcode = X86::B; \
5340 if (NewOpcode == X86::CMP64rm || NewOpcode == X86::CMP32rm ||
5341 NewOpcode == X86::CMP16rm || NewOpcode == X86::CMP8rm)
5349 bool IsCmpZero = (CmpMask != 0 && CmpValue == 0);
5355 assert(SrcRegDef &&
"Must have a definition (SSA)");
5361 bool NoSignFlag =
false;
5362 bool ClearsOverflowFlag =
false;
5363 bool ShouldUpdateCC =
false;
5364 bool IsSwapped =
false;
5365 bool HasNF = Subtarget.hasNF();
5368 int64_t ImmDelta = 0;
5381 if (&Inst == SrcRegDef) {
5404 Subtarget, NoSignFlag, ClearsOverflowFlag)) {
5413 if (Inst.modifiesRegister(X86::EFLAGS,
TRI)) {
5424 Inst.getOperand(OpNo).getReg() == SrcReg) {
5425 ShouldUpdateCC =
true;
5436 if (isRedundantFlagInstr(CmpInstr, SrcReg, SrcReg2, CmpMask, CmpValue,
5437 Inst, &IsSwapped, &ImmDelta)) {
5445 if (!Movr0Inst && Inst.
getOpcode() == X86::MOV32r0 &&
5446 Inst.registerDefIsDead(X86::EFLAGS,
TRI)) {
5460 if (HasNF && Inst.registerDefIsDead(X86::EFLAGS,
TRI) && !IsWithReloc) {
5465 InstsToUpdate.
push_back(std::make_pair(&Inst, NewOp));
5479 if (
MBB->pred_size() != 1)
5481 MBB = *
MBB->pred_begin();
5482 From =
MBB->rbegin();
5489 bool FlagsMayLiveOut =
true;
5494 bool ModifyEFLAGS = Instr.modifiesRegister(X86::EFLAGS,
TRI);
5495 bool UseEFLAGS = Instr.readsRegister(X86::EFLAGS,
TRI);
5497 if (!UseEFLAGS && ModifyEFLAGS) {
5499 FlagsMayLiveOut =
false;
5502 if (!UseEFLAGS && !ModifyEFLAGS)
5533 if (!ClearsOverflowFlag)
5552 ReplacementCC = NewCC;
5558 }
else if (IsSwapped) {
5565 ShouldUpdateCC =
true;
5566 }
else if (ImmDelta != 0) {
5577 if (ImmDelta != 1 || CmpValue == 0)
5587 if (ImmDelta != 1 || CmpValue == 0)
5614 ShouldUpdateCC =
true;
5617 if (ShouldUpdateCC && ReplacementCC != OldCC) {
5621 OpsToUpdate.
push_back(std::make_pair(&Instr, ReplacementCC));
5623 if (ModifyEFLAGS || Instr.killsRegister(X86::EFLAGS,
TRI)) {
5625 FlagsMayLiveOut =
false;
5632 if ((
MI !=
nullptr || ShouldUpdateCC) && FlagsMayLiveOut) {
5639 assert((
MI ==
nullptr ||
Sub ==
nullptr) &&
"Should not have Sub and MI set");
5646 if (&CmpMBB != SubBB)
5650 InsertE =
Sub->getParent()->rend();
5651 for (; InsertI != InsertE; ++InsertI) {
5653 if (!Instr->readsRegister(X86::EFLAGS,
TRI) &&
5654 Instr->modifiesRegister(X86::EFLAGS,
TRI)) {
5661 if (InsertI == InsertE)
5666 for (
auto &Inst : InstsToUpdate) {
5667 Inst.first->setDesc(
get(Inst.second));
5668 Inst.first->removeOperand(
5669 Inst.first->findRegisterDefOperandIdx(X86::EFLAGS,
nullptr));
5674 Sub->findRegisterDefOperand(X86::EFLAGS,
nullptr);
5675 assert(FlagDef &&
"Unable to locate a def EFLAGS operand");
5681 for (
auto &
Op : OpsToUpdate) {
5682 Op.first->getOperand(
Op.first->getDesc().getNumOperands() - 1)
5687 MBB = *
MBB->pred_begin()) {
5688 assert(
MBB->pred_size() == 1 &&
"Expected exactly one predecessor");
5689 if (!
MBB->isLiveIn(X86::EFLAGS))
5690 MBB->addLiveIn(X86::EFLAGS);
5718#define FROM_TO(FROM, TO) \
5721 case X86::FROM##_ND: \
5722 return X86::TO##_ND;
5750#define FROM_TO(FROM, TO) \
5756 FROM_TO(CTEST64rr, CTEST64ri32)
5764 case X86::ADD64rr_ND:
5765 return X86::ADD64ri32_ND;
5766 case X86::SUB64rr_ND:
5767 return X86::SUB64ri32_ND;
5779 bool MakeChange)
const {
5785 const TargetRegisterClass *RC =
nullptr;
5789 (
Reg.
isVirtual() && X86::GR64RegClass.hasSubClassEq(RC))) {
5794 if (
UseMI.findRegisterUseOperand(
Reg,
nullptr)->getSubReg())
5804 if (
Opc == TargetOpcode::COPY) {
5806 const TargetRegisterClass *RC =
nullptr;
5809 bool GR32Reg = (ToReg.
isVirtual() && X86::GR32RegClass.hasSubClassEq(RC)) ||
5811 bool GR64Reg = (ToReg.
isVirtual() && X86::GR64RegClass.hasSubClassEq(RC)) ||
5813 bool GR8Reg = (ToReg.
isVirtual() && X86::GR8RegClass.hasSubClassEq(RC)) ||
5824 NewOpc = X86::MOV32ri64;
5826 NewOpc = X86::MOV64ri;
5827 }
else if (GR32Reg) {
5828 NewOpc = X86::MOV32ri;
5832 if (
UseMI.getParent()->computeRegisterLiveness(
5841 UseMI.removeOperand(
5842 UseMI.findRegisterUseOperandIdx(
Reg,
nullptr));
5850 NewOpc = X86::MOV8ri;
5860 if ((NewOpc == X86::SUB64ri32 || NewOpc == X86::SUB32ri ||
5861 NewOpc == X86::SBB64ri32 || NewOpc == X86::SBB32ri ||
5862 NewOpc == X86::SUB64ri32_ND || NewOpc == X86::SUB32ri_ND ||
5863 NewOpc == X86::SBB64ri32_ND || NewOpc == X86::SBB32ri_ND) &&
5864 UseMI.findRegisterUseOperandIdx(
Reg,
nullptr) != 2)
5867 if (((NewOpc == X86::CMP64ri32 || NewOpc == X86::CMP32ri) ||
5868 (NewOpc == X86::CCMP64ri32 || NewOpc == X86::CCMP32ri)) &&
5869 UseMI.findRegisterUseOperandIdx(
Reg,
nullptr) != 1)
5872 using namespace X86;
5873 if (isSHL(
Opc) || isSHR(
Opc) || isSAR(
Opc) || isROL(
Opc) || isROR(
Opc) ||
5874 isRCL(
Opc) || isRCR(
Opc)) {
5875 unsigned RegIdx =
UseMI.findRegisterUseOperandIdx(
Reg,
nullptr);
5885 UseMI.removeOperand(RegIdx);
5899 UseMI.registerDefIsDead(X86::EFLAGS,
nullptr)) {
5903 UseMI.setDesc(
get(TargetOpcode::COPY));
5904 UseMI.removeOperand(
5905 UseMI.findRegisterUseOperandIdx(
Reg,
nullptr));
5906 UseMI.removeOperand(
5907 UseMI.findRegisterDefOperandIdx(X86::EFLAGS,
nullptr));
5908 UseMI.untieRegOperand(0);
5912 unsigned Op1 = 1, Op2 = CommuteAnyOperandIndex;
5913 unsigned ImmOpNum = 2;
5914 if (!
UseMI.getOperand(0).isDef()) {
5918 if (
Opc == TargetOpcode::COPY)
5922 commuteInstruction(
UseMI);
5926 UseMI.getOperand(ImmOpNum).ChangeToImmediate(ImmVal);
5944 return foldImmediateImpl(
UseMI, &
DefMI, Reg, ImmVal, MRI,
true);
5956 assert(
Desc.getNumOperands() == 3 &&
"Expected two-addr instruction.");
5976 assert(
Desc.getNumOperands() == 3 &&
"Expected two-addr instruction.");
5994 MIB->
setDesc(
TII.get(MinusOne ? X86::DEC32r : X86::INC32r));
6006 assert(Imm != 0 &&
"Using push/pop for 0 is not efficient.");
6009 int StackAdjustment;
6011 if (Subtarget.is64Bit()) {
6013 MIB->
getOpcode() == X86::MOV32ImmSExti8);
6027 StackAdjustment = 8;
6033 StackAdjustment = 4;
6045 bool EmitCFI = !TFL->
hasFP(MF) && NeedsDwarfCFI;
6092 MIB->
getOpcode() == X86::XOR64_FP ? X86::XOR64rr : X86::XOR32rr;
6104 const MCInstrDesc &BroadcastDesc,
unsigned SubIdx) {
6107 if (
TRI->getEncodingValue(DestReg) < 16) {
6114 DestReg =
TRI->getMatchingSuperReg(DestReg, SubIdx, &X86::VR512RegClass);
6126 const MCInstrDesc &ExtractDesc,
unsigned SubIdx) {
6129 if (
TRI->getEncodingValue(SrcReg) < 16) {
6136 SrcReg =
TRI->getMatchingSuperReg(SrcReg, SubIdx, &X86::VR512RegClass);
6159 if (
MI.getOpcode() == X86::MOVSHPrm) {
6160 NewOpc = HasAVX ? X86::VMOVSSrm : X86::MOVSSrm;
6162 if (
Reg > X86::XMM15)
6163 NewOpc = X86::VMOVSSZrm;
6165 NewOpc = HasAVX ? X86::VMOVSSmr : X86::MOVSSmr;
6167 if (
Reg > X86::XMM15)
6168 NewOpc = X86::VMOVSSZmr;
6176 bool HasAVX = Subtarget.hasAVX();
6178 switch (
MI.getOpcode()) {
6185 case X86::MOV32ImmSExti8:
6186 case X86::MOV64ImmSExti8:
6188 case X86::SETB_C32r:
6190 case X86::SETB_C64r:
6198 case X86::FsFLD0F128:
6200 case X86::AVX_SET0: {
6201 assert(HasAVX &&
"AVX not supported");
6204 Register XReg =
TRI->getSubReg(SrcReg, X86::sub_xmm);
6210 case X86::AVX512_128_SET0:
6211 case X86::AVX512_FsFLD0SH:
6212 case X86::AVX512_FsFLD0SS:
6213 case X86::AVX512_FsFLD0SD:
6214 case X86::AVX512_FsFLD0F128: {
6215 bool HasVLX = Subtarget.hasVLX();
6218 if (HasVLX ||
TRI->getEncodingValue(SrcReg) < 16)
6220 get(HasVLX ? X86::VPXORDZ128rr : X86::VXORPSrr));
6223 TRI->getMatchingSuperReg(SrcReg, X86::sub_xmm, &X86::VR512RegClass);
6227 case X86::AVX512_256_SET0:
6228 case X86::AVX512_512_SET0: {
6229 bool HasVLX = Subtarget.hasVLX();
6232 if (HasVLX ||
TRI->getEncodingValue(SrcReg) < 16) {
6233 Register XReg =
TRI->getSubReg(SrcReg, X86::sub_xmm);
6239 if (
MI.getOpcode() == X86::AVX512_256_SET0) {
6242 TRI->getMatchingSuperReg(SrcReg, X86::sub_ymm, &X86::VR512RegClass);
6250 case X86::V_SETALLONES:
6252 get(HasAVX ? X86::VPCMPEQDrr : X86::PCMPEQDrr));
6253 case X86::AVX2_SETALLONES:
6255 case X86::AVX1_SETALLONES: {
6262 case X86::AVX512_128_SETALLONES:
6263 case X86::AVX512_256_SETALLONES:
6264 case X86::AVX512_512_SETALLONES: {
6267 switch (
MI.getOpcode()) {
6268 case X86::AVX512_128_SETALLONES: {
6269 if (X86::VR128RegClass.
contains(Reg))
6272 Opc = X86::VPTERNLOGDZ128rri;
6275 case X86::AVX512_256_SETALLONES: {
6276 if (X86::VR256RegClass.
contains(Reg))
6279 Opc = X86::VPTERNLOGDZ256rri;
6282 case X86::AVX512_512_SETALLONES:
6283 Opc = X86::VPTERNLOGDZrri;
6295 case X86::AVX512_512_SEXT_MASK_32:
6296 case X86::AVX512_512_SEXT_MASK_64: {
6300 unsigned Opc = (
MI.getOpcode() == X86::AVX512_512_SEXT_MASK_64)
6301 ? X86::VPTERNLOGQZrrikz
6302 : X86::VPTERNLOGDZrrikz;
6303 MI.removeOperand(1);
6308 .
addReg(MaskReg, MaskState)
6314 case X86::VMOVAPSZ128rm_NOVLX:
6316 get(X86::VBROADCASTF32X4Zrm), X86::sub_xmm);
6317 case X86::VMOVUPSZ128rm_NOVLX:
6319 get(X86::VBROADCASTF32X4Zrm), X86::sub_xmm);
6320 case X86::VMOVAPSZ256rm_NOVLX:
6322 get(X86::VBROADCASTF64X4Zrm), X86::sub_ymm);
6323 case X86::VMOVUPSZ256rm_NOVLX:
6325 get(X86::VBROADCASTF64X4Zrm), X86::sub_ymm);
6326 case X86::VMOVAPSZ128mr_NOVLX:
6328 get(X86::VEXTRACTF32X4Zmri), X86::sub_xmm);
6329 case X86::VMOVUPSZ128mr_NOVLX:
6331 get(X86::VEXTRACTF32X4Zmri), X86::sub_xmm);
6332 case X86::VMOVAPSZ256mr_NOVLX:
6334 get(X86::VEXTRACTF64X4Zmri), X86::sub_ymm);
6335 case X86::VMOVUPSZ256mr_NOVLX:
6337 get(X86::VEXTRACTF64X4Zmri), X86::sub_ymm);
6338 case X86::MOV32ri64: {
6340 Register Reg32 = RI.getSubReg(Reg, X86::sub_32bit);
6341 MI.setDesc(
get(X86::MOV32ri));
6347 case X86::RDFLAGS32:
6348 case X86::RDFLAGS64: {
6349 unsigned Is64Bit =
MI.getOpcode() == X86::RDFLAGS64;
6353 get(Is64Bit ? X86::PUSHF64 : X86::PUSHF32))
6361 "Unexpected register in operand! Should be EFLAGS.");
6364 "Unexpected register in operand! Should be DF.");
6367 MIB->
setDesc(
get(Is64Bit ? X86::POP64r : X86::POP32r));
6371 case X86::WRFLAGS32:
6372 case X86::WRFLAGS64: {
6373 unsigned Is64Bit =
MI.getOpcode() == X86::WRFLAGS64;
6377 get(Is64Bit ? X86::PUSH64r : X86::PUSH32r))
6378 .
addReg(
MI.getOperand(0).getReg());
6380 get(Is64Bit ? X86::POPF64 : X86::POPF32));
6381 MI.eraseFromParent();
6408 case TargetOpcode::LOAD_STACK_GUARD:
6414 case X86::SHLDROT32ri:
6416 case X86::SHLDROT64ri:
6418 case X86::SHRDROT32ri:
6420 case X86::SHRDROT64ri:
6422 case X86::ADD8rr_DB:
6425 case X86::ADD16rr_DB:
6428 case X86::ADD32rr_DB:
6431 case X86::ADD64rr_DB:
6434 case X86::ADD8ri_DB:
6437 case X86::ADD16ri_DB:
6440 case X86::ADD32ri_DB:
6443 case X86::ADD64ri32_DB:
6467 bool ForLoadFold =
false) {
6469 case X86::CVTSI2SSrr:
6470 case X86::CVTSI2SSrm:
6471 case X86::CVTSI642SSrr:
6472 case X86::CVTSI642SSrm:
6473 case X86::CVTSI2SDrr:
6474 case X86::CVTSI2SDrm:
6475 case X86::CVTSI642SDrr:
6476 case X86::CVTSI642SDrm:
6479 return !ForLoadFold;
6480 case X86::CVTSD2SSrr:
6481 case X86::CVTSD2SSrm:
6482 case X86::CVTSS2SDrr:
6483 case X86::CVTSS2SDrm:
6490 case X86::RCPSSr_Int:
6491 case X86::RCPSSm_Int:
6492 case X86::ROUNDSDri:
6493 case X86::ROUNDSDmi:
6494 case X86::ROUNDSSri:
6495 case X86::ROUNDSSmi:
6498 case X86::RSQRTSSr_Int:
6499 case X86::RSQRTSSm_Int:
6502 case X86::SQRTSSr_Int:
6503 case X86::SQRTSSm_Int:
6506 case X86::SQRTSDr_Int:
6507 case X86::SQRTSDm_Int:
6509 case X86::VFCMULCPHZ128rm:
6510 case X86::VFCMULCPHZ128rmb:
6511 case X86::VFCMULCPHZ128rmbkz:
6512 case X86::VFCMULCPHZ128rmkz:
6513 case X86::VFCMULCPHZ128rr:
6514 case X86::VFCMULCPHZ128rrkz:
6515 case X86::VFCMULCPHZ256rm:
6516 case X86::VFCMULCPHZ256rmb:
6517 case X86::VFCMULCPHZ256rmbkz:
6518 case X86::VFCMULCPHZ256rmkz:
6519 case X86::VFCMULCPHZ256rr:
6520 case X86::VFCMULCPHZ256rrkz:
6521 case X86::VFCMULCPHZrm:
6522 case X86::VFCMULCPHZrmb:
6523 case X86::VFCMULCPHZrmbkz:
6524 case X86::VFCMULCPHZrmkz:
6525 case X86::VFCMULCPHZrr:
6526 case X86::VFCMULCPHZrrb:
6527 case X86::VFCMULCPHZrrbkz:
6528 case X86::VFCMULCPHZrrkz:
6529 case X86::VFMULCPHZ128rm:
6530 case X86::VFMULCPHZ128rmb:
6531 case X86::VFMULCPHZ128rmbkz:
6532 case X86::VFMULCPHZ128rmkz:
6533 case X86::VFMULCPHZ128rr:
6534 case X86::VFMULCPHZ128rrkz:
6535 case X86::VFMULCPHZ256rm:
6536 case X86::VFMULCPHZ256rmb:
6537 case X86::VFMULCPHZ256rmbkz:
6538 case X86::VFMULCPHZ256rmkz:
6539 case X86::VFMULCPHZ256rr:
6540 case X86::VFMULCPHZ256rrkz:
6541 case X86::VFMULCPHZrm:
6542 case X86::VFMULCPHZrmb:
6543 case X86::VFMULCPHZrmbkz:
6544 case X86::VFMULCPHZrmkz:
6545 case X86::VFMULCPHZrr:
6546 case X86::VFMULCPHZrrb:
6547 case X86::VFMULCPHZrrbkz:
6548 case X86::VFMULCPHZrrkz:
6549 case X86::VFCMULCSHZrm:
6550 case X86::VFCMULCSHZrmkz:
6551 case X86::VFCMULCSHZrr:
6552 case X86::VFCMULCSHZrrb:
6553 case X86::VFCMULCSHZrrbkz:
6554 case X86::VFCMULCSHZrrkz:
6555 case X86::VFMULCSHZrm:
6556 case X86::VFMULCSHZrmkz:
6557 case X86::VFMULCSHZrr:
6558 case X86::VFMULCSHZrrb:
6559 case X86::VFMULCSHZrrbkz:
6560 case X86::VFMULCSHZrrkz:
6561 return Subtarget.hasMULCFalseDeps();
6562 case X86::VPERMDYrm:
6563 case X86::VPERMDYrr:
6564 case X86::VPERMQYmi:
6565 case X86::VPERMQYri:
6566 case X86::VPERMPSYrm:
6567 case X86::VPERMPSYrr:
6568 case X86::VPERMPDYmi:
6569 case X86::VPERMPDYri:
6570 case X86::VPERMDZ256rm:
6571 case X86::VPERMDZ256rmb:
6572 case X86::VPERMDZ256rmbkz:
6573 case X86::VPERMDZ256rmkz:
6574 case X86::VPERMDZ256rr:
6575 case X86::VPERMDZ256rrkz:
6576 case X86::VPERMDZrm:
6577 case X86::VPERMDZrmb:
6578 case X86::VPERMDZrmbkz:
6579 case X86::VPERMDZrmkz:
6580 case X86::VPERMDZrr:
6581 case X86::VPERMDZrrkz:
6582 case X86::VPERMQZ256mbi:
6583 case X86::VPERMQZ256mbikz:
6584 case X86::VPERMQZ256mi:
6585 case X86::VPERMQZ256mikz:
6586 case X86::VPERMQZ256ri:
6587 case X86::VPERMQZ256rikz:
6588 case X86::VPERMQZ256rm:
6589 case X86::VPERMQZ256rmb:
6590 case X86::VPERMQZ256rmbkz:
6591 case X86::VPERMQZ256rmkz:
6592 case X86::VPERMQZ256rr:
6593 case X86::VPERMQZ256rrkz:
6594 case X86::VPERMQZmbi:
6595 case X86::VPERMQZmbikz:
6596 case X86::VPERMQZmi:
6597 case X86::VPERMQZmikz:
6598 case X86::VPERMQZri:
6599 case X86::VPERMQZrikz:
6600 case X86::VPERMQZrm:
6601 case X86::VPERMQZrmb:
6602 case X86::VPERMQZrmbkz:
6603 case X86::VPERMQZrmkz:
6604 case X86::VPERMQZrr:
6605 case X86::VPERMQZrrkz:
6606 case X86::VPERMPSZ256rm:
6607 case X86::VPERMPSZ256rmb:
6608 case X86::VPERMPSZ256rmbkz:
6609 case X86::VPERMPSZ256rmkz:
6610 case X86::VPERMPSZ256rr:
6611 case X86::VPERMPSZ256rrkz:
6612 case X86::VPERMPSZrm:
6613 case X86::VPERMPSZrmb:
6614 case X86::VPERMPSZrmbkz:
6615 case X86::VPERMPSZrmkz:
6616 case X86::VPERMPSZrr:
6617 case X86::VPERMPSZrrkz:
6618 case X86::VPERMPDZ256mbi:
6619 case X86::VPERMPDZ256mbikz:
6620 case X86::VPERMPDZ256mi:
6621 case X86::VPERMPDZ256mikz:
6622 case X86::VPERMPDZ256ri:
6623 case X86::VPERMPDZ256rikz:
6624 case X86::VPERMPDZ256rm:
6625 case X86::VPERMPDZ256rmb:
6626 case X86::VPERMPDZ256rmbkz:
6627 case X86::VPERMPDZ256rmkz:
6628 case X86::VPERMPDZ256rr:
6629 case X86::VPERMPDZ256rrkz:
6630 case X86::VPERMPDZmbi:
6631 case X86::VPERMPDZmbikz:
6632 case X86::VPERMPDZmi:
6633 case X86::VPERMPDZmikz:
6634 case X86::VPERMPDZri:
6635 case X86::VPERMPDZrikz:
6636 case X86::VPERMPDZrm:
6637 case X86::VPERMPDZrmb:
6638 case X86::VPERMPDZrmbkz:
6639 case X86::VPERMPDZrmkz:
6640 case X86::VPERMPDZrr:
6641 case X86::VPERMPDZrrkz:
6642 return Subtarget.hasPERMFalseDeps();
6643 case X86::VRANGEPDZ128rmbi:
6644 case X86::VRANGEPDZ128rmbikz:
6645 case X86::VRANGEPDZ128rmi:
6646 case X86::VRANGEPDZ128rmikz:
6647 case X86::VRANGEPDZ128rri:
6648 case X86::VRANGEPDZ128rrikz:
6649 case X86::VRANGEPDZ256rmbi:
6650 case X86::VRANGEPDZ256rmbikz:
6651 case X86::VRANGEPDZ256rmi:
6652 case X86::VRANGEPDZ256rmikz:
6653 case X86::VRANGEPDZ256rri:
6654 case X86::VRANGEPDZ256rrikz:
6655 case X86::VRANGEPDZrmbi:
6656 case X86::VRANGEPDZrmbikz:
6657 case X86::VRANGEPDZrmi:
6658 case X86::VRANGEPDZrmikz:
6659 case X86::VRANGEPDZrri:
6660 case X86::VRANGEPDZrrib:
6661 case X86::VRANGEPDZrribkz:
6662 case X86::VRANGEPDZrrikz:
6663 case X86::VRANGEPSZ128rmbi:
6664 case X86::VRANGEPSZ128rmbikz:
6665 case X86::VRANGEPSZ128rmi:
6666 case X86::VRANGEPSZ128rmikz:
6667 case X86::VRANGEPSZ128rri:
6668 case X86::VRANGEPSZ128rrikz:
6669 case X86::VRANGEPSZ256rmbi:
6670 case X86::VRANGEPSZ256rmbikz:
6671 case X86::VRANGEPSZ256rmi:
6672 case X86::VRANGEPSZ256rmikz:
6673 case X86::VRANGEPSZ256rri:
6674 case X86::VRANGEPSZ256rrikz:
6675 case X86::VRANGEPSZrmbi:
6676 case X86::VRANGEPSZrmbikz:
6677 case X86::VRANGEPSZrmi:
6678 case X86::VRANGEPSZrmikz:
6679 case X86::VRANGEPSZrri:
6680 case X86::VRANGEPSZrrib:
6681 case X86::VRANGEPSZrribkz:
6682 case X86::VRANGEPSZrrikz:
6683 case X86::VRANGESDZrmi:
6684 case X86::VRANGESDZrmikz:
6685 case X86::VRANGESDZrri:
6686 case X86::VRANGESDZrrib:
6687 case X86::VRANGESDZrribkz:
6688 case X86::VRANGESDZrrikz:
6689 case X86::VRANGESSZrmi:
6690 case X86::VRANGESSZrmikz:
6691 case X86::VRANGESSZrri:
6692 case X86::VRANGESSZrrib:
6693 case X86::VRANGESSZrribkz:
6694 case X86::VRANGESSZrrikz:
6695 return Subtarget.hasRANGEFalseDeps();
6696 case X86::VGETMANTSSZrmi:
6697 case X86::VGETMANTSSZrmikz:
6698 case X86::VGETMANTSSZrri:
6699 case X86::VGETMANTSSZrrib:
6700 case X86::VGETMANTSSZrribkz:
6701 case X86::VGETMANTSSZrrikz:
6702 case X86::VGETMANTSDZrmi:
6703 case X86::VGETMANTSDZrmikz:
6704 case X86::VGETMANTSDZrri:
6705 case X86::VGETMANTSDZrrib:
6706 case X86::VGETMANTSDZrribkz:
6707 case X86::VGETMANTSDZrrikz:
6708 case X86::VGETMANTSHZrmi:
6709 case X86::VGETMANTSHZrmikz:
6710 case X86::VGETMANTSHZrri:
6711 case X86::VGETMANTSHZrrib:
6712 case X86::VGETMANTSHZrribkz:
6713 case X86::VGETMANTSHZrrikz:
6714 case X86::VGETMANTPSZ128rmbi:
6715 case X86::VGETMANTPSZ128rmbikz:
6716 case X86::VGETMANTPSZ128rmi:
6717 case X86::VGETMANTPSZ128rmikz:
6718 case X86::VGETMANTPSZ256rmbi:
6719 case X86::VGETMANTPSZ256rmbikz:
6720 case X86::VGETMANTPSZ256rmi:
6721 case X86::VGETMANTPSZ256rmikz:
6722 case X86::VGETMANTPSZrmbi:
6723 case X86::VGETMANTPSZrmbikz:
6724 case X86::VGETMANTPSZrmi:
6725 case X86::VGETMANTPSZrmikz:
6726 case X86::VGETMANTPDZ128rmbi:
6727 case X86::VGETMANTPDZ128rmbikz:
6728 case X86::VGETMANTPDZ128rmi:
6729 case X86::VGETMANTPDZ128rmikz:
6730 case X86::VGETMANTPDZ256rmbi:
6731 case X86::VGETMANTPDZ256rmbikz:
6732 case X86::VGETMANTPDZ256rmi:
6733 case X86::VGETMANTPDZ256rmikz:
6734 case X86::VGETMANTPDZrmbi:
6735 case X86::VGETMANTPDZrmbikz:
6736 case X86::VGETMANTPDZrmi:
6737 case X86::VGETMANTPDZrmikz:
6738 return Subtarget.hasGETMANTFalseDeps();
6739 case X86::VPMULLQZ128rm:
6740 case X86::VPMULLQZ128rmb:
6741 case X86::VPMULLQZ128rmbkz:
6742 case X86::VPMULLQZ128rmkz:
6743 case X86::VPMULLQZ128rr:
6744 case X86::VPMULLQZ128rrkz:
6745 case X86::VPMULLQZ256rm:
6746 case X86::VPMULLQZ256rmb:
6747 case X86::VPMULLQZ256rmbkz:
6748 case X86::VPMULLQZ256rmkz:
6749 case X86::VPMULLQZ256rr:
6750 case X86::VPMULLQZ256rrkz:
6751 case X86::VPMULLQZrm:
6752 case X86::VPMULLQZrmb:
6753 case X86::VPMULLQZrmbkz:
6754 case X86::VPMULLQZrmkz:
6755 case X86::VPMULLQZrr:
6756 case X86::VPMULLQZrrkz:
6757 return Subtarget.hasMULLQFalseDeps();
6759 case X86::POPCNT32rm:
6760 case X86::POPCNT32rr:
6761 case X86::POPCNT64rm:
6762 case X86::POPCNT64rr:
6763 return Subtarget.hasPOPCNTFalseDeps();
6764 case X86::LZCNT32rm:
6765 case X86::LZCNT32rr:
6766 case X86::LZCNT64rm:
6767 case X86::LZCNT64rr:
6768 case X86::TZCNT32rm:
6769 case X86::TZCNT32rr:
6770 case X86::TZCNT64rm:
6771 case X86::TZCNT64rr:
6772 return Subtarget.hasLZCNTFalseDeps();
6789 bool HasNDDPartialWrite =
false;
6792 if (!Reg.isVirtual())
6793 HasNDDPartialWrite =
6794 X86::GR8RegClass.contains(Reg) || X86::GR16RegClass.contains(Reg);
6807 bool ReadsReg =
false;
6808 if (Reg.isVirtual())
6809 ReadsReg = (MO.
readsReg() ||
MI.readsVirtualRegister(Reg));
6811 ReadsReg =
MI.readsRegister(Reg,
TRI);
6812 if (ReadsReg != HasNDDPartialWrite)
6826 bool ForLoadFold =
false) {
6829 case X86::MMX_PUNPCKHBWrr:
6830 case X86::MMX_PUNPCKHWDrr:
6831 case X86::MMX_PUNPCKHDQrr:
6832 case X86::MMX_PUNPCKLBWrr:
6833 case X86::MMX_PUNPCKLWDrr:
6834 case X86::MMX_PUNPCKLDQrr:
6835 case X86::MOVHLPSrr:
6836 case X86::PACKSSWBrr:
6837 case X86::PACKUSWBrr:
6838 case X86::PACKSSDWrr:
6839 case X86::PACKUSDWrr:
6840 case X86::PUNPCKHBWrr:
6841 case X86::PUNPCKLBWrr:
6842 case X86::PUNPCKHWDrr:
6843 case X86::PUNPCKLWDrr:
6844 case X86::PUNPCKHDQrr:
6845 case X86::PUNPCKLDQrr:
6846 case X86::PUNPCKHQDQrr:
6847 case X86::PUNPCKLQDQrr:
6848 case X86::SHUFPDrri:
6849 case X86::SHUFPSrri:
6855 return OpNum == 2 && !ForLoadFold;
6857 case X86::VMOVLHPSrr:
6858 case X86::VMOVLHPSZrr:
6859 case X86::VPACKSSWBrr:
6860 case X86::VPACKUSWBrr:
6861 case X86::VPACKSSDWrr:
6862 case X86::VPACKUSDWrr:
6863 case X86::VPACKSSWBZ128rr:
6864 case X86::VPACKUSWBZ128rr:
6865 case X86::VPACKSSDWZ128rr:
6866 case X86::VPACKUSDWZ128rr:
6867 case X86::VPERM2F128rri:
6868 case X86::VPERM2I128rri:
6869 case X86::VSHUFF32X4Z256rri:
6870 case X86::VSHUFF32X4Zrri:
6871 case X86::VSHUFF64X2Z256rri:
6872 case X86::VSHUFF64X2Zrri:
6873 case X86::VSHUFI32X4Z256rri:
6874 case X86::VSHUFI32X4Zrri:
6875 case X86::VSHUFI64X2Z256rri:
6876 case X86::VSHUFI64X2Zrri:
6877 case X86::VPUNPCKHBWrr:
6878 case X86::VPUNPCKLBWrr:
6879 case X86::VPUNPCKHBWYrr:
6880 case X86::VPUNPCKLBWYrr:
6881 case X86::VPUNPCKHBWZ128rr:
6882 case X86::VPUNPCKLBWZ128rr:
6883 case X86::VPUNPCKHBWZ256rr:
6884 case X86::VPUNPCKLBWZ256rr:
6885 case X86::VPUNPCKHBWZrr:
6886 case X86::VPUNPCKLBWZrr:
6887 case X86::VPUNPCKHWDrr:
6888 case X86::VPUNPCKLWDrr:
6889 case X86::VPUNPCKHWDYrr:
6890 case X86::VPUNPCKLWDYrr:
6891 case X86::VPUNPCKHWDZ128rr:
6892 case X86::VPUNPCKLWDZ128rr:
6893 case X86::VPUNPCKHWDZ256rr:
6894 case X86::VPUNPCKLWDZ256rr:
6895 case X86::VPUNPCKHWDZrr:
6896 case X86::VPUNPCKLWDZrr:
6897 case X86::VPUNPCKHDQrr:
6898 case X86::VPUNPCKLDQrr:
6899 case X86::VPUNPCKHDQYrr:
6900 case X86::VPUNPCKLDQYrr:
6901 case X86::VPUNPCKHDQZ128rr:
6902 case X86::VPUNPCKLDQZ128rr:
6903 case X86::VPUNPCKHDQZ256rr:
6904 case X86::VPUNPCKLDQZ256rr:
6905 case X86::VPUNPCKHDQZrr:
6906 case X86::VPUNPCKLDQZrr:
6907 case X86::VPUNPCKHQDQrr:
6908 case X86::VPUNPCKLQDQrr:
6909 case X86::VPUNPCKHQDQYrr:
6910 case X86::VPUNPCKLQDQYrr:
6911 case X86::VPUNPCKHQDQZ128rr:
6912 case X86::VPUNPCKLQDQZ128rr:
6913 case X86::VPUNPCKHQDQZ256rr:
6914 case X86::VPUNPCKLQDQZ256rr:
6915 case X86::VPUNPCKHQDQZrr:
6916 case X86::VPUNPCKLQDQZrr:
6920 return (OpNum == 1 || OpNum == 2) && !ForLoadFold;
6922 case X86::VCVTSI2SSrr:
6923 case X86::VCVTSI2SSrm:
6924 case X86::VCVTSI2SSrr_Int:
6925 case X86::VCVTSI2SSrm_Int:
6926 case X86::VCVTSI642SSrr:
6927 case X86::VCVTSI642SSrm:
6928 case X86::VCVTSI642SSrr_Int:
6929 case X86::VCVTSI642SSrm_Int:
6930 case X86::VCVTSI2SDrr:
6931 case X86::VCVTSI2SDrm:
6932 case X86::VCVTSI2SDrr_Int:
6933 case X86::VCVTSI2SDrm_Int:
6934 case X86::VCVTSI642SDrr:
6935 case X86::VCVTSI642SDrm:
6936 case X86::VCVTSI642SDrr_Int:
6937 case X86::VCVTSI642SDrm_Int:
6939 case X86::VCVTSI2SSZrr:
6940 case X86::VCVTSI2SSZrm:
6941 case X86::VCVTSI2SSZrr_Int:
6942 case X86::VCVTSI2SSZrrb_Int:
6943 case X86::VCVTSI2SSZrm_Int:
6944 case X86::VCVTSI642SSZrr:
6945 case X86::VCVTSI642SSZrm:
6946 case X86::VCVTSI642SSZrr_Int:
6947 case X86::VCVTSI642SSZrrb_Int:
6948 case X86::VCVTSI642SSZrm_Int:
6949 case X86::VCVTSI2SDZrr:
6950 case X86::VCVTSI2SDZrm:
6951 case X86::VCVTSI2SDZrr_Int:
6952 case X86::VCVTSI2SDZrm_Int:
6953 case X86::VCVTSI642SDZrr:
6954 case X86::VCVTSI642SDZrm:
6955 case X86::VCVTSI642SDZrr_Int:
6956 case X86::VCVTSI642SDZrrb_Int:
6957 case X86::VCVTSI642SDZrm_Int:
6958 case X86::VCVTUSI2SSZrr:
6959 case X86::VCVTUSI2SSZrm:
6960 case X86::VCVTUSI2SSZrr_Int:
6961 case X86::VCVTUSI2SSZrrb_Int:
6962 case X86::VCVTUSI2SSZrm_Int:
6963 case X86::VCVTUSI642SSZrr:
6964 case X86::VCVTUSI642SSZrm:
6965 case X86::VCVTUSI642SSZrr_Int:
6966 case X86::VCVTUSI642SSZrrb_Int:
6967 case X86::VCVTUSI642SSZrm_Int:
6968 case X86::VCVTUSI2SDZrr:
6969 case X86::VCVTUSI2SDZrm:
6970 case X86::VCVTUSI2SDZrr_Int:
6971 case X86::VCVTUSI2SDZrm_Int:
6972 case X86::VCVTUSI642SDZrr:
6973 case X86::VCVTUSI642SDZrm:
6974 case X86::VCVTUSI642SDZrr_Int:
6975 case X86::VCVTUSI642SDZrrb_Int:
6976 case X86::VCVTUSI642SDZrm_Int:
6977 case X86::VCVTSI2SHZrr:
6978 case X86::VCVTSI2SHZrm:
6979 case X86::VCVTSI2SHZrr_Int:
6980 case X86::VCVTSI2SHZrrb_Int:
6981 case X86::VCVTSI2SHZrm_Int:
6982 case X86::VCVTSI642SHZrr:
6983 case X86::VCVTSI642SHZrm:
6984 case X86::VCVTSI642SHZrr_Int:
6985 case X86::VCVTSI642SHZrrb_Int:
6986 case X86::VCVTSI642SHZrm_Int:
6987 case X86::VCVTUSI2SHZrr:
6988 case X86::VCVTUSI2SHZrm:
6989 case X86::VCVTUSI2SHZrr_Int:
6990 case X86::VCVTUSI2SHZrrb_Int:
6991 case X86::VCVTUSI2SHZrm_Int:
6992 case X86::VCVTUSI642SHZrr:
6993 case X86::VCVTUSI642SHZrm:
6994 case X86::VCVTUSI642SHZrr_Int:
6995 case X86::VCVTUSI642SHZrrb_Int:
6996 case X86::VCVTUSI642SHZrm_Int:
6999 return OpNum == 1 && !ForLoadFold;
7000 case X86::VCVTSD2SSrr:
7001 case X86::VCVTSD2SSrm:
7002 case X86::VCVTSD2SSrr_Int:
7003 case X86::VCVTSD2SSrm_Int:
7004 case X86::VCVTSS2SDrr:
7005 case X86::VCVTSS2SDrm:
7006 case X86::VCVTSS2SDrr_Int:
7007 case X86::VCVTSS2SDrm_Int:
7009 case X86::VRCPSSr_Int:
7011 case X86::VRCPSSm_Int:
7012 case X86::VROUNDSDri:
7013 case X86::VROUNDSDmi:
7014 case X86::VROUNDSDri_Int:
7015 case X86::VROUNDSDmi_Int:
7016 case X86::VROUNDSSri:
7017 case X86::VROUNDSSmi:
7018 case X86::VROUNDSSri_Int:
7019 case X86::VROUNDSSmi_Int:
7020 case X86::VRSQRTSSr:
7021 case X86::VRSQRTSSr_Int:
7022 case X86::VRSQRTSSm:
7023 case X86::VRSQRTSSm_Int:
7025 case X86::VSQRTSSr_Int:
7027 case X86::VSQRTSSm_Int:
7029 case X86::VSQRTSDr_Int:
7031 case X86::VSQRTSDm_Int:
7033 case X86::VCVTSD2SSZrr:
7034 case X86::VCVTSD2SSZrr_Int:
7035 case X86::VCVTSD2SSZrrb_Int:
7036 case X86::VCVTSD2SSZrm:
7037 case X86::VCVTSD2SSZrm_Int:
7038 case X86::VCVTSS2SDZrr:
7039 case X86::VCVTSS2SDZrr_Int:
7040 case X86::VCVTSS2SDZrrb_Int:
7041 case X86::VCVTSS2SDZrm:
7042 case X86::VCVTSS2SDZrm_Int:
7043 case X86::VGETEXPSDZr:
7044 case X86::VGETEXPSDZrb:
7045 case X86::VGETEXPSDZm:
7046 case X86::VGETEXPSSZr:
7047 case X86::VGETEXPSSZrb:
7048 case X86::VGETEXPSSZm:
7049 case X86::VGETMANTSDZrri:
7050 case X86::VGETMANTSDZrrib:
7051 case X86::VGETMANTSDZrmi:
7052 case X86::VGETMANTSSZrri:
7053 case X86::VGETMANTSSZrrib:
7054 case X86::VGETMANTSSZrmi:
7055 case X86::VRNDSCALESDZrri:
7056 case X86::VRNDSCALESDZrri_Int:
7057 case X86::VRNDSCALESDZrrib_Int:
7058 case X86::VRNDSCALESDZrmi:
7059 case X86::VRNDSCALESDZrmi_Int:
7060 case X86::VRNDSCALESSZrri:
7061 case X86::VRNDSCALESSZrri_Int:
7062 case X86::VRNDSCALESSZrrib_Int:
7063 case X86::VRNDSCALESSZrmi:
7064 case X86::VRNDSCALESSZrmi_Int:
7065 case X86::VRCP14SDZrr:
7066 case X86::VRCP14SDZrm:
7067 case X86::VRCP14SSZrr:
7068 case X86::VRCP14SSZrm:
7069 case X86::VRCPSHZrr:
7070 case X86::VRCPSHZrm:
7071 case X86::VRSQRTSHZrr:
7072 case X86::VRSQRTSHZrm:
7073 case X86::VREDUCESHZrmi:
7074 case X86::VREDUCESHZrri:
7075 case X86::VREDUCESHZrrib:
7076 case X86::VGETEXPSHZr:
7077 case X86::VGETEXPSHZrb:
7078 case X86::VGETEXPSHZm:
7079 case X86::VGETMANTSHZrri:
7080 case X86::VGETMANTSHZrrib:
7081 case X86::VGETMANTSHZrmi:
7082 case X86::VRNDSCALESHZrri:
7083 case X86::VRNDSCALESHZrri_Int:
7084 case X86::VRNDSCALESHZrrib_Int:
7085 case X86::VRNDSCALESHZrmi:
7086 case X86::VRNDSCALESHZrmi_Int:
7087 case X86::VSQRTSHZr:
7088 case X86::VSQRTSHZr_Int:
7089 case X86::VSQRTSHZrb_Int:
7090 case X86::VSQRTSHZm:
7091 case X86::VSQRTSHZm_Int:
7092 case X86::VRCP28SDZr:
7093 case X86::VRCP28SDZrb:
7094 case X86::VRCP28SDZm:
7095 case X86::VRCP28SSZr:
7096 case X86::VRCP28SSZrb:
7097 case X86::VRCP28SSZm:
7098 case X86::VREDUCESSZrmi:
7099 case X86::VREDUCESSZrri:
7100 case X86::VREDUCESSZrrib:
7101 case X86::VRSQRT14SDZrr:
7102 case X86::VRSQRT14SDZrm:
7103 case X86::VRSQRT14SSZrr:
7104 case X86::VRSQRT14SSZrm:
7105 case X86::VRSQRT28SDZr:
7106 case X86::VRSQRT28SDZrb:
7107 case X86::VRSQRT28SDZm:
7108 case X86::VRSQRT28SSZr:
7109 case X86::VRSQRT28SSZrb:
7110 case X86::VRSQRT28SSZm:
7111 case X86::VSQRTSSZr:
7112 case X86::VSQRTSSZr_Int:
7113 case X86::VSQRTSSZrb_Int:
7114 case X86::VSQRTSSZm:
7115 case X86::VSQRTSSZm_Int:
7116 case X86::VSQRTSDZr:
7117 case X86::VSQRTSDZr_Int:
7118 case X86::VSQRTSDZrb_Int:
7119 case X86::VSQRTSDZm:
7120 case X86::VSQRTSDZm_Int:
7121 case X86::VCVTSD2SHZrr:
7122 case X86::VCVTSD2SHZrr_Int:
7123 case X86::VCVTSD2SHZrrb_Int:
7124 case X86::VCVTSD2SHZrm:
7125 case X86::VCVTSD2SHZrm_Int:
7126 case X86::VCVTSS2SHZrr:
7127 case X86::VCVTSS2SHZrr_Int:
7128 case X86::VCVTSS2SHZrrb_Int:
7129 case X86::VCVTSS2SHZrm:
7130 case X86::VCVTSS2SHZrm_Int:
7131 case X86::VCVTSH2SDZrr:
7132 case X86::VCVTSH2SDZrr_Int:
7133 case X86::VCVTSH2SDZrrb_Int:
7134 case X86::VCVTSH2SDZrm:
7135 case X86::VCVTSH2SDZrm_Int:
7136 case X86::VCVTSH2SSZrr:
7137 case X86::VCVTSH2SSZrr_Int:
7138 case X86::VCVTSH2SSZrrb_Int:
7139 case X86::VCVTSH2SSZrm:
7140 case X86::VCVTSH2SSZrm_Int:
7142 case X86::VMOVSSZrrk:
7143 case X86::VMOVSDZrrk:
7144 return OpNum == 3 && !ForLoadFold;
7145 case X86::VMOVSSZrrkz:
7146 case X86::VMOVSDZrrkz:
7147 return OpNum == 2 && !ForLoadFold;
7179 Register Reg =
MI.getOperand(OpNum).getReg();
7181 if (
MI.killsRegister(Reg,
TRI))
7184 if (X86::VR128RegClass.
contains(Reg)) {
7187 unsigned Opc = Subtarget.hasAVX() ? X86::VXORPSrr : X86::XORPSrr;
7191 MI.addRegisterKilled(Reg,
TRI,
true);
7192 }
else if (X86::VR256RegClass.
contains(Reg)) {
7195 Register XReg =
TRI->getSubReg(Reg, X86::sub_xmm);
7200 MI.addRegisterKilled(Reg,
TRI,
true);
7201 }
else if (X86::VR128XRegClass.
contains(Reg)) {
7203 if (!Subtarget.hasVLX())
7206 BuildMI(*
MI.getParent(),
MI,
MI.getDebugLoc(),
get(X86::VPXORDZ128rr), Reg)
7209 MI.addRegisterKilled(Reg,
TRI,
true);
7210 }
else if (X86::VR256XRegClass.
contains(Reg) ||
7211 X86::VR512RegClass.
contains(Reg)) {
7213 if (!Subtarget.hasVLX())
7217 Register XReg =
TRI->getSubReg(Reg, X86::sub_xmm);
7218 BuildMI(*
MI.getParent(),
MI,
MI.getDebugLoc(),
get(X86::VPXORDZ128rr), XReg)
7222 MI.addRegisterKilled(Reg,
TRI,
true);
7223 }
else if (X86::GR64RegClass.
contains(Reg)) {
7226 Register XReg =
TRI->getSubReg(Reg, X86::sub_32bit);
7231 MI.addRegisterKilled(Reg,
TRI,
true);
7232 }
else if (X86::GR32RegClass.
contains(Reg)) {
7236 MI.addRegisterKilled(Reg,
TRI,
true);
7237 }
else if ((X86::GR16RegClass.
contains(Reg) ||
7246 if (!
MI.definesRegister(SuperReg,
nullptr))
7252 int PtrOffset = 0) {
7253 unsigned NumAddrOps = MOs.
size();
7255 if (NumAddrOps < 4) {
7257 for (
unsigned i = 0; i != NumAddrOps; ++i)
7263 assert(MOs.
size() == 5 &&
"Unexpected memory operand list length");
7264 for (
unsigned i = 0; i != NumAddrOps; ++i) {
7266 if (i == 3 && PtrOffset != 0) {
7286 if (!
Reg.isVirtual())
7293 dbgs() <<
"WARNING: Unable to update register constraint for operand "
7294 << Idx <<
" of instruction:\n";
7308 MF.CreateMachineInstr(
TII.get(Opcode),
MI.getDebugLoc(),
true);
7313 unsigned NumOps =
MI.getDesc().getNumOperands() - 2;
7314 for (
unsigned i = 0; i !=
NumOps; ++i) {
7324 MBB->insert(InsertPt, NewMI);
7333 int PtrOffset = 0) {
7336 MF.CreateMachineInstr(
TII.get(Opcode),
MI.getDebugLoc(),
true);
7339 for (
unsigned i = 0, e =
MI.getNumOperands(); i != e; ++i) {
7342 assert(MO.
isReg() &&
"Expected to fold into reg operand!");
7356 MBB->insert(InsertPt, NewMI);
7366 MI.getDebugLoc(),
TII.get(Opcode));
7375 switch (
MI.getOpcode()) {
7376 case X86::INSERTPSrri:
7377 case X86::VINSERTPSrri:
7378 case X86::VINSERTPSZrri:
7382 unsigned Imm =
MI.getOperand(
MI.getNumOperands() - 1).getImm();
7383 unsigned ZMask =
Imm & 15;
7384 unsigned DstIdx = (
Imm >> 4) & 3;
7385 unsigned SrcIdx = (
Imm >> 6) & 3;
7388 const TargetRegisterClass *RC =
getRegClass(
MI.getDesc(), OpNum);
7389 unsigned RCSize =
TRI.getRegSizeInBits(*RC) / 8;
7390 if ((
Size == 0 ||
Size >= 16) && RCSize >= 16 &&
7391 (
MI.getOpcode() != X86::INSERTPSrri || Alignment >=
Align(4))) {
7392 int PtrOffset = SrcIdx * 4;
7393 unsigned NewImm = (DstIdx << 4) | ZMask;
7394 unsigned NewOpCode =
7395 (
MI.getOpcode() == X86::VINSERTPSZrri) ? X86::VINSERTPSZrmi
7396 : (
MI.getOpcode() == X86::VINSERTPSrri) ? X86::VINSERTPSrmi
7398 MachineInstr *NewMI =
7399 fuseInst(MF, NewOpCode, OpNum, MOs, InsertPt,
MI, *
this, PtrOffset);
7405 case X86::MOVHLPSrr:
7406 case X86::VMOVHLPSrr:
7407 case X86::VMOVHLPSZrr:
7413 const TargetRegisterClass *RC =
getRegClass(
MI.getDesc(), OpNum);
7414 unsigned RCSize =
TRI.getRegSizeInBits(*RC) / 8;
7415 if ((
Size == 0 ||
Size >= 16) && RCSize >= 16 && Alignment >=
Align(8)) {
7416 unsigned NewOpCode =
7417 (
MI.getOpcode() == X86::VMOVHLPSZrr) ? X86::VMOVLPSZ128rm
7418 : (
MI.getOpcode() == X86::VMOVHLPSrr) ? X86::VMOVLPSrm
7420 MachineInstr *NewMI =
7421 fuseInst(MF, NewOpCode, OpNum, MOs, InsertPt,
MI, *
this, 8);
7426 case X86::UNPCKLPDrr:
7432 const TargetRegisterClass *RC =
getRegClass(
MI.getDesc(), OpNum);
7433 unsigned RCSize =
TRI.getRegSizeInBits(*RC) / 8;
7434 if ((
Size == 0 ||
Size >= 16) && RCSize >= 16 && Alignment <
Align(16)) {
7435 MachineInstr *NewMI =
7436 fuseInst(MF, X86::MOVHPDrm, OpNum, MOs, InsertPt,
MI, *
this);
7443 makeM0Inst(*
this, (
Size == 4) ? X86::MOV32mi : X86::MOV64mi32, MOs,
7455 !
MI.getOperand(1).isReg())
7463 if (
MI.getOperand(1).isUndef())
7472 unsigned Idx1)
const {
7473 unsigned Idx2 = CommuteAnyOperandIndex;
7477 bool HasDef =
MI.getDesc().getNumDefs();
7479 Register Reg1 =
MI.getOperand(Idx1).getReg();
7480 Register Reg2 =
MI.getOperand(Idx2).getReg();
7481 bool Tied1 = 0 ==
MI.getDesc().getOperandConstraint(Idx1,
MCOI::TIED_TO);
7482 bool Tied2 = 0 ==
MI.getDesc().getOperandConstraint(Idx2,
MCOI::TIED_TO);
7486 if ((HasDef && Reg0 == Reg1 && Tied1) || (HasDef && Reg0 == Reg2 && Tied2))
7489 return commuteInstruction(
MI,
false, Idx1, Idx2) ? Idx2 : Idx1;
7494 dbgs() <<
"We failed to fuse operand " << Idx <<
" in " <<
MI;
7502 bool isSlowTwoMemOps = Subtarget.slowTwoMemOps();
7503 bool isSlowIndirectCall = Subtarget.slowIndirectCall();
7504 unsigned Opc =
MI.getOpcode();
7508 if ((isSlowTwoMemOps || isSlowIndirectCall) &&
7510 (
Opc == X86::CALL32r ||
Opc == X86::CALL64r ||
7511 Opc == X86::CALL64r_ImpCall))
7517 (
Opc == X86::PUSH16r ||
Opc == X86::PUSH32r ||
Opc == X86::PUSH64r))
7526 unsigned NumOps =
MI.getDesc().getNumOperands();
7527 bool IsTwoAddr =
NumOps > 1 && OpNum < 2 &&
MI.getOperand(0).isReg() &&
7528 MI.getOperand(1).isReg() &&
7529 MI.getOperand(0).getReg() ==
MI.getOperand(1).getReg();
7533 if (
Opc == X86::ADD32ri &&
7542 Opc != X86::ADD64rr)
7547 if (
MI.isCall() &&
MI.getCFIType())
7551 if (
auto *CustomMI = foldMemoryOperandCustom(MF,
MI, OpNum, MOs, InsertPt,
7562 bool NoNDDM = NonNDOpc && !Subtarget.hasNDDM();
7565 if (NoNDDM && !IsTwoAddr && !MRI.
isSSA()) {
7574 if (
MI.getOperand(0).getSubReg())
7580 if (VRM && Dst !=
MI.getOperand(1).getReg() &&
7581 (!Dst.isVirtual() || VRM->
getPhys(Dst)))
7591 unsigned Opcode =
I->DstOp;
7595 bool NarrowToMOV32rm =
false;
7599 unsigned RCSize =
TRI.getRegSizeInBits(*RC) / 8;
7607 if (Opcode != X86::MOV64rm || RCSize != 8 ||
Size != 4)
7609 if (
MI.getOperand(0).getSubReg() ||
MI.getOperand(1).getSubReg())
7611 Opcode = X86::MOV32rm;
7612 NarrowToMOV32rm =
true;
7622 :
fuseInst(MF, Opcode, OpNum, MOs, InsertPt,
MI, *
this);
7624 if (NarrowToMOV32rm) {
7635 if (NoNDDM && !IsTwoAddr) {
7637 unsigned SrcSub =
MI.getOperand(1).getSubReg();
7638 if (
MI.killsRegister(SrcReg,
nullptr) ||
7639 MI.getOperand(0).getReg() == SrcReg)
7649 get(TargetOpcode::COPY))
7651 .
addReg(SrcReg, {}, SrcSub);
7661 unsigned CommuteOpIdx2 = commuteOperandsForFold(
MI, OpNum);
7662 if (CommuteOpIdx2 == OpNum) {
7668 Alignment,
false, CopyMI);
7672 commuteInstruction(
MI,
false, OpNum, CommuteOpIdx2);
7696 for (
auto Op :
Ops) {
7701 if (
MI.getOpcode() == X86::MOV32r0 && SubReg == X86::sub_32bit)
7703 if (SubReg && (MO.
isDef() || SubReg == X86::sub_8bit_hi))
7712 if (!RI.hasStackRealignment(MF))
7714 std::min(Alignment, Subtarget.getFrameLowering()->getStackAlign());
7719 Alignment,
true, CopyMI, VRM);
7721 if (
Ops.size() == 2 &&
Ops[0] == 0 &&
Ops[1] == 1) {
7722 unsigned NewOpc = 0;
7723 unsigned RCSize = 0;
7724 unsigned Opc =
MI.getOpcode();
7731 NewOpc = X86::CMP8ri;
7735 NewOpc = X86::CMP16ri;
7739 NewOpc = X86::CMP32ri;
7743 NewOpc = X86::CMP64ri32;
7752 MI.setDesc(
get(NewOpc));
7753 MI.getOperand(1).ChangeToImmediate(0);
7754 }
else if (
Ops.size() != 1)
7782 unsigned RegSize =
TRI.getRegSizeInBits(*RC);
7784 if ((
Opc == X86::MOVSSrm ||
Opc == X86::VMOVSSrm ||
Opc == X86::VMOVSSZrm ||
7785 Opc == X86::MOVSSrm_alt ||
Opc == X86::VMOVSSrm_alt ||
7786 Opc == X86::VMOVSSZrm_alt) &&
7792 case X86::CVTSS2SDrr_Int:
7793 case X86::VCVTSS2SDrr_Int:
7794 case X86::VCVTSS2SDZrr_Int:
7795 case X86::VCVTSS2SDZrrk_Int:
7796 case X86::VCVTSS2SDZrrkz_Int:
7797 case X86::CVTSS2SIrr_Int:
7798 case X86::CVTSS2SI64rr_Int:
7799 case X86::VCVTSS2SIrr_Int:
7800 case X86::VCVTSS2SI64rr_Int:
7801 case X86::VCVTSS2SIZrr_Int:
7802 case X86::VCVTSS2SI64Zrr_Int:
7803 case X86::CVTTSS2SIrr_Int:
7804 case X86::CVTTSS2SI64rr_Int:
7805 case X86::VCVTTSS2SIrr_Int:
7806 case X86::VCVTTSS2SI64rr_Int:
7807 case X86::VCVTTSS2SIZrr_Int:
7808 case X86::VCVTTSS2SI64Zrr_Int:
7809 case X86::VCVTSS2USIZrr_Int:
7810 case X86::VCVTSS2USI64Zrr_Int:
7811 case X86::VCVTTSS2USIZrr_Int:
7812 case X86::VCVTTSS2USI64Zrr_Int:
7813 case X86::RCPSSr_Int:
7814 case X86::VRCPSSr_Int:
7815 case X86::RSQRTSSr_Int:
7816 case X86::VRSQRTSSr_Int:
7817 case X86::ROUNDSSri_Int:
7818 case X86::VROUNDSSri_Int:
7819 case X86::COMISSrr_Int:
7820 case X86::VCOMISSrr_Int:
7821 case X86::VCOMISSZrr_Int:
7822 case X86::UCOMISSrr_Int:
7823 case X86::VUCOMISSrr_Int:
7824 case X86::VUCOMISSZrr_Int:
7825 case X86::ADDSSrr_Int:
7826 case X86::VADDSSrr_Int:
7827 case X86::VADDSSZrr_Int:
7828 case X86::CMPSSrri_Int:
7829 case X86::VCMPSSrri_Int:
7830 case X86::VCMPSSZrri_Int:
7831 case X86::DIVSSrr_Int:
7832 case X86::VDIVSSrr_Int:
7833 case X86::VDIVSSZrr_Int:
7834 case X86::MAXSSrr_Int:
7835 case X86::VMAXSSrr_Int:
7836 case X86::VMAXSSZrr_Int:
7837 case X86::MINSSrr_Int:
7838 case X86::VMINSSrr_Int:
7839 case X86::VMINSSZrr_Int:
7840 case X86::MULSSrr_Int:
7841 case X86::VMULSSrr_Int:
7842 case X86::VMULSSZrr_Int:
7843 case X86::SQRTSSr_Int:
7844 case X86::VSQRTSSr_Int:
7845 case X86::VSQRTSSZr_Int:
7846 case X86::SUBSSrr_Int:
7847 case X86::VSUBSSrr_Int:
7848 case X86::VSUBSSZrr_Int:
7849 case X86::VADDSSZrrk_Int:
7850 case X86::VADDSSZrrkz_Int:
7851 case X86::VCMPSSZrrik_Int:
7852 case X86::VDIVSSZrrk_Int:
7853 case X86::VDIVSSZrrkz_Int:
7854 case X86::VMAXSSZrrk_Int:
7855 case X86::VMAXSSZrrkz_Int:
7856 case X86::VMINSSZrrk_Int:
7857 case X86::VMINSSZrrkz_Int:
7858 case X86::VMULSSZrrk_Int:
7859 case X86::VMULSSZrrkz_Int:
7860 case X86::VSQRTSSZrk_Int:
7861 case X86::VSQRTSSZrkz_Int:
7862 case X86::VSUBSSZrrk_Int:
7863 case X86::VSUBSSZrrkz_Int:
7864 case X86::VFMADDSS4rr_Int:
7865 case X86::VFNMADDSS4rr_Int:
7866 case X86::VFMSUBSS4rr_Int:
7867 case X86::VFNMSUBSS4rr_Int:
7868 case X86::VFMADD132SSr_Int:
7869 case X86::VFNMADD132SSr_Int:
7870 case X86::VFMADD213SSr_Int:
7871 case X86::VFNMADD213SSr_Int:
7872 case X86::VFMADD231SSr_Int:
7873 case X86::VFNMADD231SSr_Int:
7874 case X86::VFMSUB132SSr_Int:
7875 case X86::VFNMSUB132SSr_Int:
7876 case X86::VFMSUB213SSr_Int:
7877 case X86::VFNMSUB213SSr_Int:
7878 case X86::VFMSUB231SSr_Int:
7879 case X86::VFNMSUB231SSr_Int:
7880 case X86::VFMADD132SSZr_Int:
7881 case X86::VFNMADD132SSZr_Int:
7882 case X86::VFMADD213SSZr_Int:
7883 case X86::VFNMADD213SSZr_Int:
7884 case X86::VFMADD231SSZr_Int:
7885 case X86::VFNMADD231SSZr_Int:
7886 case X86::VFMSUB132SSZr_Int:
7887 case X86::VFNMSUB132SSZr_Int:
7888 case X86::VFMSUB213SSZr_Int:
7889 case X86::VFNMSUB213SSZr_Int:
7890 case X86::VFMSUB231SSZr_Int:
7891 case X86::VFNMSUB231SSZr_Int:
7892 case X86::VFMADD132SSZrk_Int:
7893 case X86::VFNMADD132SSZrk_Int:
7894 case X86::VFMADD213SSZrk_Int:
7895 case X86::VFNMADD213SSZrk_Int:
7896 case X86::VFMADD231SSZrk_Int:
7897 case X86::VFNMADD231SSZrk_Int:
7898 case X86::VFMSUB132SSZrk_Int:
7899 case X86::VFNMSUB132SSZrk_Int:
7900 case X86::VFMSUB213SSZrk_Int:
7901 case X86::VFNMSUB213SSZrk_Int:
7902 case X86::VFMSUB231SSZrk_Int:
7903 case X86::VFNMSUB231SSZrk_Int:
7904 case X86::VFMADD132SSZrkz_Int:
7905 case X86::VFNMADD132SSZrkz_Int:
7906 case X86::VFMADD213SSZrkz_Int:
7907 case X86::VFNMADD213SSZrkz_Int:
7908 case X86::VFMADD231SSZrkz_Int:
7909 case X86::VFNMADD231SSZrkz_Int:
7910 case X86::VFMSUB132SSZrkz_Int:
7911 case X86::VFNMSUB132SSZrkz_Int:
7912 case X86::VFMSUB213SSZrkz_Int:
7913 case X86::VFNMSUB213SSZrkz_Int:
7914 case X86::VFMSUB231SSZrkz_Int:
7915 case X86::VFNMSUB231SSZrkz_Int:
7916 case X86::VFIXUPIMMSSZrri:
7917 case X86::VFIXUPIMMSSZrrik:
7918 case X86::VFIXUPIMMSSZrrikz:
7919 case X86::VFPCLASSSSZri:
7920 case X86::VFPCLASSSSZrik:
7921 case X86::VGETEXPSSZr:
7922 case X86::VGETEXPSSZrk:
7923 case X86::VGETEXPSSZrkz:
7924 case X86::VGETMANTSSZrri:
7925 case X86::VGETMANTSSZrrik:
7926 case X86::VGETMANTSSZrrikz:
7927 case X86::VRANGESSZrri:
7928 case X86::VRANGESSZrrik:
7929 case X86::VRANGESSZrrikz:
7930 case X86::VRCP14SSZrr:
7931 case X86::VRCP14SSZrrk:
7932 case X86::VRCP14SSZrrkz:
7933 case X86::VRCP28SSZr:
7934 case X86::VRCP28SSZrk:
7935 case X86::VRCP28SSZrkz:
7936 case X86::VREDUCESSZrri:
7937 case X86::VREDUCESSZrrik:
7938 case X86::VREDUCESSZrrikz:
7939 case X86::VRNDSCALESSZrri_Int:
7940 case X86::VRNDSCALESSZrrik_Int:
7941 case X86::VRNDSCALESSZrrikz_Int:
7942 case X86::VRSQRT14SSZrr:
7943 case X86::VRSQRT14SSZrrk:
7944 case X86::VRSQRT14SSZrrkz:
7945 case X86::VRSQRT28SSZr:
7946 case X86::VRSQRT28SSZrk:
7947 case X86::VRSQRT28SSZrkz:
7948 case X86::VSCALEFSSZrr:
7949 case X86::VSCALEFSSZrrk:
7950 case X86::VSCALEFSSZrrkz:
7957 if ((
Opc == X86::MOVSDrm ||
Opc == X86::VMOVSDrm ||
Opc == X86::VMOVSDZrm ||
7958 Opc == X86::MOVSDrm_alt ||
Opc == X86::VMOVSDrm_alt ||
7959 Opc == X86::VMOVSDZrm_alt) &&
7965 case X86::CVTSD2SSrr_Int:
7966 case X86::VCVTSD2SSrr_Int:
7967 case X86::VCVTSD2SSZrr_Int:
7968 case X86::VCVTSD2SSZrrk_Int:
7969 case X86::VCVTSD2SSZrrkz_Int:
7970 case X86::CVTSD2SIrr_Int:
7971 case X86::CVTSD2SI64rr_Int:
7972 case X86::VCVTSD2SIrr_Int:
7973 case X86::VCVTSD2SI64rr_Int:
7974 case X86::VCVTSD2SIZrr_Int:
7975 case X86::VCVTSD2SI64Zrr_Int:
7976 case X86::CVTTSD2SIrr_Int:
7977 case X86::CVTTSD2SI64rr_Int:
7978 case X86::VCVTTSD2SIrr_Int:
7979 case X86::VCVTTSD2SI64rr_Int:
7980 case X86::VCVTTSD2SIZrr_Int:
7981 case X86::VCVTTSD2SI64Zrr_Int:
7982 case X86::VCVTSD2USIZrr_Int:
7983 case X86::VCVTSD2USI64Zrr_Int:
7984 case X86::VCVTTSD2USIZrr_Int:
7985 case X86::VCVTTSD2USI64Zrr_Int:
7986 case X86::ROUNDSDri_Int:
7987 case X86::VROUNDSDri_Int:
7988 case X86::COMISDrr_Int:
7989 case X86::VCOMISDrr_Int:
7990 case X86::VCOMISDZrr_Int:
7991 case X86::UCOMISDrr_Int:
7992 case X86::VUCOMISDrr_Int:
7993 case X86::VUCOMISDZrr_Int:
7994 case X86::ADDSDrr_Int:
7995 case X86::VADDSDrr_Int:
7996 case X86::VADDSDZrr_Int:
7997 case X86::CMPSDrri_Int:
7998 case X86::VCMPSDrri_Int:
7999 case X86::VCMPSDZrri_Int:
8000 case X86::DIVSDrr_Int:
8001 case X86::VDIVSDrr_Int:
8002 case X86::VDIVSDZrr_Int:
8003 case X86::MAXSDrr_Int:
8004 case X86::VMAXSDrr_Int:
8005 case X86::VMAXSDZrr_Int:
8006 case X86::MINSDrr_Int:
8007 case X86::VMINSDrr_Int:
8008 case X86::VMINSDZrr_Int:
8009 case X86::MULSDrr_Int:
8010 case X86::VMULSDrr_Int:
8011 case X86::VMULSDZrr_Int:
8012 case X86::SQRTSDr_Int:
8013 case X86::VSQRTSDr_Int:
8014 case X86::VSQRTSDZr_Int:
8015 case X86::SUBSDrr_Int:
8016 case X86::VSUBSDrr_Int:
8017 case X86::VSUBSDZrr_Int:
8018 case X86::VADDSDZrrk_Int:
8019 case X86::VADDSDZrrkz_Int:
8020 case X86::VCMPSDZrrik_Int:
8021 case X86::VDIVSDZrrk_Int:
8022 case X86::VDIVSDZrrkz_Int:
8023 case X86::VMAXSDZrrk_Int:
8024 case X86::VMAXSDZrrkz_Int:
8025 case X86::VMINSDZrrk_Int:
8026 case X86::VMINSDZrrkz_Int:
8027 case X86::VMULSDZrrk_Int:
8028 case X86::VMULSDZrrkz_Int:
8029 case X86::VSQRTSDZrk_Int:
8030 case X86::VSQRTSDZrkz_Int:
8031 case X86::VSUBSDZrrk_Int:
8032 case X86::VSUBSDZrrkz_Int:
8033 case X86::VFMADDSD4rr_Int:
8034 case X86::VFNMADDSD4rr_Int:
8035 case X86::VFMSUBSD4rr_Int:
8036 case X86::VFNMSUBSD4rr_Int:
8037 case X86::VFMADD132SDr_Int:
8038 case X86::VFNMADD132SDr_Int:
8039 case X86::VFMADD213SDr_Int:
8040 case X86::VFNMADD213SDr_Int:
8041 case X86::VFMADD231SDr_Int:
8042 case X86::VFNMADD231SDr_Int:
8043 case X86::VFMSUB132SDr_Int:
8044 case X86::VFNMSUB132SDr_Int:
8045 case X86::VFMSUB213SDr_Int:
8046 case X86::VFNMSUB213SDr_Int:
8047 case X86::VFMSUB231SDr_Int:
8048 case X86::VFNMSUB231SDr_Int:
8049 case X86::VFMADD132SDZr_Int:
8050 case X86::VFNMADD132SDZr_Int:
8051 case X86::VFMADD213SDZr_Int:
8052 case X86::VFNMADD213SDZr_Int:
8053 case X86::VFMADD231SDZr_Int:
8054 case X86::VFNMADD231SDZr_Int:
8055 case X86::VFMSUB132SDZr_Int:
8056 case X86::VFNMSUB132SDZr_Int:
8057 case X86::VFMSUB213SDZr_Int:
8058 case X86::VFNMSUB213SDZr_Int:
8059 case X86::VFMSUB231SDZr_Int:
8060 case X86::VFNMSUB231SDZr_Int:
8061 case X86::VFMADD132SDZrk_Int:
8062 case X86::VFNMADD132SDZrk_Int:
8063 case X86::VFMADD213SDZrk_Int:
8064 case X86::VFNMADD213SDZrk_Int:
8065 case X86::VFMADD231SDZrk_Int:
8066 case X86::VFNMADD231SDZrk_Int:
8067 case X86::VFMSUB132SDZrk_Int:
8068 case X86::VFNMSUB132SDZrk_Int:
8069 case X86::VFMSUB213SDZrk_Int:
8070 case X86::VFNMSUB213SDZrk_Int:
8071 case X86::VFMSUB231SDZrk_Int:
8072 case X86::VFNMSUB231SDZrk_Int:
8073 case X86::VFMADD132SDZrkz_Int:
8074 case X86::VFNMADD132SDZrkz_Int:
8075 case X86::VFMADD213SDZrkz_Int:
8076 case X86::VFNMADD213SDZrkz_Int:
8077 case X86::VFMADD231SDZrkz_Int:
8078 case X86::VFNMADD231SDZrkz_Int:
8079 case X86::VFMSUB132SDZrkz_Int:
8080 case X86::VFNMSUB132SDZrkz_Int:
8081 case X86::VFMSUB213SDZrkz_Int:
8082 case X86::VFNMSUB213SDZrkz_Int:
8083 case X86::VFMSUB231SDZrkz_Int:
8084 case X86::VFNMSUB231SDZrkz_Int:
8085 case X86::VFIXUPIMMSDZrri:
8086 case X86::VFIXUPIMMSDZrrik:
8087 case X86::VFIXUPIMMSDZrrikz:
8088 case X86::VFPCLASSSDZri:
8089 case X86::VFPCLASSSDZrik:
8090 case X86::VGETEXPSDZr:
8091 case X86::VGETEXPSDZrk:
8092 case X86::VGETEXPSDZrkz:
8093 case X86::VGETMANTSDZrri:
8094 case X86::VGETMANTSDZrrik:
8095 case X86::VGETMANTSDZrrikz:
8096 case X86::VRANGESDZrri:
8097 case X86::VRANGESDZrrik:
8098 case X86::VRANGESDZrrikz:
8099 case X86::VRCP14SDZrr:
8100 case X86::VRCP14SDZrrk:
8101 case X86::VRCP14SDZrrkz:
8102 case X86::VRCP28SDZr:
8103 case X86::VRCP28SDZrk:
8104 case X86::VRCP28SDZrkz:
8105 case X86::VREDUCESDZrri:
8106 case X86::VREDUCESDZrrik:
8107 case X86::VREDUCESDZrrikz:
8108 case X86::VRNDSCALESDZrri_Int:
8109 case X86::VRNDSCALESDZrrik_Int:
8110 case X86::VRNDSCALESDZrrikz_Int:
8111 case X86::VRSQRT14SDZrr:
8112 case X86::VRSQRT14SDZrrk:
8113 case X86::VRSQRT14SDZrrkz:
8114 case X86::VRSQRT28SDZr:
8115 case X86::VRSQRT28SDZrk:
8116 case X86::VRSQRT28SDZrkz:
8117 case X86::VSCALEFSDZrr:
8118 case X86::VSCALEFSDZrrk:
8119 case X86::VSCALEFSDZrrkz:
8126 if ((
Opc == X86::VMOVSHZrm ||
Opc == X86::VMOVSHZrm_alt) &&
RegSize > 16) {
8131 case X86::VADDSHZrr_Int:
8132 case X86::VCMPSHZrri_Int:
8133 case X86::VDIVSHZrr_Int:
8134 case X86::VMAXSHZrr_Int:
8135 case X86::VMINSHZrr_Int:
8136 case X86::VMULSHZrr_Int:
8137 case X86::VSUBSHZrr_Int:
8138 case X86::VADDSHZrrk_Int:
8139 case X86::VADDSHZrrkz_Int:
8140 case X86::VCMPSHZrrik_Int:
8141 case X86::VDIVSHZrrk_Int:
8142 case X86::VDIVSHZrrkz_Int:
8143 case X86::VMAXSHZrrk_Int:
8144 case X86::VMAXSHZrrkz_Int:
8145 case X86::VMINSHZrrk_Int:
8146 case X86::VMINSHZrrkz_Int:
8147 case X86::VMULSHZrrk_Int:
8148 case X86::VMULSHZrrkz_Int:
8149 case X86::VSUBSHZrrk_Int:
8150 case X86::VSUBSHZrrkz_Int:
8151 case X86::VFMADD132SHZr_Int:
8152 case X86::VFNMADD132SHZr_Int:
8153 case X86::VFMADD213SHZr_Int:
8154 case X86::VFNMADD213SHZr_Int:
8155 case X86::VFMADD231SHZr_Int:
8156 case X86::VFNMADD231SHZr_Int:
8157 case X86::VFMSUB132SHZr_Int:
8158 case X86::VFNMSUB132SHZr_Int:
8159 case X86::VFMSUB213SHZr_Int:
8160 case X86::VFNMSUB213SHZr_Int:
8161 case X86::VFMSUB231SHZr_Int:
8162 case X86::VFNMSUB231SHZr_Int:
8163 case X86::VFMADD132SHZrk_Int:
8164 case X86::VFNMADD132SHZrk_Int:
8165 case X86::VFMADD213SHZrk_Int:
8166 case X86::VFNMADD213SHZrk_Int:
8167 case X86::VFMADD231SHZrk_Int:
8168 case X86::VFNMADD231SHZrk_Int:
8169 case X86::VFMSUB132SHZrk_Int:
8170 case X86::VFNMSUB132SHZrk_Int:
8171 case X86::VFMSUB213SHZrk_Int:
8172 case X86::VFNMSUB213SHZrk_Int:
8173 case X86::VFMSUB231SHZrk_Int:
8174 case X86::VFNMSUB231SHZrk_Int:
8175 case X86::VFMADD132SHZrkz_Int:
8176 case X86::VFNMADD132SHZrkz_Int:
8177 case X86::VFMADD213SHZrkz_Int:
8178 case X86::VFNMADD213SHZrkz_Int:
8179 case X86::VFMADD231SHZrkz_Int:
8180 case X86::VFNMADD231SHZrkz_Int:
8181 case X86::VFMSUB132SHZrkz_Int:
8182 case X86::VFNMSUB132SHZrkz_Int:
8183 case X86::VFMSUB213SHZrkz_Int:
8184 case X86::VFNMSUB213SHZrkz_Int:
8185 case X86::VFMSUB231SHZrkz_Int:
8186 case X86::VFNMSUB231SHZrkz_Int:
8212 return RC == &X86::VK2WMRegClass || RC == &X86::VK4WMRegClass ||
8213 RC == &X86::VK8WMRegClass || RC == &X86::VK16WMRegClass ||
8214 RC == &X86::VK32WMRegClass || RC == &X86::VK64WMRegClass;
8228 bool HasSameMask =
false;
8229 for (
unsigned I = 1, E =
MI.getDesc().getNumOperands();
I < E; ++
I) {
8231 if (
Op.isReg() &&
Op.getReg() == MaskReg) {
8243 for (
auto Op :
Ops) {
8244 if (
MI.getOperand(
Op).getSubReg())
8281 case X86::AVX512_512_SET0:
8282 case X86::AVX512_512_SETALLONES:
8283 Alignment =
Align(64);
8285 case X86::AVX2_SETALLONES:
8286 case X86::AVX1_SETALLONES:
8288 case X86::AVX512_256_SET0:
8289 case X86::AVX512_256_SETALLONES:
8290 Alignment =
Align(32);
8293 case X86::V_SETALLONES:
8294 case X86::AVX512_128_SET0:
8295 case X86::FsFLD0F128:
8296 case X86::AVX512_FsFLD0F128:
8297 case X86::AVX512_128_SETALLONES:
8298 Alignment =
Align(16);
8302 case X86::AVX512_FsFLD0SD:
8303 Alignment =
Align(8);
8306 case X86::AVX512_FsFLD0SS:
8307 Alignment =
Align(4);
8310 case X86::AVX512_FsFLD0SH:
8311 Alignment =
Align(2);
8316 if (
Ops.size() == 2 &&
Ops[0] == 0 &&
Ops[1] == 1) {
8317 unsigned NewOpc = 0;
8318 switch (
MI.getOpcode()) {
8322 NewOpc = X86::CMP8ri;
8325 NewOpc = X86::CMP16ri;
8328 NewOpc = X86::CMP32ri;
8331 NewOpc = X86::CMP64ri32;
8335 MI.setDesc(
get(NewOpc));
8336 MI.getOperand(1).ChangeToImmediate(0);
8337 }
else if (
Ops.size() != 1)
8349 case X86::V_SETALLONES:
8350 case X86::AVX2_SETALLONES:
8351 case X86::AVX1_SETALLONES:
8353 case X86::AVX512_128_SET0:
8354 case X86::AVX512_256_SET0:
8355 case X86::AVX512_512_SET0:
8356 case X86::AVX512_128_SETALLONES:
8357 case X86::AVX512_256_SETALLONES:
8358 case X86::AVX512_512_SETALLONES:
8360 case X86::AVX512_FsFLD0SH:
8362 case X86::AVX512_FsFLD0SD:
8364 case X86::AVX512_FsFLD0SS:
8365 case X86::FsFLD0F128:
8366 case X86::AVX512_FsFLD0F128: {
8375 unsigned PICBase = 0;
8378 if (Subtarget.is64Bit()) {
8391 bool IsAllOnes =
false;
8394 case X86::AVX512_FsFLD0SS:
8398 case X86::AVX512_FsFLD0SD:
8401 case X86::FsFLD0F128:
8402 case X86::AVX512_FsFLD0F128:
8406 case X86::AVX512_FsFLD0SH:
8409 case X86::AVX512_512_SETALLONES:
8412 case X86::AVX512_512_SET0:
8416 case X86::AVX1_SETALLONES:
8417 case X86::AVX2_SETALLONES:
8418 case X86::AVX512_256_SETALLONES:
8421 case X86::AVX512_256_SET0:
8431 case X86::V_SETALLONES:
8432 case X86::AVX512_128_SETALLONES:
8436 case X86::AVX512_128_SET0:
8454 case X86::VPBROADCASTBZ128rm:
8455 case X86::VPBROADCASTBZ256rm:
8456 case X86::VPBROADCASTBZrm:
8457 case X86::VBROADCASTF32X2Z256rm:
8458 case X86::VBROADCASTF32X2Zrm:
8459 case X86::VBROADCASTI32X2Z128rm:
8460 case X86::VBROADCASTI32X2Z256rm:
8461 case X86::VBROADCASTI32X2Zrm:
8465#define FOLD_BROADCAST(SIZE) \
8466 MOs.append(LoadMI.operands_begin() + NumOps - X86::AddrNumOperands, \
8467 LoadMI.operands_begin() + NumOps); \
8468 return foldMemoryBroadcast(MF, MI, Ops[0], MOs, InsertPt, SIZE, \
8470 case X86::VPBROADCASTWZ128rm:
8471 case X86::VPBROADCASTWZ256rm:
8472 case X86::VPBROADCASTWZrm:
8474 case X86::VPBROADCASTDZ128rm:
8475 case X86::VPBROADCASTDZ256rm:
8476 case X86::VPBROADCASTDZrm:
8477 case X86::VBROADCASTSSZ128rm:
8478 case X86::VBROADCASTSSZ256rm:
8479 case X86::VBROADCASTSSZrm:
8481 case X86::VPBROADCASTQZ128rm:
8482 case X86::VPBROADCASTQZ256rm:
8483 case X86::VPBROADCASTQZrm:
8484 case X86::VBROADCASTSDZ256rm:
8485 case X86::VBROADCASTSDZrm:
8506 unsigned BitsSize,
bool AllowCommute)
const {
8510 ?
fuseInst(MF,
I->DstOp, OpNum, MOs, InsertPt,
MI, *
this)
8516 unsigned CommuteOpIdx2 = commuteOperandsForFold(
MI, OpNum);
8517 if (CommuteOpIdx2 == OpNum) {
8522 foldMemoryBroadcast(MF,
MI, CommuteOpIdx2, MOs, InsertPt, BitsSize,
8527 commuteInstruction(
MI,
false, OpNum, CommuteOpIdx2);
8542 if (!MMO->isStore()) {
8560 if (!MMO->isStore())
8563 if (!MMO->isLoad()) {
8581 assert((SpillSize == 64 || STI.hasVLX()) &&
8582 "Can't broadcast less than 64 bytes without AVX512VL!");
8584#define CASE_BCAST_TYPE_OPC(TYPE, OP16, OP32, OP64) \
8586 switch (SpillSize) { \
8588 llvm_unreachable("Unknown spill size"); \
8622 unsigned Opc =
I->DstOp;
8626 if (UnfoldLoad && !FoldedLoad)
8628 UnfoldLoad &= FoldedLoad;
8629 if (UnfoldStore && !FoldedStore)
8631 UnfoldStore &= FoldedStore;
8638 if (!
MI.hasOneMemOperand() && RC == &X86::VR128RegClass &&
8639 Subtarget.isUnalignedMem16Slow())
8648 for (
unsigned i = 0, e =
MI.getNumOperands(); i != e; ++i) {
8652 else if (
Op.isReg() &&
Op.isImplicit())
8668 unsigned Alignment = std::max<uint32_t>(
TRI.getSpillSize(*RC), 16);
8669 bool isAligned = !MMOs.empty() && MMOs.front()->getAlign() >= Alignment;
8713 case X86::CMP64ri32:
8724 case X86::CMP64ri32:
8725 NewOpc = X86::TEST64rr;
8728 NewOpc = X86::TEST32rr;
8731 NewOpc = X86::TEST16rr;
8734 NewOpc = X86::TEST8rr;
8748 unsigned Alignment = std::max<uint32_t>(
TRI.getSpillSize(*DstRC), 16);
8749 bool isAligned = !MMOs.empty() && MMOs.front()->getAlign() >= Alignment;
8765 if (!
N->isMachineOpcode())
8771 unsigned Opc =
I->DstOp;
8779 unsigned NumDefs =
MCID.NumDefs;
8780 std::vector<SDValue> AddrOps;
8781 std::vector<SDValue> BeforeOps;
8782 std::vector<SDValue> AfterOps;
8784 unsigned NumOps =
N->getNumOperands();
8785 for (
unsigned i = 0; i !=
NumOps - 1; ++i) {
8788 AddrOps.push_back(
Op);
8789 else if (i < Index - NumDefs)
8790 BeforeOps.push_back(
Op);
8791 else if (i > Index - NumDefs)
8792 AfterOps.push_back(
Op);
8795 AddrOps.push_back(Chain);
8800 EVT VT = *
TRI.legalclasstypes_begin(*RC);
8802 if (MMOs.empty() && RC == &X86::VR128RegClass &&
8803 Subtarget.isUnalignedMem16Slow())
8813 unsigned Alignment = std::max<uint32_t>(
TRI.getSpillSize(*RC), 16);
8814 bool isAligned = !MMOs.empty() && MMOs.front()->getAlign() >= Alignment;
8826 std::vector<EVT> VTs;
8828 if (
MCID.getNumDefs() > 0) {
8830 VTs.push_back(*
TRI.legalclasstypes_begin(*DstRC));
8832 for (
unsigned i = 0, e =
N->getNumValues(); i != e; ++i) {
8833 EVT VT =
N->getValueType(i);
8834 if (VT != MVT::Other && i >= (
unsigned)
MCID.getNumDefs())
8838 BeforeOps.push_back(
SDValue(Load, 0));
8844 case X86::CMP64ri32:
8852 case X86::CMP64ri32:
8853 Opc = X86::TEST64rr;
8856 Opc = X86::TEST32rr;
8859 Opc = X86::TEST16rr;
8865 BeforeOps[1] = BeforeOps[0];
8874 AddrOps.push_back(
SDValue(NewNode, 0));
8875 AddrOps.push_back(Chain);
8877 if (MMOs.empty() && RC == &X86::VR128RegClass &&
8878 Subtarget.isUnalignedMem16Slow())
8883 unsigned Alignment = std::max<uint32_t>(
TRI.getSpillSize(*RC), 16);
8884 bool isAligned = !MMOs.empty() && MMOs.front()->getAlign() >= Alignment;
8887 dl, MVT::Other, AddrOps);
8900 unsigned *LoadRegIndex)
const {
8906 if (UnfoldLoad && !FoldedLoad)
8908 if (UnfoldStore && !FoldedStore)
8917 int64_t &Offset2)
const {
8921 auto IsLoadOpcode = [&](
unsigned Opcode) {
8933 case X86::MOVSSrm_alt:
8935 case X86::MOVSDrm_alt:
8936 case X86::MMX_MOVD64rm:
8937 case X86::MMX_MOVQ64rm:
8946 case X86::VMOVSSrm_alt:
8948 case X86::VMOVSDrm_alt:
8949 case X86::VMOVAPSrm:
8950 case X86::VMOVUPSrm:
8951 case X86::VMOVAPDrm:
8952 case X86::VMOVUPDrm:
8953 case X86::VMOVDQArm:
8954 case X86::VMOVDQUrm:
8955 case X86::VMOVAPSYrm:
8956 case X86::VMOVUPSYrm:
8957 case X86::VMOVAPDYrm:
8958 case X86::VMOVUPDYrm:
8959 case X86::VMOVDQAYrm:
8960 case X86::VMOVDQUYrm:
8962 case X86::VMOVSSZrm:
8963 case X86::VMOVSSZrm_alt:
8964 case X86::VMOVSDZrm:
8965 case X86::VMOVSDZrm_alt:
8966 case X86::VMOVAPSZ128rm:
8967 case X86::VMOVUPSZ128rm:
8968 case X86::VMOVAPSZ128rm_NOVLX:
8969 case X86::VMOVUPSZ128rm_NOVLX:
8970 case X86::VMOVAPDZ128rm:
8971 case X86::VMOVUPDZ128rm:
8972 case X86::VMOVDQU8Z128rm:
8973 case X86::VMOVDQU16Z128rm:
8974 case X86::VMOVDQA32Z128rm:
8975 case X86::VMOVDQU32Z128rm:
8976 case X86::VMOVDQA64Z128rm:
8977 case X86::VMOVDQU64Z128rm:
8978 case X86::VMOVAPSZ256rm:
8979 case X86::VMOVUPSZ256rm:
8980 case X86::VMOVAPSZ256rm_NOVLX:
8981 case X86::VMOVUPSZ256rm_NOVLX:
8982 case X86::VMOVAPDZ256rm:
8983 case X86::VMOVUPDZ256rm:
8984 case X86::VMOVDQU8Z256rm:
8985 case X86::VMOVDQU16Z256rm:
8986 case X86::VMOVDQA32Z256rm:
8987 case X86::VMOVDQU32Z256rm:
8988 case X86::VMOVDQA64Z256rm:
8989 case X86::VMOVDQU64Z256rm:
8990 case X86::VMOVAPSZrm:
8991 case X86::VMOVUPSZrm:
8992 case X86::VMOVAPDZrm:
8993 case X86::VMOVUPDZrm:
8994 case X86::VMOVDQU8Zrm:
8995 case X86::VMOVDQU16Zrm:
8996 case X86::VMOVDQA32Zrm:
8997 case X86::VMOVDQU32Zrm:
8998 case X86::VMOVDQA64Zrm:
8999 case X86::VMOVDQU64Zrm:
9001 case X86::KMOVBkm_EVEX:
9003 case X86::KMOVWkm_EVEX:
9005 case X86::KMOVDkm_EVEX:
9007 case X86::KMOVQkm_EVEX:
9017 auto HasSameOp = [&](
int I) {
9033 if (!Disp1 || !Disp2)
9036 Offset1 = Disp1->getSExtValue();
9037 Offset2 = Disp2->getSExtValue();
9042 int64_t Offset1, int64_t Offset2,
9043 unsigned NumLoads)
const {
9044 assert(Offset2 > Offset1);
9045 if ((Offset2 - Offset1) / 8 > 64)
9059 case X86::MMX_MOVD64rm:
9060 case X86::MMX_MOVQ64rm:
9069 if (Subtarget.is64Bit()) {
9072 }
else if (NumLoads) {
9095 unsigned Opcode =
MI.getOpcode();
9096 if (Opcode == X86::ENDBR64 || Opcode == X86::ENDBR32 ||
9097 Opcode == X86::PLDTILECFGV)
9110 assert(
Cond.size() == 1 &&
"Invalid X86 branch condition!");
9120 return !(RC == &X86::CCRRegClass || RC == &X86::DFCCRRegClass ||
9121 RC == &X86::RFP32RegClass || RC == &X86::RFP64RegClass ||
9122 RC == &X86::RFP80RegClass);
9135 return GlobalBaseReg;
9140 GlobalBaseReg = RegInfo.createVirtualRegister(
9141 Subtarget.is64Bit() ? &X86::GR64_NOSPRegClass : &X86::GR32_NOSPRegClass);
9143 return GlobalBaseReg;
9151 for (
const uint16_t(&Row)[3] : Table)
9152 if (Row[domain - 1] == opcode)
9160 for (
const uint16_t(&Row)[4] : Table)
9161 if (Row[domain - 1] == opcode || (domain == 3 && Row[3] == opcode))
9168 unsigned NewWidth,
unsigned *pNewMask =
nullptr) {
9169 assert(((OldWidth % NewWidth) == 0 || (NewWidth % OldWidth) == 0) &&
9170 "Illegal blend mask scale");
9171 unsigned NewMask = 0;
9173 if ((OldWidth % NewWidth) == 0) {
9174 unsigned Scale = OldWidth / NewWidth;
9175 unsigned SubMask = (1u << Scale) - 1;
9176 for (
unsigned i = 0; i != NewWidth; ++i) {
9177 unsigned Sub = (OldMask >> (i * Scale)) & SubMask;
9179 NewMask |= (1u << i);
9180 else if (
Sub != 0x0)
9184 unsigned Scale = NewWidth / OldWidth;
9185 unsigned SubMask = (1u << Scale) - 1;
9186 for (
unsigned i = 0; i != OldWidth; ++i) {
9187 if (OldMask & (1 << i)) {
9188 NewMask |= (SubMask << (i * Scale));
9194 *pNewMask = NewMask;
9199 unsigned Opcode =
MI.getOpcode();
9200 unsigned NumOperands =
MI.getDesc().getNumOperands();
9202 auto GetBlendDomains = [&](
unsigned ImmWidth,
bool Is256) {
9204 if (
MI.getOperand(NumOperands - 1).isImm()) {
9205 unsigned Imm =
MI.getOperand(NumOperands - 1).getImm();
9207 validDomains |= 0x2;
9209 validDomains |= 0x4;
9210 if (!Is256 || Subtarget.hasAVX2())
9211 validDomains |= 0x8;
9213 return validDomains;
9217 case X86::BLENDPDrmi:
9218 case X86::BLENDPDrri:
9219 case X86::VBLENDPDrmi:
9220 case X86::VBLENDPDrri:
9221 return GetBlendDomains(2,
false);
9222 case X86::VBLENDPDYrmi:
9223 case X86::VBLENDPDYrri:
9224 return GetBlendDomains(4,
true);
9225 case X86::BLENDPSrmi:
9226 case X86::BLENDPSrri:
9227 case X86::VBLENDPSrmi:
9228 case X86::VBLENDPSrri:
9229 case X86::VPBLENDDrmi:
9230 case X86::VPBLENDDrri:
9231 return GetBlendDomains(4,
false);
9232 case X86::VBLENDPSYrmi:
9233 case X86::VBLENDPSYrri:
9234 case X86::VPBLENDDYrmi:
9235 case X86::VPBLENDDYrri:
9236 return GetBlendDomains(8,
true);
9237 case X86::PBLENDWrmi:
9238 case X86::PBLENDWrri:
9239 case X86::VPBLENDWrmi:
9240 case X86::VPBLENDWrri:
9242 case X86::VPBLENDWYrmi:
9243 case X86::VPBLENDWYrri:
9244 return GetBlendDomains(8,
false);
9245 case X86::VPANDDZ128rr:
9246 case X86::VPANDDZ128rm:
9247 case X86::VPANDDZ256rr:
9248 case X86::VPANDDZ256rm:
9249 case X86::VPANDQZ128rr:
9250 case X86::VPANDQZ128rm:
9251 case X86::VPANDQZ256rr:
9252 case X86::VPANDQZ256rm:
9253 case X86::VPANDNDZ128rr:
9254 case X86::VPANDNDZ128rm:
9255 case X86::VPANDNDZ256rr:
9256 case X86::VPANDNDZ256rm:
9257 case X86::VPANDNQZ128rr:
9258 case X86::VPANDNQZ128rm:
9259 case X86::VPANDNQZ256rr:
9260 case X86::VPANDNQZ256rm:
9261 case X86::VPORDZ128rr:
9262 case X86::VPORDZ128rm:
9263 case X86::VPORDZ256rr:
9264 case X86::VPORDZ256rm:
9265 case X86::VPORQZ128rr:
9266 case X86::VPORQZ128rm:
9267 case X86::VPORQZ256rr:
9268 case X86::VPORQZ256rm:
9269 case X86::VPXORDZ128rr:
9270 case X86::VPXORDZ128rm:
9271 case X86::VPXORDZ256rr:
9272 case X86::VPXORDZ256rm:
9273 case X86::VPXORQZ128rr:
9274 case X86::VPXORQZ128rm:
9275 case X86::VPXORQZ256rr:
9276 case X86::VPXORQZ256rm:
9279 if (Subtarget.hasDQI())
9282 if (RI.getEncodingValue(
MI.getOperand(0).getReg()) >= 16)
9284 if (RI.getEncodingValue(
MI.getOperand(1).getReg()) >= 16)
9287 if (NumOperands == 3 &&
9288 RI.getEncodingValue(
MI.getOperand(2).getReg()) >= 16)
9293 case X86::MOVHLPSrr:
9300 if (
MI.getOperand(1).getReg() ==
MI.getOperand(2).getReg() &&
9301 MI.getOperand(0).getSubReg() == 0 &&
9302 MI.getOperand(1).getSubReg() == 0 &&
MI.getOperand(2).getSubReg() == 0)
9305 case X86::SHUFPDrri:
9311#include "X86ReplaceableInstrs.def"
9317 assert(dom &&
"Not an SSE instruction");
9319 unsigned Opcode =
MI.getOpcode();
9320 unsigned NumOperands =
MI.getDesc().getNumOperands();
9322 auto SetBlendDomain = [&](
unsigned ImmWidth,
bool Is256) {
9323 if (
MI.getOperand(NumOperands - 1).isImm()) {
9324 unsigned Imm =
MI.getOperand(NumOperands - 1).getImm() & 255;
9325 Imm = (ImmWidth == 16 ? ((Imm << 8) | Imm) : Imm);
9326 unsigned NewImm = Imm;
9328 const uint16_t *table =
lookup(Opcode, dom, ReplaceableBlendInstrs);
9330 table =
lookup(Opcode, dom, ReplaceableBlendAVX2Instrs);
9334 }
else if (
Domain == 2) {
9336 }
else if (
Domain == 3) {
9337 if (Subtarget.hasAVX2()) {
9339 if ((ImmWidth / (Is256 ? 2 : 1)) != 8) {
9340 table =
lookup(Opcode, dom, ReplaceableBlendAVX2Instrs);
9344 assert(!Is256 &&
"128-bit vector expected");
9349 assert(table && table[
Domain - 1] &&
"Unknown domain op");
9351 MI.getOperand(NumOperands - 1).setImm(NewImm & 255);
9357 case X86::BLENDPDrmi:
9358 case X86::BLENDPDrri:
9359 case X86::VBLENDPDrmi:
9360 case X86::VBLENDPDrri:
9361 return SetBlendDomain(2,
false);
9362 case X86::VBLENDPDYrmi:
9363 case X86::VBLENDPDYrri:
9364 return SetBlendDomain(4,
true);
9365 case X86::BLENDPSrmi:
9366 case X86::BLENDPSrri:
9367 case X86::VBLENDPSrmi:
9368 case X86::VBLENDPSrri:
9369 case X86::VPBLENDDrmi:
9370 case X86::VPBLENDDrri:
9371 return SetBlendDomain(4,
false);
9372 case X86::VBLENDPSYrmi:
9373 case X86::VBLENDPSYrri:
9374 case X86::VPBLENDDYrmi:
9375 case X86::VPBLENDDYrri:
9376 return SetBlendDomain(8,
true);
9377 case X86::PBLENDWrmi:
9378 case X86::PBLENDWrri:
9379 case X86::VPBLENDWrmi:
9380 case X86::VPBLENDWrri:
9381 return SetBlendDomain(8,
false);
9382 case X86::VPBLENDWYrmi:
9383 case X86::VPBLENDWYrri:
9384 return SetBlendDomain(16,
true);
9385 case X86::VPANDDZ128rr:
9386 case X86::VPANDDZ128rm:
9387 case X86::VPANDDZ256rr:
9388 case X86::VPANDDZ256rm:
9389 case X86::VPANDQZ128rr:
9390 case X86::VPANDQZ128rm:
9391 case X86::VPANDQZ256rr:
9392 case X86::VPANDQZ256rm:
9393 case X86::VPANDNDZ128rr:
9394 case X86::VPANDNDZ128rm:
9395 case X86::VPANDNDZ256rr:
9396 case X86::VPANDNDZ256rm:
9397 case X86::VPANDNQZ128rr:
9398 case X86::VPANDNQZ128rm:
9399 case X86::VPANDNQZ256rr:
9400 case X86::VPANDNQZ256rm:
9401 case X86::VPORDZ128rr:
9402 case X86::VPORDZ128rm:
9403 case X86::VPORDZ256rr:
9404 case X86::VPORDZ256rm:
9405 case X86::VPORQZ128rr:
9406 case X86::VPORQZ128rm:
9407 case X86::VPORQZ256rr:
9408 case X86::VPORQZ256rm:
9409 case X86::VPXORDZ128rr:
9410 case X86::VPXORDZ128rm:
9411 case X86::VPXORDZ256rr:
9412 case X86::VPXORDZ256rm:
9413 case X86::VPXORQZ128rr:
9414 case X86::VPXORQZ128rm:
9415 case X86::VPXORQZ256rr:
9416 case X86::VPXORQZ256rm: {
9418 if (Subtarget.hasDQI())
9422 lookupAVX512(
MI.getOpcode(), dom, ReplaceableCustomAVX512LogicInstrs);
9423 assert(table &&
"Instruction not found in table?");
9426 if (
Domain == 3 && (dom == 1 || table[3] ==
MI.getOpcode()))
9431 case X86::UNPCKHPDrr:
9432 case X86::MOVHLPSrr:
9435 MI.getOperand(1).getReg() ==
MI.getOperand(2).getReg() &&
9436 MI.getOperand(0).getSubReg() == 0 &&
9437 MI.getOperand(1).getSubReg() == 0 &&
9438 MI.getOperand(2).getSubReg() == 0) {
9439 commuteInstruction(
MI,
false);
9443 if (Opcode == X86::MOVHLPSrr)
9446 case X86::SHUFPDrri: {
9448 unsigned Imm =
MI.getOperand(3).getImm();
9449 unsigned NewImm = 0x44;
9454 MI.getOperand(3).setImm(NewImm);
9455 MI.setDesc(
get(X86::SHUFPSrri));
9463std::pair<uint16_t, uint16_t>
9466 unsigned opcode =
MI.getOpcode();
9472 return std::make_pair(domain, validDomains);
9474 if (
lookup(opcode, domain, ReplaceableInstrs)) {
9476 }
else if (
lookup(opcode, domain, ReplaceableInstrsAVX2)) {
9477 validDomains = Subtarget.hasAVX2() ? 0xe : 0x6;
9478 }
else if (
lookup(opcode, domain, ReplaceableInstrsFP)) {
9480 }
else if (
lookup(opcode, domain, ReplaceableInstrsAVX2InsertExtract)) {
9483 if (!Subtarget.hasAVX2())
9484 return std::make_pair(0, 0);
9486 }
else if (
lookupAVX512(opcode, domain, ReplaceableInstrsAVX512)) {
9488 }
else if (Subtarget.hasDQI() &&
9489 lookupAVX512(opcode, domain, ReplaceableInstrsAVX512DQ)) {
9491 }
else if (Subtarget.hasDQI()) {
9493 lookupAVX512(opcode, domain, ReplaceableInstrsAVX512DQMasked)) {
9494 if (domain == 1 || (domain == 3 && table[3] == opcode))
9501 return std::make_pair(domain, validDomains);
9507 assert(dom &&
"Not an SSE instruction");
9516 "256-bit vector operations only available in AVX2");
9517 table =
lookup(
MI.getOpcode(), dom, ReplaceableInstrsAVX2);
9520 table =
lookup(
MI.getOpcode(), dom, ReplaceableInstrsFP);
9522 "Can only select PackedSingle or PackedDouble");
9525 assert(Subtarget.hasAVX2() &&
9526 "256-bit insert/extract only available in AVX2");
9527 table =
lookup(
MI.getOpcode(), dom, ReplaceableInstrsAVX2InsertExtract);
9530 assert(Subtarget.hasAVX512() &&
"Requires AVX-512");
9531 table =
lookupAVX512(
MI.getOpcode(), dom, ReplaceableInstrsAVX512);
9533 if (table &&
Domain == 3 && table[3] ==
MI.getOpcode())
9537 assert((Subtarget.hasDQI() ||
Domain >= 3) &&
"Requires AVX-512DQ");
9538 table =
lookupAVX512(
MI.getOpcode(), dom, ReplaceableInstrsAVX512DQ);
9541 if (table &&
Domain == 3 && (dom == 1 || table[3] ==
MI.getOpcode()))
9545 assert((Subtarget.hasDQI() ||
Domain >= 3) &&
"Requires AVX-512DQ");
9546 table =
lookupAVX512(
MI.getOpcode(), dom, ReplaceableInstrsAVX512DQMasked);
9547 if (table &&
Domain == 3 && (dom == 1 || table[3] ==
MI.getOpcode()))
9550 assert(table &&
"Cannot change domain");
9576 case X86::DIVSDrm_Int:
9578 case X86::DIVSDrr_Int:
9580 case X86::DIVSSrm_Int:
9582 case X86::DIVSSrr_Int:
9588 case X86::SQRTSDm_Int:
9590 case X86::SQRTSDr_Int:
9592 case X86::SQRTSSm_Int:
9594 case X86::SQRTSSr_Int:
9598 case X86::VDIVPDYrm:
9599 case X86::VDIVPDYrr:
9602 case X86::VDIVPSYrm:
9603 case X86::VDIVPSYrr:
9605 case X86::VDIVSDrm_Int:
9607 case X86::VDIVSDrr_Int:
9609 case X86::VDIVSSrm_Int:
9611 case X86::VDIVSSrr_Int:
9614 case X86::VSQRTPDYm:
9615 case X86::VSQRTPDYr:
9618 case X86::VSQRTPSYm:
9619 case X86::VSQRTPSYr:
9621 case X86::VSQRTSDm_Int:
9623 case X86::VSQRTSDr_Int:
9625 case X86::VSQRTSSm_Int:
9627 case X86::VSQRTSSr_Int:
9629 case X86::VDIVPDZ128rm:
9630 case X86::VDIVPDZ128rmb:
9631 case X86::VDIVPDZ128rmbk:
9632 case X86::VDIVPDZ128rmbkz:
9633 case X86::VDIVPDZ128rmk:
9634 case X86::VDIVPDZ128rmkz:
9635 case X86::VDIVPDZ128rr:
9636 case X86::VDIVPDZ128rrk:
9637 case X86::VDIVPDZ128rrkz:
9638 case X86::VDIVPDZ256rm:
9639 case X86::VDIVPDZ256rmb:
9640 case X86::VDIVPDZ256rmbk:
9641 case X86::VDIVPDZ256rmbkz:
9642 case X86::VDIVPDZ256rmk:
9643 case X86::VDIVPDZ256rmkz:
9644 case X86::VDIVPDZ256rr:
9645 case X86::VDIVPDZ256rrk:
9646 case X86::VDIVPDZ256rrkz:
9647 case X86::VDIVPDZrrb:
9648 case X86::VDIVPDZrrbk:
9649 case X86::VDIVPDZrrbkz:
9650 case X86::VDIVPDZrm:
9651 case X86::VDIVPDZrmb:
9652 case X86::VDIVPDZrmbk:
9653 case X86::VDIVPDZrmbkz:
9654 case X86::VDIVPDZrmk:
9655 case X86::VDIVPDZrmkz:
9656 case X86::VDIVPDZrr:
9657 case X86::VDIVPDZrrk:
9658 case X86::VDIVPDZrrkz:
9659 case X86::VDIVPSZ128rm:
9660 case X86::VDIVPSZ128rmb:
9661 case X86::VDIVPSZ128rmbk:
9662 case X86::VDIVPSZ128rmbkz:
9663 case X86::VDIVPSZ128rmk:
9664 case X86::VDIVPSZ128rmkz:
9665 case X86::VDIVPSZ128rr:
9666 case X86::VDIVPSZ128rrk:
9667 case X86::VDIVPSZ128rrkz:
9668 case X86::VDIVPSZ256rm:
9669 case X86::VDIVPSZ256rmb:
9670 case X86::VDIVPSZ256rmbk:
9671 case X86::VDIVPSZ256rmbkz:
9672 case X86::VDIVPSZ256rmk:
9673 case X86::VDIVPSZ256rmkz:
9674 case X86::VDIVPSZ256rr:
9675 case X86::VDIVPSZ256rrk:
9676 case X86::VDIVPSZ256rrkz:
9677 case X86::VDIVPSZrrb:
9678 case X86::VDIVPSZrrbk:
9679 case X86::VDIVPSZrrbkz:
9680 case X86::VDIVPSZrm:
9681 case X86::VDIVPSZrmb:
9682 case X86::VDIVPSZrmbk:
9683 case X86::VDIVPSZrmbkz:
9684 case X86::VDIVPSZrmk:
9685 case X86::VDIVPSZrmkz:
9686 case X86::VDIVPSZrr:
9687 case X86::VDIVPSZrrk:
9688 case X86::VDIVPSZrrkz:
9689 case X86::VDIVSDZrm:
9690 case X86::VDIVSDZrr:
9691 case X86::VDIVSDZrm_Int:
9692 case X86::VDIVSDZrmk_Int:
9693 case X86::VDIVSDZrmkz_Int:
9694 case X86::VDIVSDZrr_Int:
9695 case X86::VDIVSDZrrk_Int:
9696 case X86::VDIVSDZrrkz_Int:
9697 case X86::VDIVSDZrrb_Int:
9698 case X86::VDIVSDZrrbk_Int:
9699 case X86::VDIVSDZrrbkz_Int:
9700 case X86::VDIVSSZrm:
9701 case X86::VDIVSSZrr:
9702 case X86::VDIVSSZrm_Int:
9703 case X86::VDIVSSZrmk_Int:
9704 case X86::VDIVSSZrmkz_Int:
9705 case X86::VDIVSSZrr_Int:
9706 case X86::VDIVSSZrrk_Int:
9707 case X86::VDIVSSZrrkz_Int:
9708 case X86::VDIVSSZrrb_Int:
9709 case X86::VDIVSSZrrbk_Int:
9710 case X86::VDIVSSZrrbkz_Int:
9711 case X86::VSQRTPDZ128m:
9712 case X86::VSQRTPDZ128mb:
9713 case X86::VSQRTPDZ128mbk:
9714 case X86::VSQRTPDZ128mbkz:
9715 case X86::VSQRTPDZ128mk:
9716 case X86::VSQRTPDZ128mkz:
9717 case X86::VSQRTPDZ128r:
9718 case X86::VSQRTPDZ128rk:
9719 case X86::VSQRTPDZ128rkz:
9720 case X86::VSQRTPDZ256m:
9721 case X86::VSQRTPDZ256mb:
9722 case X86::VSQRTPDZ256mbk:
9723 case X86::VSQRTPDZ256mbkz:
9724 case X86::VSQRTPDZ256mk:
9725 case X86::VSQRTPDZ256mkz:
9726 case X86::VSQRTPDZ256r:
9727 case X86::VSQRTPDZ256rk:
9728 case X86::VSQRTPDZ256rkz:
9729 case X86::VSQRTPDZm:
9730 case X86::VSQRTPDZmb:
9731 case X86::VSQRTPDZmbk:
9732 case X86::VSQRTPDZmbkz:
9733 case X86::VSQRTPDZmk:
9734 case X86::VSQRTPDZmkz:
9735 case X86::VSQRTPDZr:
9736 case X86::VSQRTPDZrb:
9737 case X86::VSQRTPDZrbk:
9738 case X86::VSQRTPDZrbkz:
9739 case X86::VSQRTPDZrk:
9740 case X86::VSQRTPDZrkz:
9741 case X86::VSQRTPSZ128m:
9742 case X86::VSQRTPSZ128mb:
9743 case X86::VSQRTPSZ128mbk:
9744 case X86::VSQRTPSZ128mbkz:
9745 case X86::VSQRTPSZ128mk:
9746 case X86::VSQRTPSZ128mkz:
9747 case X86::VSQRTPSZ128r:
9748 case X86::VSQRTPSZ128rk:
9749 case X86::VSQRTPSZ128rkz:
9750 case X86::VSQRTPSZ256m:
9751 case X86::VSQRTPSZ256mb:
9752 case X86::VSQRTPSZ256mbk:
9753 case X86::VSQRTPSZ256mbkz:
9754 case X86::VSQRTPSZ256mk:
9755 case X86::VSQRTPSZ256mkz:
9756 case X86::VSQRTPSZ256r:
9757 case X86::VSQRTPSZ256rk:
9758 case X86::VSQRTPSZ256rkz:
9759 case X86::VSQRTPSZm:
9760 case X86::VSQRTPSZmb:
9761 case X86::VSQRTPSZmbk:
9762 case X86::VSQRTPSZmbkz:
9763 case X86::VSQRTPSZmk:
9764 case X86::VSQRTPSZmkz:
9765 case X86::VSQRTPSZr:
9766 case X86::VSQRTPSZrb:
9767 case X86::VSQRTPSZrbk:
9768 case X86::VSQRTPSZrbkz:
9769 case X86::VSQRTPSZrk:
9770 case X86::VSQRTPSZrkz:
9771 case X86::VSQRTSDZm:
9772 case X86::VSQRTSDZm_Int:
9773 case X86::VSQRTSDZmk_Int:
9774 case X86::VSQRTSDZmkz_Int:
9775 case X86::VSQRTSDZr:
9776 case X86::VSQRTSDZr_Int:
9777 case X86::VSQRTSDZrk_Int:
9778 case X86::VSQRTSDZrkz_Int:
9779 case X86::VSQRTSDZrb_Int:
9780 case X86::VSQRTSDZrbk_Int:
9781 case X86::VSQRTSDZrbkz_Int:
9782 case X86::VSQRTSSZm:
9783 case X86::VSQRTSSZm_Int:
9784 case X86::VSQRTSSZmk_Int:
9785 case X86::VSQRTSSZmkz_Int:
9786 case X86::VSQRTSSZr:
9787 case X86::VSQRTSSZr_Int:
9788 case X86::VSQRTSSZrk_Int:
9789 case X86::VSQRTSSZrkz_Int:
9790 case X86::VSQRTSSZrb_Int:
9791 case X86::VSQRTSSZrbk_Int:
9792 case X86::VSQRTSSZrbkz_Int:
9794 case X86::VGATHERDPDYrm:
9795 case X86::VGATHERDPDZ128rm:
9796 case X86::VGATHERDPDZ256rm:
9797 case X86::VGATHERDPDZrm:
9798 case X86::VGATHERDPDrm:
9799 case X86::VGATHERDPSYrm:
9800 case X86::VGATHERDPSZ128rm:
9801 case X86::VGATHERDPSZ256rm:
9802 case X86::VGATHERDPSZrm:
9803 case X86::VGATHERDPSrm:
9804 case X86::VGATHERPF0DPDm:
9805 case X86::VGATHERPF0DPSm:
9806 case X86::VGATHERPF0QPDm:
9807 case X86::VGATHERPF0QPSm:
9808 case X86::VGATHERPF1DPDm:
9809 case X86::VGATHERPF1DPSm:
9810 case X86::VGATHERPF1QPDm:
9811 case X86::VGATHERPF1QPSm:
9812 case X86::VGATHERQPDYrm:
9813 case X86::VGATHERQPDZ128rm:
9814 case X86::VGATHERQPDZ256rm:
9815 case X86::VGATHERQPDZrm:
9816 case X86::VGATHERQPDrm:
9817 case X86::VGATHERQPSYrm:
9818 case X86::VGATHERQPSZ128rm:
9819 case X86::VGATHERQPSZ256rm:
9820 case X86::VGATHERQPSZrm:
9821 case X86::VGATHERQPSrm:
9822 case X86::VPGATHERDDYrm:
9823 case X86::VPGATHERDDZ128rm:
9824 case X86::VPGATHERDDZ256rm:
9825 case X86::VPGATHERDDZrm:
9826 case X86::VPGATHERDDrm:
9827 case X86::VPGATHERDQYrm:
9828 case X86::VPGATHERDQZ128rm:
9829 case X86::VPGATHERDQZ256rm:
9830 case X86::VPGATHERDQZrm:
9831 case X86::VPGATHERDQrm:
9832 case X86::VPGATHERQDYrm:
9833 case X86::VPGATHERQDZ128rm:
9834 case X86::VPGATHERQDZ256rm:
9835 case X86::VPGATHERQDZrm:
9836 case X86::VPGATHERQDrm:
9837 case X86::VPGATHERQQYrm:
9838 case X86::VPGATHERQQZ128rm:
9839 case X86::VPGATHERQQZ256rm:
9840 case X86::VPGATHERQQZrm:
9841 case X86::VPGATHERQQrm:
9842 case X86::VSCATTERDPDZ128mr:
9843 case X86::VSCATTERDPDZ256mr:
9844 case X86::VSCATTERDPDZmr:
9845 case X86::VSCATTERDPSZ128mr:
9846 case X86::VSCATTERDPSZ256mr:
9847 case X86::VSCATTERDPSZmr:
9848 case X86::VSCATTERPF0DPDm:
9849 case X86::VSCATTERPF0DPSm:
9850 case X86::VSCATTERPF0QPDm:
9851 case X86::VSCATTERPF0QPSm:
9852 case X86::VSCATTERPF1DPDm:
9853 case X86::VSCATTERPF1DPSm:
9854 case X86::VSCATTERPF1QPDm:
9855 case X86::VSCATTERPF1QPSm:
9856 case X86::VSCATTERQPDZ128mr:
9857 case X86::VSCATTERQPDZ256mr:
9858 case X86::VSCATTERQPDZmr:
9859 case X86::VSCATTERQPSZ128mr:
9860 case X86::VSCATTERQPSZ256mr:
9861 case X86::VSCATTERQPSZmr:
9862 case X86::VPSCATTERDDZ128mr:
9863 case X86::VPSCATTERDDZ256mr:
9864 case X86::VPSCATTERDDZmr:
9865 case X86::VPSCATTERDQZ128mr:
9866 case X86::VPSCATTERDQZ256mr:
9867 case X86::VPSCATTERDQZmr:
9868 case X86::VPSCATTERQDZ128mr:
9869 case X86::VPSCATTERQDZ256mr:
9870 case X86::VPSCATTERQDZmr:
9871 case X86::VPSCATTERQQZ128mr:
9872 case X86::VPSCATTERQQZ256mr:
9873 case X86::VPSCATTERQQZmr:
9883 unsigned UseIdx)
const {
9890 Inst.
getNumDefs() <= 2 &&
"Reassociation needs binary operators");
9900 assert((Inst.
getNumDefs() == 1 || FlagDef) &&
"Implicit def isn't flags?");
9901 if (FlagDef && !FlagDef->
isDead())
9912 bool Invert)
const {
9964 case X86::VPANDDZ128rr:
9965 case X86::VPANDDZ256rr:
9966 case X86::VPANDDZrr:
9967 case X86::VPANDQZ128rr:
9968 case X86::VPANDQZ256rr:
9969 case X86::VPANDQZrr:
9972 case X86::VPORDZ128rr:
9973 case X86::VPORDZ256rr:
9975 case X86::VPORQZ128rr:
9976 case X86::VPORQZ256rr:
9980 case X86::VPXORDZ128rr:
9981 case X86::VPXORDZ256rr:
9982 case X86::VPXORDZrr:
9983 case X86::VPXORQZ128rr:
9984 case X86::VPXORQZ256rr:
9985 case X86::VPXORQZrr:
9988 case X86::VANDPDYrr:
9989 case X86::VANDPSYrr:
9990 case X86::VANDPDZ128rr:
9991 case X86::VANDPSZ128rr:
9992 case X86::VANDPDZ256rr:
9993 case X86::VANDPSZ256rr:
9994 case X86::VANDPDZrr:
9995 case X86::VANDPSZrr:
10000 case X86::VORPDZ128rr:
10001 case X86::VORPSZ128rr:
10002 case X86::VORPDZ256rr:
10003 case X86::VORPSZ256rr:
10004 case X86::VORPDZrr:
10005 case X86::VORPSZrr:
10006 case X86::VXORPDrr:
10007 case X86::VXORPSrr:
10008 case X86::VXORPDYrr:
10009 case X86::VXORPSYrr:
10010 case X86::VXORPDZ128rr:
10011 case X86::VXORPSZ128rr:
10012 case X86::VXORPDZ256rr:
10013 case X86::VXORPSZ256rr:
10014 case X86::VXORPDZrr:
10015 case X86::VXORPSZrr:
10032 case X86::VPADDBrr:
10033 case X86::VPADDWrr:
10034 case X86::VPADDDrr:
10035 case X86::VPADDQrr:
10036 case X86::VPADDBYrr:
10037 case X86::VPADDWYrr:
10038 case X86::VPADDDYrr:
10039 case X86::VPADDQYrr:
10040 case X86::VPADDBZ128rr:
10041 case X86::VPADDWZ128rr:
10042 case X86::VPADDDZ128rr:
10043 case X86::VPADDQZ128rr:
10044 case X86::VPADDBZ256rr:
10045 case X86::VPADDWZ256rr:
10046 case X86::VPADDDZ256rr:
10047 case X86::VPADDQZ256rr:
10048 case X86::VPADDBZrr:
10049 case X86::VPADDWZrr:
10050 case X86::VPADDDZrr:
10051 case X86::VPADDQZrr:
10052 case X86::VPMULLWrr:
10053 case X86::VPMULLWYrr:
10054 case X86::VPMULLWZ128rr:
10055 case X86::VPMULLWZ256rr:
10056 case X86::VPMULLWZrr:
10057 case X86::VPMULLDrr:
10058 case X86::VPMULLDYrr:
10059 case X86::VPMULLDZ128rr:
10060 case X86::VPMULLDZ256rr:
10061 case X86::VPMULLDZrr:
10062 case X86::VPMULLQZ128rr:
10063 case X86::VPMULLQZ256rr:
10064 case X86::VPMULLQZrr:
10065 case X86::VPMAXSBrr:
10066 case X86::VPMAXSBYrr:
10067 case X86::VPMAXSBZ128rr:
10068 case X86::VPMAXSBZ256rr:
10069 case X86::VPMAXSBZrr:
10070 case X86::VPMAXSDrr:
10071 case X86::VPMAXSDYrr:
10072 case X86::VPMAXSDZ128rr:
10073 case X86::VPMAXSDZ256rr:
10074 case X86::VPMAXSDZrr:
10075 case X86::VPMAXSQZ128rr:
10076 case X86::VPMAXSQZ256rr:
10077 case X86::VPMAXSQZrr:
10078 case X86::VPMAXSWrr:
10079 case X86::VPMAXSWYrr:
10080 case X86::VPMAXSWZ128rr:
10081 case X86::VPMAXSWZ256rr:
10082 case X86::VPMAXSWZrr:
10083 case X86::VPMAXUBrr:
10084 case X86::VPMAXUBYrr:
10085 case X86::VPMAXUBZ128rr:
10086 case X86::VPMAXUBZ256rr:
10087 case X86::VPMAXUBZrr:
10088 case X86::VPMAXUDrr:
10089 case X86::VPMAXUDYrr:
10090 case X86::VPMAXUDZ128rr:
10091 case X86::VPMAXUDZ256rr:
10092 case X86::VPMAXUDZrr:
10093 case X86::VPMAXUQZ128rr:
10094 case X86::VPMAXUQZ256rr:
10095 case X86::VPMAXUQZrr:
10096 case X86::VPMAXUWrr:
10097 case X86::VPMAXUWYrr:
10098 case X86::VPMAXUWZ128rr:
10099 case X86::VPMAXUWZ256rr:
10100 case X86::VPMAXUWZrr:
10101 case X86::VPMINSBrr:
10102 case X86::VPMINSBYrr:
10103 case X86::VPMINSBZ128rr:
10104 case X86::VPMINSBZ256rr:
10105 case X86::VPMINSBZrr:
10106 case X86::VPMINSDrr:
10107 case X86::VPMINSDYrr:
10108 case X86::VPMINSDZ128rr:
10109 case X86::VPMINSDZ256rr:
10110 case X86::VPMINSDZrr:
10111 case X86::VPMINSQZ128rr:
10112 case X86::VPMINSQZ256rr:
10113 case X86::VPMINSQZrr:
10114 case X86::VPMINSWrr:
10115 case X86::VPMINSWYrr:
10116 case X86::VPMINSWZ128rr:
10117 case X86::VPMINSWZ256rr:
10118 case X86::VPMINSWZrr:
10119 case X86::VPMINUBrr:
10120 case X86::VPMINUBYrr:
10121 case X86::VPMINUBZ128rr:
10122 case X86::VPMINUBZ256rr:
10123 case X86::VPMINUBZrr:
10124 case X86::VPMINUDrr:
10125 case X86::VPMINUDYrr:
10126 case X86::VPMINUDZ128rr:
10127 case X86::VPMINUDZ256rr:
10128 case X86::VPMINUDZrr:
10129 case X86::VPMINUQZ128rr:
10130 case X86::VPMINUQZ256rr:
10131 case X86::VPMINUQZrr:
10132 case X86::VPMINUWrr:
10133 case X86::VPMINUWYrr:
10134 case X86::VPMINUWZ128rr:
10135 case X86::VPMINUWZ256rr:
10136 case X86::VPMINUWZrr:
10140 case X86::MAXCPDrr:
10141 case X86::MAXCPSrr:
10142 case X86::MAXCSDrr:
10143 case X86::MAXCSSrr:
10144 case X86::MINCPDrr:
10145 case X86::MINCPSrr:
10146 case X86::MINCSDrr:
10147 case X86::MINCSSrr:
10148 case X86::VMAXCPDrr:
10149 case X86::VMAXCPSrr:
10150 case X86::VMAXCPDYrr:
10151 case X86::VMAXCPSYrr:
10152 case X86::VMAXCPDZ128rr:
10153 case X86::VMAXCPSZ128rr:
10154 case X86::VMAXCPDZ256rr:
10155 case X86::VMAXCPSZ256rr:
10156 case X86::VMAXCPDZrr:
10157 case X86::VMAXCPSZrr:
10158 case X86::VMAXCSDrr:
10159 case X86::VMAXCSSrr:
10160 case X86::VMAXCSDZrr:
10161 case X86::VMAXCSSZrr:
10162 case X86::VMINCPDrr:
10163 case X86::VMINCPSrr:
10164 case X86::VMINCPDYrr:
10165 case X86::VMINCPSYrr:
10166 case X86::VMINCPDZ128rr:
10167 case X86::VMINCPSZ128rr:
10168 case X86::VMINCPDZ256rr:
10169 case X86::VMINCPSZ256rr:
10170 case X86::VMINCPDZrr:
10171 case X86::VMINCPSZrr:
10172 case X86::VMINCSDrr:
10173 case X86::VMINCSSrr:
10174 case X86::VMINCSDZrr:
10175 case X86::VMINCSSZrr:
10176 case X86::VMAXCPHZ128rr:
10177 case X86::VMAXCPHZ256rr:
10178 case X86::VMAXCPHZrr:
10179 case X86::VMAXCSHZrr:
10180 case X86::VMINCPHZ128rr:
10181 case X86::VMINCPHZ256rr:
10182 case X86::VMINCPHZrr:
10183 case X86::VMINCSHZrr:
10193 case X86::VADDPDrr:
10194 case X86::VADDPSrr:
10195 case X86::VADDPDYrr:
10196 case X86::VADDPSYrr:
10197 case X86::VADDPDZ128rr:
10198 case X86::VADDPSZ128rr:
10199 case X86::VADDPDZ256rr:
10200 case X86::VADDPSZ256rr:
10201 case X86::VADDPDZrr:
10202 case X86::VADDPSZrr:
10203 case X86::VADDSDrr:
10204 case X86::VADDSSrr:
10205 case X86::VADDSDZrr:
10206 case X86::VADDSSZrr:
10207 case X86::VMULPDrr:
10208 case X86::VMULPSrr:
10209 case X86::VMULPDYrr:
10210 case X86::VMULPSYrr:
10211 case X86::VMULPDZ128rr:
10212 case X86::VMULPSZ128rr:
10213 case X86::VMULPDZ256rr:
10214 case X86::VMULPSZ256rr:
10215 case X86::VMULPDZrr:
10216 case X86::VMULPSZrr:
10217 case X86::VMULSDrr:
10218 case X86::VMULSSrr:
10219 case X86::VMULSDZrr:
10220 case X86::VMULSSZrr:
10221 case X86::VADDPHZ128rr:
10222 case X86::VADDPHZ256rr:
10223 case X86::VADDPHZrr:
10224 case X86::VADDSHZrr:
10225 case X86::VMULPHZ128rr:
10226 case X86::VMULPHZ256rr:
10227 case X86::VMULPHZrr:
10228 case X86::VMULSHZrr:
10239static std::optional<ParamLoadedValue>
10242 Register DestReg =
MI.getOperand(0).getReg();
10243 Register SrcReg =
MI.getOperand(1).getReg();
10248 if (DestReg == DescribedReg)
10253 if (
unsigned SubRegIdx =
TRI->getSubRegIndex(DestReg, DescribedReg)) {
10254 Register SrcSubReg =
TRI->getSubReg(SrcReg, SubRegIdx);
10264 if (
MI.getOpcode() == X86::MOV8rr ||
MI.getOpcode() == X86::MOV16rr ||
10265 !
TRI->isSuperRegister(DestReg, DescribedReg))
10266 return std::nullopt;
10268 assert(
MI.getOpcode() == X86::MOV32rr &&
"Unexpected super-register case");
10272std::optional<ParamLoadedValue>
10279 switch (
MI.getOpcode()) {
10282 case X86::LEA64_32r: {
10284 if (!
TRI->isSuperRegisterEq(
MI.getOperand(0).getReg(), Reg))
10285 return std::nullopt;
10289 if (!
MI.getOperand(4).isImm() || !
MI.getOperand(2).isImm())
10290 return std::nullopt;
10299 if ((Op1.
isReg() && Op1.
getReg() ==
MI.getOperand(0).getReg()) ||
10300 Op2.
getReg() ==
MI.getOperand(0).getReg())
10301 return std::nullopt;
10302 else if ((Op1.
isReg() && Op1.
getReg() != X86::NoRegister &&
10303 TRI->regsOverlap(Op1.
getReg(),
MI.getOperand(0).getReg())) ||
10304 (Op2.
getReg() != X86::NoRegister &&
10305 TRI->regsOverlap(Op2.
getReg(),
MI.getOperand(0).getReg())))
10306 return std::nullopt;
10308 int64_t Coef =
MI.getOperand(2).getImm();
10309 int64_t
Offset =
MI.getOperand(4).getImm();
10312 if ((Op1.
isReg() && Op1.
getReg() != X86::NoRegister)) {
10314 }
else if (Op1.
isFI())
10317 if (
Op &&
Op->isReg() &&
Op->getReg() == Op2.
getReg() && Coef > 0) {
10318 Ops.push_back(dwarf::DW_OP_constu);
10319 Ops.push_back(Coef + 1);
10320 Ops.push_back(dwarf::DW_OP_mul);
10322 if (
Op && Op2.
getReg() != X86::NoRegister) {
10323 int dwarfReg =
TRI->getDwarfRegNum(Op2.
getReg(),
false);
10325 return std::nullopt;
10326 else if (dwarfReg < 32) {
10327 Ops.push_back(dwarf::DW_OP_breg0 + dwarfReg);
10330 Ops.push_back(dwarf::DW_OP_bregx);
10331 Ops.push_back(dwarfReg);
10341 Ops.push_back(dwarf::DW_OP_constu);
10342 Ops.push_back(Coef);
10343 Ops.push_back(dwarf::DW_OP_mul);
10346 if (((Op1.
isReg() && Op1.
getReg() != X86::NoRegister) || Op1.
isFI()) &&
10347 Op2.
getReg() != X86::NoRegister) {
10348 Ops.push_back(dwarf::DW_OP_plus);
10360 return std::nullopt;
10363 case X86::MOV64ri32:
10366 if (!
TRI->isSuperRegisterEq(
MI.getOperand(0).getReg(), Reg))
10367 return std::nullopt;
10374 case X86::XOR32rr: {
10377 if (!
TRI->isSuperRegisterEq(
MI.getOperand(0).getReg(), Reg))
10378 return std::nullopt;
10379 if (
MI.getOperand(1).getReg() ==
MI.getOperand(2).getReg())
10381 return std::nullopt;
10383 case X86::MOVSX64rr32: {
10390 if (!
TRI->isSubRegisterEq(
MI.getOperand(0).getReg(), Reg))
10391 return std::nullopt;
10400 if (Reg ==
MI.getOperand(0).getReg())
10403 assert(getX86MCRegisterClass(X86::GR32RegClassID).
contains(Reg) &&
10404 "Unhandled sub-register case for MOVSX64rr32");
10409 assert(!
MI.isMoveImmediate() &&
"Unexpected MoveImm instruction");
10426 assert(!OldFlagDef1 == !OldFlagDef2 &&
10427 "Unexpected instruction type for reassociation");
10429 if (!OldFlagDef1 || !OldFlagDef2)
10433 "Must have dead EFLAGS operand in reassociable instruction");
10440 assert(NewFlagDef1 && NewFlagDef2 &&
10441 "Unexpected operand in reassociable instruction");
10451std::pair<unsigned, unsigned>
10453 return std::make_pair(TF, 0u);
10458 using namespace X86II;
10459 static const std::pair<unsigned, const char *> TargetFlags[] = {
10460 {MO_GOT_ABSOLUTE_ADDRESS,
"x86-got-absolute-address"},
10461 {MO_PIC_BASE_OFFSET,
"x86-pic-base-offset"},
10462 {MO_GOT,
"x86-got"},
10463 {MO_GOTOFF,
"x86-gotoff"},
10464 {MO_GOTPCREL,
"x86-gotpcrel"},
10465 {MO_GOTPCREL_NORELAX,
"x86-gotpcrel-norelax"},
10466 {MO_PLT,
"x86-plt"},
10467 {MO_TLSGD,
"x86-tlsgd"},
10468 {MO_TLSLD,
"x86-tlsld"},
10469 {MO_TLSLDM,
"x86-tlsldm"},
10470 {MO_GOTTPOFF,
"x86-gottpoff"},
10471 {MO_INDNTPOFF,
"x86-indntpoff"},
10472 {MO_TPOFF,
"x86-tpoff"},
10473 {MO_DTPOFF,
"x86-dtpoff"},
10474 {MO_NTPOFF,
"x86-ntpoff"},
10475 {MO_GOTNTPOFF,
"x86-gotntpoff"},
10476 {MO_DLLIMPORT,
"x86-dllimport"},
10477 {MO_DARWIN_NONLAZY,
"x86-darwin-nonlazy"},
10478 {MO_DARWIN_NONLAZY_PIC_BASE,
"x86-darwin-nonlazy-pic-base"},
10479 {MO_TLVP,
"x86-tlvp"},
10480 {MO_TLVP_PIC_BASE,
"x86-tlvp-pic-base"},
10481 {MO_SECREL,
"x86-secrel"},
10482 {MO_COFFSTUB,
"x86-coffstub"}};
10516std::optional<std::unique_ptr<outliner::OutlinedFunction>>
10519 std::vector<outliner::Candidate> &RepeatedSequenceLocs,
10520 unsigned MinRepeats)
const {
10521 unsigned SequenceSize = 0;
10522 for (
auto &
MI : RepeatedSequenceLocs[0]) {
10526 if (
MI.isDebugInstr() ||
MI.isKill())
10533 unsigned CFICount = 0;
10534 for (
auto &
I : RepeatedSequenceLocs[0]) {
10535 if (
I.isCFIInstruction())
10545 std::vector<MCCFIInstruction> CFIInstructions =
10546 C.getMF()->getFrameInstructions();
10548 if (CFICount > 0 && CFICount != CFIInstructions.size())
10549 return std::nullopt;
10553 if (RepeatedSequenceLocs[0].back().isTerminator()) {
10557 return std::make_unique<outliner::OutlinedFunction>(
10558 RepeatedSequenceLocs, SequenceSize,
10565 return std::nullopt;
10570 return std::make_unique<outliner::OutlinedFunction>(
10580 if (Subtarget.getFrameLowering()->has128ByteRedZone(MF)) {
10589 if (!OutlineFromLinkOnceODRs &&
F.hasLinkOnceODRLinkage())
10599 unsigned Flags)
const {
10603 if (
MI.isTerminator())
10617 if (
MI.modifiesRegister(X86::RSP, &RI) ||
MI.readsRegister(X86::RSP, &RI) ||
10618 MI.getDesc().hasImplicitUseOfPhysReg(X86::RSP) ||
10619 MI.getDesc().hasImplicitDefOfPhysReg(X86::RSP))
10623 if (
MI.readsRegister(X86::RIP, &RI) ||
10624 MI.getDesc().hasImplicitUseOfPhysReg(X86::RIP) ||
10625 MI.getDesc().hasImplicitDefOfPhysReg(X86::RIP))
10629 if (
MI.isCFIInstruction())
10645 MBB.insert(
MBB.end(), retq);
10655 .addGlobalAddress(M.getNamedValue(MF.
getName())));
10659 .addGlobalAddress(M.getNamedValue(MF.
getName())));
10668 bool AllowSideEffects)
const {
10673 if (ST.hasMMX() && X86::VR64RegClass.contains(Reg))
10677 if (
TRI.isGeneralPurposeRegister(MF, Reg)) {
10682 if (!AllowSideEffects)
10689 }
else if (X86::VR128RegClass.
contains(Reg)) {
10695 }
else if (X86::VR256RegClass.
contains(Reg)) {
10701 }
else if (X86::VR512RegClass.
contains(Reg)) {
10703 if (!ST.hasAVX512())
10707 }
else if (X86::VK1RegClass.
contains(Reg) || X86::VK2RegClass.
contains(Reg) ||
10709 X86::VK16RegClass.
contains(Reg)) {
10713 unsigned Op = ST.hasBWI() ? X86::KSET0Q : X86::KSET0W;
10720 bool DoRegPressureReduce)
const {
10723 case X86::VPDPWSSDrr:
10724 case X86::VPDPWSSDrm:
10725 case X86::VPDPWSSDYrr:
10726 case X86::VPDPWSSDYrm: {
10727 if (!Subtarget.hasFastDPWSSD()) {
10733 case X86::VPDPWSSDZ128rr:
10734 case X86::VPDPWSSDZ128rm:
10735 case X86::VPDPWSSDZ256rr:
10736 case X86::VPDPWSSDZ256rm:
10737 case X86::VPDPWSSDZrr:
10738 case X86::VPDPWSSDZrm: {
10739 if (Subtarget.hasBWI() && !Subtarget.hasFastDPWSSD()) {
10747 Patterns, DoRegPressureReduce);
10759 unsigned AddOpc = 0;
10760 unsigned MaddOpc = 0;
10763 assert(
false &&
"It should not reach here");
10769 case X86::VPDPWSSDrr:
10770 MaddOpc = X86::VPMADDWDrr;
10771 AddOpc = X86::VPADDDrr;
10773 case X86::VPDPWSSDrm:
10774 MaddOpc = X86::VPMADDWDrm;
10775 AddOpc = X86::VPADDDrr;
10777 case X86::VPDPWSSDZ128rr:
10778 MaddOpc = X86::VPMADDWDZ128rr;
10779 AddOpc = X86::VPADDDZ128rr;
10781 case X86::VPDPWSSDZ128rm:
10782 MaddOpc = X86::VPMADDWDZ128rm;
10783 AddOpc = X86::VPADDDZ128rr;
10789 case X86::VPDPWSSDYrr:
10790 MaddOpc = X86::VPMADDWDYrr;
10791 AddOpc = X86::VPADDDYrr;
10793 case X86::VPDPWSSDYrm:
10794 MaddOpc = X86::VPMADDWDYrm;
10795 AddOpc = X86::VPADDDYrr;
10797 case X86::VPDPWSSDZ256rr:
10798 MaddOpc = X86::VPMADDWDZ256rr;
10799 AddOpc = X86::VPADDDZ256rr;
10801 case X86::VPDPWSSDZ256rm:
10802 MaddOpc = X86::VPMADDWDZ256rm;
10803 AddOpc = X86::VPADDDZ256rr;
10809 case X86::VPDPWSSDZrr:
10810 MaddOpc = X86::VPMADDWDZrr;
10811 AddOpc = X86::VPADDDZrr;
10813 case X86::VPDPWSSDZrm:
10814 MaddOpc = X86::VPMADDWDZrm;
10815 AddOpc = X86::VPADDDZrr;
10827 InstrIdxForVirtReg.
insert(std::make_pair(NewReg, 0));
10849 DelInstrs, InstrIdxForVirtReg);
10853 InstrIdxForVirtReg);
10863 M.Base.FrameIndex = FI;
10864 M.getFullAddress(
Ops);
10873 get(X86::PREFETCHIT1),
10874 InsertBefore ==
MBB.instr_end() ?
MBB.findPrevDebugLoc(InsertBefore)
10875 : InsertBefore->getDebugLoc(),
10883 MIB.
addReg(X86::NoRegister);
10884 MBB.insert(InsertBefore, PrefetchInstr);
10885 return PrefetchInstr;
10888#define GET_INSTRINFO_HELPERS
10889#include "X86GenInstrInfo.inc"
MachineInstrBuilder & UseMI
MachineInstrBuilder MachineInstrBuilder & DefMI
static bool isFrameStoreOpcode(int Opcode)
static bool isFrameLoadOpcode(int Opcode)
MachineOutlinerClass
Constants defining how certain sequences should be outlined.
@ MachineOutlinerTailCall
Emit a save, restore, call, and return.
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
MachineBasicBlock MachineBasicBlock::iterator MBBI
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
DXIL Forward Handle Accesses
const HexagonInstrInfo * TII
Module.h This file contains the declarations for the Module class.
static bool lookup(const GsymReader &GR, GsymDataExtractor &Data, uint64_t &Offset, uint64_t BaseAddr, uint64_t Addr, SourceLocations &SrcLocs, llvm::Error &Err)
A Lookup helper functions.
const size_t AbstractManglingParser< Derived, Alloc >::NumOps
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
This file implements the LivePhysRegs utility for tracking liveness of physical registers.
static SDValue isNOT(SDValue V, SelectionDAG &DAG)
static bool Expand2AddrUndef(MachineInstrBuilder &MIB, const MCInstrDesc &Desc)
Expand a single-def pseudo instruction to a two-addr instruction with two undef reads of the register...
This file declares the MachineConstantPool class which is an abstract constant pool to keep track of ...
Register const TargetRegisterInfo * TRI
Promote Memory to Register
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
static bool contains(SmallPtrSetImpl< ConstantExpr * > &Cache, ConstantExpr *Expr, Constant *C)
Provides some synthesis utilities to produce sequences of values.
static SPCC::CondCodes GetOppositeBranchCondition(SPCC::CondCodes CC)
#define FROM_TO(FROM, TO)
cl::opt< bool > X86EnableAPXForRelocation
static bool is64Bit(const char *name)
#define GET_EGPR_IF_ENABLED(OPC)
static bool isLEA(unsigned Opcode)
static void addOperands(MachineInstrBuilder &MIB, ArrayRef< MachineOperand > MOs, int PtrOffset=0)
static std::optional< ParamLoadedValue > describeMOVrrLoadedValue(const MachineInstr &MI, Register DescribedReg, const TargetRegisterInfo *TRI)
If DescribedReg overlaps with the MOVrr instruction's destination register then, if possible,...
static cl::opt< unsigned > PartialRegUpdateClearance("partial-reg-update-clearance", cl::desc("Clearance between two register writes " "for inserting XOR to avoid partial " "register update"), cl::init(64), cl::Hidden)
static bool shouldPreventUndefRegUpdateMemFold(MachineFunction &MF, MachineInstr &MI)
static unsigned CopyToFromAsymmetricReg(Register DestReg, Register SrcReg, const X86Subtarget &Subtarget)
static bool isConvertibleLEA(MachineInstr *MI)
static bool ExpandMOVImmSExti8(MachineInstrBuilder &MIB, const TargetInstrInfo &TII, const X86Subtarget &Subtarget)
static bool isAMXOpcode(unsigned Opc)
static int getJumpTableIndexFromReg(const MachineRegisterInfo &MRI, Register Reg)
static void updateOperandRegConstraints(MachineFunction &MF, MachineInstr &NewMI, const TargetInstrInfo &TII)
static int getJumpTableIndexFromAddr(const MachineInstr &MI)
static bool AdjustBlendMask(unsigned OldMask, unsigned OldWidth, unsigned NewWidth, unsigned *pNewMask=nullptr)
static bool expandMOV32r1(MachineInstrBuilder &MIB, const TargetInstrInfo &TII, bool MinusOne)
static unsigned getNewOpcFromTable(ArrayRef< X86TableEntry > Table, unsigned Opc)
static unsigned getStoreRegOpcode(Register SrcReg, const TargetRegisterClass *RC, bool IsStackAligned, const X86Subtarget &STI)
#define FOLD_BROADCAST(SIZE)
static cl::opt< unsigned > UndefRegClearance("undef-reg-clearance", cl::desc("How many idle instructions we would like before " "certain undef register reads"), cl::init(128), cl::Hidden)
#define CASE_BCAST_TYPE_OPC(TYPE, OP16, OP32, OP64)
static bool isTruncatedShiftCountForLEA(unsigned ShAmt)
Check whether the given shift count is appropriate can be represented by a LEA instruction.
static cl::opt< bool > ReMatPICStubLoad("remat-pic-stub-load", cl::desc("Re-materialize load from stub in PIC mode"), cl::init(false), cl::Hidden)
static SmallVector< MachineMemOperand *, 2 > extractLoadMMOs(ArrayRef< MachineMemOperand * > MMOs, MachineFunction &MF)
static MachineInstr * fuseTwoAddrInst(MachineFunction &MF, unsigned Opcode, ArrayRef< MachineOperand > MOs, MachineBasicBlock::iterator InsertPt, MachineInstr &MI, const TargetInstrInfo &TII)
static void printFailMsgforFold(const MachineInstr &MI, unsigned Idx)
static bool canConvert2Copy(unsigned Opc)
static cl::opt< bool > NoFusing("disable-spill-fusing", cl::desc("Disable fusing of spill code into instructions"), cl::Hidden)
static bool expandNOVLXStore(MachineInstrBuilder &MIB, const TargetRegisterInfo *TRI, const MCInstrDesc &StoreDesc, const MCInstrDesc &ExtractDesc, unsigned SubIdx)
static bool isX87Reg(Register Reg)
Return true if the Reg is X87 register.
static bool Expand2AddrKreg(MachineInstrBuilder &MIB, const MCInstrDesc &Desc, Register Reg)
Expand a single-def pseudo instruction to a two-addr instruction with two k0 reads.
#define VPERM_CASES_BROADCAST(Suffix)
static std::pair< X86::CondCode, unsigned > isUseDefConvertible(const MachineInstr &MI)
Check whether the use can be converted to remove a comparison against zero.
static bool findRedundantFlagInstr(MachineInstr &CmpInstr, MachineInstr &CmpValDefInstr, const MachineRegisterInfo *MRI, MachineInstr **AndInstr, const TargetRegisterInfo *TRI, const X86Subtarget &ST, bool &NoSignFlag, bool &ClearsOverflowFlag)
static bool expandSHXDROT(MachineInstrBuilder &MIB, const MCInstrDesc &Desc)
static unsigned getLoadRegOpcode(Register DestReg, const TargetRegisterClass *RC, bool IsStackAligned, const X86Subtarget &STI)
static void expandLoadStackGuard(MachineInstrBuilder &MIB, const TargetInstrInfo &TII)
static bool hasUndefRegUpdate(unsigned Opcode, unsigned OpNum, bool ForLoadFold=false)
static MachineInstr * makeM0Inst(const TargetInstrInfo &TII, unsigned Opcode, ArrayRef< MachineOperand > MOs, MachineBasicBlock::iterator InsertPt, MachineInstr &MI)
#define GET_ND_IF_ENABLED(OPC)
static bool expandMOVSHP(MachineInstrBuilder &MIB, MachineInstr &MI, const TargetInstrInfo &TII, bool HasAVX)
static bool hasPartialRegUpdate(unsigned Opcode, const X86Subtarget &Subtarget, bool ForLoadFold=false)
Return true for all instructions that only update the first 32 or 64-bits of the destination register...
static const uint16_t * lookupAVX512(unsigned opcode, unsigned domain, ArrayRef< uint16_t[4]> Table)
static unsigned getLoadStoreRegOpcode(Register Reg, const TargetRegisterClass *RC, bool IsStackAligned, const X86Subtarget &STI, bool Load)
#define VPERM_CASES(Suffix)
#define FROM_TO_SIZE(A, B, S)
static void commuteVPTERNLOG(MachineInstr &MI, unsigned SrcOpIdx1, unsigned SrcOpIdx2)
static bool isDefConvertible(const MachineInstr &MI, bool &NoSignFlag, bool &ClearsOverflowFlag)
Check whether the definition can be converted to remove a comparison against zero.
static MachineInstr * fuseInst(MachineFunction &MF, unsigned Opcode, unsigned OpNo, ArrayRef< MachineOperand > MOs, MachineBasicBlock::iterator InsertPt, MachineInstr &MI, const TargetInstrInfo &TII, int PtrOffset=0)
static X86::CondCode getSwappedCondition(X86::CondCode CC)
Assuming the flags are set by MI(a,b), return the condition code if we modify the instructions such t...
static unsigned getCommutedVPERMV3Opcode(unsigned Opcode)
static bool expandXorFP(MachineInstrBuilder &MIB, const TargetInstrInfo &TII)
static MachineBasicBlock * getFallThroughMBB(MachineBasicBlock *MBB, MachineBasicBlock *TBB)
static bool isNonFoldablePartialRegisterLoad(const MachineInstr &LoadMI, const MachineInstr &UserMI, const MachineFunction &MF)
Check if LoadMI is a partial register load that we can't fold into MI because the latter uses content...
static unsigned getLoadStoreOpcodeForFP16(bool Load, const X86Subtarget &STI)
static bool isHReg(Register Reg)
Test if the given register is a physical h register.
static cl::opt< bool > PrintFailedFusing("print-failed-fuse-candidates", cl::desc("Print instructions that the allocator wants to" " fuse, but the X86 backend currently can't"), cl::Hidden)
static bool expandNOVLXLoad(MachineInstrBuilder &MIB, const TargetRegisterInfo *TRI, const MCInstrDesc &LoadDesc, const MCInstrDesc &BroadcastDesc, unsigned SubIdx)
static void genAlternativeDpCodeSequence(MachineInstr &Root, const TargetInstrInfo &TII, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg)
static unsigned getThreeSrcCommuteCase(uint64_t TSFlags, unsigned SrcOpIdx1, unsigned SrcOpIdx2)
This determines which of three possible cases of a three source commute the source indexes correspond...
static unsigned getTruncatedShiftCount(const MachineInstr &MI, unsigned ShiftAmtOperandIdx)
Check whether the shift count for a machine operand is non-zero.
static SmallVector< MachineMemOperand *, 2 > extractStoreMMOs(ArrayRef< MachineMemOperand * > MMOs, MachineFunction &MF)
static unsigned getBroadcastOpcode(const X86FoldTableEntry *I, const TargetRegisterClass *RC, const X86Subtarget &STI)
static unsigned convertALUrr2ALUri(unsigned Opc)
Convert an ALUrr opcode to corresponding ALUri opcode.
static bool regIsPICBase(Register BaseReg, const MachineRegisterInfo &MRI)
Return true if register is PIC base; i.e.g defined by X86::MOVPC32r.
static bool isCommutableVPERMV3Instruction(unsigned Opcode)
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Represent a constant reference to an array (0 or more elements consecutively in memory),...
size_t size() const
Get the array size.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
@ FCMP_OEQ
0 0 0 1 True if ordered and equal
@ ICMP_SLT
signed less than
@ ICMP_SLE
signed less or equal
@ FCMP_OLT
0 1 0 0 True if ordered and less than
@ FCMP_ULE
1 1 0 1 True if unordered, less than, or equal
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
@ FCMP_OGE
0 0 1 1 True if ordered and greater than or equal
@ ICMP_UGE
unsigned greater or equal
@ ICMP_UGT
unsigned greater than
@ ICMP_SGT
signed greater than
@ FCMP_ULT
1 1 0 0 True if unordered or less than
@ FCMP_ONE
0 1 1 0 True if ordered and operands are unequal
@ FCMP_UEQ
1 0 0 1 True if unordered or equal
@ ICMP_ULT
unsigned less than
@ FCMP_UGT
1 0 1 0 True if unordered or greater than
@ FCMP_OLE
0 1 0 1 True if ordered and less than or equal
@ FCMP_ORD
0 1 1 1 True if ordered (no nans)
@ ICMP_SGE
signed greater or equal
@ FCMP_UNE
1 1 1 0 True if unordered or not equal
@ ICMP_ULE
unsigned less or equal
@ FCMP_UGE
1 0 1 1 True if unordered, greater than, or equal
@ FCMP_UNO
1 0 0 0 True if unordered: isnan(X) | isnan(Y)
This is an important base class in LLVM.
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
static LLVM_ABI void appendOffset(SmallVectorImpl< uint64_t > &Ops, int64_t Offset)
Append Ops with operations to apply the Offset.
static LLVM_ABI DIExpression * appendExt(const DIExpression *Expr, unsigned FromSize, unsigned ToSize, bool Signed)
Append a zero- or sign-extension to Expr.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
bool hasOptSize() const
Optimize this function for size (-Os) or minimum size (-Oz).
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
LLVMContext & getContext() const
getContext - Return a reference to the LLVMContext associated with this function.
LiveInterval - This class represents the liveness of a register, or stack slot.
SlotIndex InsertMachineInstrInMaps(MachineInstr &MI)
SlotIndex getInstructionIndex(const MachineInstr &Instr) const
Returns the base index of the given instruction.
LiveInterval & getInterval(Register Reg)
SlotIndex ReplaceMachineInstrInMaps(MachineInstr &MI, MachineInstr &NewMI)
A set of physical registers with utility functions to track liveness when walking backward/forward th...
const Segment * getSegmentContaining(SlotIndex Idx) const
Return the segment that contains the specified index, or null if there is none.
LLVM_ABI void replaceKillInstruction(Register Reg, MachineInstr &OldMI, MachineInstr &NewMI)
replaceKillInstruction - Update register kill info by replacing a kill instruction with a new one.
LLVM_ABI VarInfo & getVarInfo(Register Reg)
getVarInfo - Return the VarInfo structure for the specified VIRTUAL register.
static LocationSize precise(uint64_t Value)
bool usesWindowsCFI() const
static MCCFIInstruction createAdjustCfaOffset(MCSymbol *L, int64_t Adjustment, SMLoc Loc={})
.cfi_adjust_cfa_offset Same as .cfi_def_cfa_offset, but Offset is a relative value that is added/subt...
Instances of this class represent a single low-level machine instruction.
void setOpcode(unsigned Op)
Describe properties that are true of each instruction in the target description file.
This holds information about one operand of a machine instruction, indicating the register class for ...
Wrapper class representing physical registers. Should be passed by value.
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
MachineInstrBundleIterator< const MachineInstr > const_iterator
void push_back(MachineInstr *MI)
MachineInstr * remove(MachineInstr *I)
Remove the unbundled instruction from the instruction list without deleting it.
MachineInstrBundleIterator< MachineInstr, true > reverse_iterator
LLVM_ABI bool isLayoutSuccessor(const MachineBasicBlock *MBB) const
Return true if the specified MBB will be emitted immediately after this block, such that if this bloc...
LLVM_ABI void eraseFromParent()
This method unlinks 'this' from the containing function and deletes it.
LLVM_ABI instr_iterator erase(instr_iterator I)
Remove an instruction from the instruction list and delete it.
iterator_range< succ_iterator > successors()
MachineInstrBundleIterator< MachineInstr > iterator
@ LQR_Dead
Register is known to be fully dead.
This class is a data container for one entry in a MachineConstantPool.
union llvm::MachineConstantPoolEntry::@004270020304201266316354007027341142157160323045 Val
The constant itself.
bool isMachineConstantPoolEntry() const
isMachineConstantPoolEntry - Return true if the MachineConstantPoolEntry is indeed a target specific ...
const Constant * ConstVal
The MachineConstantPool class keeps track of constants referenced by a function which must be spilled...
LLVM_ABI unsigned getConstantPoolIndex(const Constant *C, Align Alignment)
getConstantPoolIndex - Create a new entry in the constant pool or return an existing one.
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
Align getObjectAlign(int ObjectIdx) const
Return the alignment of the specified stack object.
int64_t getObjectSize(int ObjectIdx) const
Return the size of the specified object.
bool isFixedObjectIndex(int ObjectIdx) const
Returns true if the specified index corresponds to a fixed stack object.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
bool needsFrameMoves() const
True if this function needs frame moves for debug or exceptions.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
MachineConstantPool * getConstantPool()
getConstantPool - Return the constant pool object for the current function.
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
Register getReg(unsigned Idx) const
Get the register for the operand index.
const MachineInstrBuilder & setMemRefs(ArrayRef< MachineMemOperand * > MMOs) const
const MachineInstrBuilder & addReg(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & setMIFlag(MachineInstr::MIFlag Flag) const
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & add(const MachineOperand &MO) const
const MachineInstrBuilder & addGlobalAddress(const GlobalValue *GV, int64_t Offset=0, unsigned TargetFlags=0) const
const MachineInstrBuilder & addDisp(const MachineOperand &Disp, int64_t off, unsigned char TargetFlags=0) const
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
const MachineInstrBuilder & copyImplicitOps(const MachineInstr &OtherMI) const
Copy all the implicit operands from OtherMI onto this one.
const MachineInstrBuilder & addMemOperand(MachineMemOperand *MMO) const
MachineInstr * getInstr() const
If conversion operators fail, use this method to get the MachineInstr explicitly.
Representation of each machine instruction.
mop_iterator operands_begin()
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
bool isImplicitDef() const
const MachineBasicBlock * getParent() const
void dropDebugNumber()
Drop any variable location debugging information associated with this instruction.
LLVM_ABI void addImplicitDefUseOperands(MachineFunction &MF)
Add all implicit def and use operands to this instruction.
bool getFlag(MIFlag Flag) const
Return whether an MI flag is set.
unsigned getNumOperands() const
Retuns the total number of operands.
LLVM_ABI void addOperand(MachineFunction &MF, const MachineOperand &Op)
Add the specified operand to the instruction.
LLVM_ABI unsigned getNumExplicitOperands() const
Returns the number of non-implicit operands.
bool modifiesRegister(Register Reg, const TargetRegisterInfo *TRI) const
Return true if the MachineInstr modifies (fully define or partially define) the specified register.
const MCInstrDesc & getDesc() const
Returns the target instruction descriptor of this MachineInstr.
void untieRegOperand(unsigned OpIdx)
Break any tie involving OpIdx.
LLVM_ABI void setDesc(const MCInstrDesc &TID)
Replace the instruction descriptor (thus opcode) of the current instruction with a new one.
LLVM_ABI unsigned getNumExplicitDefs() const
Returns the number of non-implicit definitions.
LLVM_ABI void eraseFromBundle()
Unlink 'this' from its basic block and delete it.
bool hasOneMemOperand() const
Return true if this instruction has exactly one MachineMemOperand.
LLVM_ABI void substituteRegister(Register FromReg, Register ToReg, unsigned SubIdx, const TargetRegisterInfo &RegInfo)
Replace all occurrences of FromReg with ToReg:SubIdx, properly composing subreg indices where necessa...
mmo_iterator memoperands_begin() const
Access to memory operands of the instruction.
LLVM_ABI bool isIdenticalTo(const MachineInstr &Other, MICheckType Check=CheckDefs) const
Return true if this instruction is identical to Other.
LLVM_ABI const MachineFunction * getMF() const
Return the function that contains the basic block that this instruction belongs to.
void setFlag(MIFlag Flag)
Set a MI flag.
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
LLVM_ABI void removeOperand(unsigned OpNo)
Erase an operand from an instruction, leaving it with one fewer operand than it started with.
LLVM_ABI void dump() const
const MachineOperand & getOperand(unsigned i) const
unsigned getNumDefs() const
Returns the total number of definitions.
LLVM_ABI MachineInstrBundleIterator< MachineInstr > eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
void setDebugLoc(DebugLoc DL)
Replace current source information with new such.
MachineOperand * findRegisterDefOperand(Register Reg, const TargetRegisterInfo *TRI, bool isDead=false, bool Overlap=false)
Wrapper for findRegisterDefOperandIdx, it returns a pointer to the MachineOperand rather than an inde...
A description of a memory reference used in the backend.
@ MODereferenceable
The memory access is dereferenceable (i.e., doesn't trap).
@ MOLoad
The memory access reads data.
@ MOInvariant
The memory access always returns the same value (or traps).
@ MOStore
The memory access writes data.
This class contains meta information specific to a module.
MachineOperand class - Representation of each machine instruction operand.
void setSubReg(unsigned subReg)
unsigned getSubReg() const
void setImplicit(bool Val=true)
void setImm(int64_t immVal)
bool readsReg() const
readsReg - Returns true if this operand reads the previous value of its register.
bool isReg() const
isReg - Tests if this is a MO_Register operand.
MachineBasicBlock * getMBB() const
bool isCPI() const
isCPI - Tests if this is a MO_ConstantPoolIndex operand.
void setIsDead(bool Val=true)
LLVM_ABI void setReg(Register Reg)
Change the register this operand corresponds to.
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
void setIsKill(bool Val=true)
bool isJTI() const
isJTI - Tests if this is a MO_JumpTableIndex operand.
LLVM_ABI void ChangeToRegister(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isDebug=false)
ChangeToRegister - Replace this operand with a new register operand of the specified value.
static MachineOperand CreateImm(int64_t Val)
void setIsUndef(bool Val=true)
Register getReg() const
getReg - Returns the register number.
bool isFI() const
isFI - Tests if this is a MO_FrameIndex operand.
LLVM_ABI bool isIdenticalTo(const MachineOperand &Other) const
Returns true if this operand is identical to the specified operand except for liveness related flags ...
static MachineOperand CreateCPI(unsigned Idx, int Offset, unsigned TargetFlags=0)
static MachineOperand CreateReg(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isEarlyClobber=false, unsigned SubReg=0, bool isDebug=false, bool isInternalRead=false, bool isRenamable=false)
int64_t getOffset() const
Return the offset from the symbol in this operand.
static MachineOperand CreateFI(int Idx)
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLVM_ABI bool hasOneNonDBGUse(Register RegNo) const
hasOneNonDBGUse - Return true if there is exactly one non-Debug use of the specified register.
const TargetRegisterClass * getRegClass(Register Reg) const
Return the register class of the specified virtual register.
LLVM_ABI MachineInstr * getVRegDef(Register Reg) const
getVRegDef - Return the machine instr that defines the specified virtual register or null if none is ...
iterator_range< def_instr_iterator > def_instructions(Register Reg) const
bool use_nodbg_empty(Register RegNo) const
use_nodbg_empty - Return true if there are no non-Debug instructions using the specified register.
LLVM_ABI Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
const TargetRegisterInfo * getTargetRegisterInfo() const
LLVM_ABI const TargetRegisterClass * constrainRegClass(Register Reg, const TargetRegisterClass *RC, unsigned MinNumRegs=0)
constrainRegClass - Constrain the register class of the specified virtual register to be a common sub...
LLVM_ABI MachineInstr * getUniqueVRegDef(Register Reg) const
getUniqueVRegDef - Return the unique machine instr that defines the specified virtual register or nul...
A Module instance is used to store all the information related to an LLVM module.
Wrapper class representing virtual and physical registers.
constexpr bool isValid() const
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Represents one node in the SelectionDAG.
bool isMachineOpcode() const
Test if this node has a post-isel opcode, directly corresponding to a MachineInstr opcode.
unsigned getMachineOpcode() const
This may only be called if isMachineOpcode returns true.
const SDValue & getOperand(unsigned Num) const
EVT getValueType(unsigned ResNo) const
Return the type of a specified result.
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
LLVM_ABI MachineSDNode * getMachineNode(unsigned Opcode, const SDLoc &dl, EVT VT)
These are used for target selectors to create a new node with specified return type(s),...
LLVM_ABI void setNodeMemRefs(MachineSDNode *N, ArrayRef< MachineMemOperand * > NewMemRefs)
Mutate the specified machine node's memory references to the provided list.
MachineFunction & getMachineFunction() const
SlotIndex - An opaque wrapper around machine indexes.
SlotIndex getBaseIndex() const
Returns the base index for associated with this index.
SlotIndex getRegSlot(bool EC=false) const
Returns the register use/def slot in the current instruction for a normal or early-clobber def.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Represent a constant reference to a string, i.e.
Information about stack frame layout on the target.
bool hasFP(const MachineFunction &MF) const
hasFP - Return true if the specified function should have a dedicated frame pointer register.
Align getStackAlign() const
getStackAlignment - This method returns the number of bytes to which the stack pointer must be aligne...
TargetInstrInfo - Interface to description of machine instruction set.
virtual const TargetRegisterClass * getRegClass(const MCInstrDesc &MCID, unsigned OpNum) const
Given a machine instruction descriptor, returns the register class constraint for OpNum,...
virtual bool findCommutedOpIndices(const MachineInstr &MI, unsigned &SrcOpIdx1, unsigned &SrcOpIdx2) const
Returns true iff the routine could find two commutable operands in the given machine instruction.
virtual bool hasReassociableOperands(const MachineInstr &Inst, const MachineBasicBlock *MBB) const
Return true when \P Inst has reassociable operands in the same \P MBB.
virtual void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstIdxForVirtReg) const
When getMachineCombinerPatterns() finds patterns, this function generates the instructions that could...
virtual std::optional< ParamLoadedValue > describeLoadedValue(const MachineInstr &MI, Register Reg) const
Produce the expression describing the MI loading a value into the physical register Reg.
virtual bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const
Return true when there is potentially a faster code sequence for an instruction chain ending in Root.
virtual bool isReMaterializableImpl(const MachineInstr &MI) const
For instructions with opcodes for which the M_REMATERIALIZABLE flag is set, this hook lets the target...
virtual bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const
Test if the given instruction should be considered a scheduling boundary.
virtual MachineInstr * commuteInstructionImpl(MachineInstr &MI, bool NewMI, unsigned OpIdx1, unsigned OpIdx2) const
This method commutes the operands of the given machine instruction MI.
bool isPositionIndependent() const
const MCAsmInfo & getMCAsmInfo() const
Return target specific asm information.
CodeModel::Model getCodeModel() const
Returns the code model.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
Provide an instruction scheduling machine model to CodeGen passes.
virtual const TargetFrameLowering * getFrameLowering() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
Target - Wrapper for Target specific information.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
static constexpr TypeSize getZero()
The instances of the Type class are immutable: once they are created, they are never changed.
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
static LLVM_ABI Type * getFP128Ty(LLVMContext &C)
static LLVM_ABI Type * getDoubleTy(LLVMContext &C)
static LLVM_ABI Type * getFloatTy(LLVMContext &C)
static LLVM_ABI Type * getHalfTy(LLVMContext &C)
SlotIndex def
The index of the defining instruction.
LLVM Value Representation.
MCRegister getPhys(Register virtReg) const
returns the physical register mapped to the specified virtual register
void BuildCFI(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, const MCCFIInstruction &CFIInst, MachineInstr::MIFlag Flag=MachineInstr::NoFlags) const
Wraps up getting a CFI index and building a MachineInstr for it.
void getFrameIndexOperands(SmallVectorImpl< MachineOperand > &Ops, int FI) const override
bool optimizeCompareInstr(MachineInstr &CmpInstr, Register SrcReg, Register SrcReg2, int64_t CmpMask, int64_t CmpValue, const MachineRegisterInfo *MRI) const override
Check if there exists an earlier instruction that operates on the same source operands and sets eflag...
bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const override
void copyPhysReg(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, const DebugLoc &DL, Register DestReg, Register SrcReg, bool KillSrc, bool RenamableDest=false, bool RenamableSrc=false) const override
bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const override
Overrides the isSchedulingBoundary from Codegen/TargetInstrInfo.cpp to make it capable of identifying...
MachineBasicBlock::iterator insertOutlinedCall(Module &M, MachineBasicBlock &MBB, MachineBasicBlock::iterator &It, MachineFunction &MF, outliner::Candidate &C) const override
void replaceBranchWithTailCall(MachineBasicBlock &MBB, SmallVectorImpl< MachineOperand > &Cond, const MachineInstr &TailCall) const override
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify) const override
bool canInsertSelect(const MachineBasicBlock &, ArrayRef< MachineOperand > Cond, Register, Register, Register, int &, int &, int &) const override
void insertSelect(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, const DebugLoc &DL, Register DstReg, ArrayRef< MachineOperand > Cond, Register TrueReg, Register FalseReg) const override
unsigned getOpcodeAfterMemoryUnfold(unsigned Opc, bool UnfoldLoad, bool UnfoldStore, unsigned *LoadRegIndex=nullptr) const override
bool findCommutedOpIndices(const MachineInstr &MI, unsigned &SrcOpIdx1, unsigned &SrcOpIdx2) const override
Returns true iff the routine could find two commutable operands in the given machine instruction.
bool areLoadsFromSameBasePtr(SDNode *Load1, SDNode *Load2, int64_t &Offset1, int64_t &Offset2) const override
void loadRegFromStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, Register DestReg, int FrameIndex, const TargetRegisterClass *RC, Register VReg, unsigned SubReg=0, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
X86InstrInfo(const X86Subtarget &STI)
static bool isDataInvariantLoad(MachineInstr &MI)
Returns true if the instruction has no behavior (specified or otherwise) that is based on the value l...
MachineInstr * commuteInstructionImpl(MachineInstr &MI, bool NewMI, unsigned CommuteOpIdx1, unsigned CommuteOpIdx2) const override
bool isFunctionSafeToOutlineFrom(MachineFunction &MF, bool OutlineFromLinkOnceODRs) const override
const X86RegisterInfo & getRegisterInfo() const
getRegisterInfo - TargetInstrInfo is a superset of MRegister info.
bool hasCommutePreference(MachineInstr &MI, bool &Commute) const override
Returns true if we have preference on the operands order in MI, the commute decision is returned in C...
bool hasLiveCondCodeDef(MachineInstr &MI) const
True if MI has a condition code def, e.g.
std::optional< ParamLoadedValue > describeLoadedValue(const MachineInstr &MI, Register Reg) const override
bool canMakeTailCallConditional(SmallVectorImpl< MachineOperand > &Cond, const MachineInstr &TailCall) const override
bool getMemOperandsWithOffsetWidth(const MachineInstr &LdSt, SmallVectorImpl< const MachineOperand * > &BaseOps, int64_t &Offset, bool &OffsetIsScalable, LocationSize &Width, const TargetRegisterInfo *TRI) const override
bool unfoldMemoryOperand(MachineFunction &MF, MachineInstr &MI, Register Reg, bool UnfoldLoad, bool UnfoldStore, SmallVectorImpl< MachineInstr * > &NewMIs) const override
std::optional< DestSourcePair > isCopyInstrImpl(const MachineInstr &MI) const override
MachineInstr * convertToThreeAddress(MachineInstr &MI, LiveVariables *LV, LiveIntervals *LIS) const override
convertToThreeAddress - This method must be implemented by targets that set the M_CONVERTIBLE_TO_3_AD...
std::pair< unsigned, unsigned > decomposeMachineOperandsTargetFlags(unsigned TF) const override
bool expandPostRAPseudo(MachineInstr &MI) const override
void storeRegToStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, Register SrcReg, bool isKill, int FrameIndex, const TargetRegisterClass *RC, Register VReg, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
bool isAssociativeAndCommutative(const MachineInstr &Inst, bool Invert) const override
MCInst getNop() const override
Return the noop instruction to use for a noop.
outliner::InstrType getOutliningTypeImpl(const MachineModuleInfo &MMI, MachineBasicBlock::iterator &MIT, unsigned Flags) const override
bool shouldScheduleLoadsNear(SDNode *Load1, SDNode *Load2, int64_t Offset1, int64_t Offset2, unsigned NumLoads) const override
This is a used by the pre-regalloc scheduler to determine (in conjunction with areLoadsFromSameBasePt...
bool analyzeCompare(const MachineInstr &MI, Register &SrcReg, Register &SrcReg2, int64_t &CmpMask, int64_t &CmpValue) const override
bool getConstValDefinedInReg(const MachineInstr &MI, const Register Reg, int64_t &ImmVal) const override
std::optional< ExtAddrMode > getAddrModeFromMemoryOp(const MachineInstr &MemI, const TargetRegisterInfo *TRI) const override
Register isStoreToStackSlotPostFE(const MachineInstr &MI, int &FrameIndex) const override
isStoreToStackSlotPostFE - Check for post-frame ptr elimination stack locations as well.
const TargetRegisterClass * getRegClass(const MCInstrDesc &MCID, unsigned OpNum) const override
Given a machine instruction descriptor, returns the register class constraint for OpNum,...
bool isUnconditionalTailCall(const MachineInstr &MI) const override
void reMaterialize(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, Register DestReg, unsigned SubIdx, const MachineInstr &Orig, LaneBitmask UsedLanes=LaneBitmask::getAll()) const override
bool reverseBranchCondition(SmallVectorImpl< MachineOperand > &Cond) const override
std::optional< std::unique_ptr< outliner::OutlinedFunction > > getOutliningCandidateInfo(const MachineModuleInfo &MMI, std::vector< outliner::Candidate > &RepeatedSequenceLocs, unsigned MinRepeats) const override
bool classifyLEAReg(MachineInstr &MI, const MachineOperand &Src, unsigned LEAOpcode, bool AllowSP, Register &NewSrc, unsigned &NewSrcSubReg, bool &isKill, MachineOperand &ImplicitOp, LiveVariables *LV, LiveIntervals *LIS) const
Given an operand within a MachineInstr, insert preceding code to put it into the right format for a p...
Register isLoadFromStackSlotPostFE(const MachineInstr &MI, int &FrameIndex) const override
isLoadFromStackSlotPostFE - Check for post-frame ptr elimination stack locations as well.
void setExecutionDomain(MachineInstr &MI, unsigned Domain) const override
unsigned insertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, ArrayRef< MachineOperand > Cond, const DebugLoc &DL, int *BytesAdded=nullptr) const override
ArrayRef< std::pair< unsigned, const char * > > getSerializableDirectMachineOperandTargetFlags() const override
Register isStoreToStackSlot(const MachineInstr &MI, int &FrameIndex) const override
bool setExecutionDomainCustom(MachineInstr &MI, unsigned Domain) const
int getSPAdjust(const MachineInstr &MI) const override
getSPAdjust - This returns the stack pointer adjustment made by this instruction.
bool verifyInstruction(const MachineInstr &MI, StringRef &ErrInfo) const override
bool isReMaterializableImpl(const MachineInstr &MI) const override
Register getGlobalBaseReg(MachineFunction *MF) const
getGlobalBaseReg - Return a virtual register initialized with the the global base register value.
int getJumpTableIndex(const MachineInstr &MI) const override
void insertNoop(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI) const override
void setSpecialOperandAttr(MachineInstr &OldMI1, MachineInstr &OldMI2, MachineInstr &NewMI1, MachineInstr &NewMI2) const override
This is an architecture-specific helper function of reassociateOps.
std::pair< uint16_t, uint16_t > getExecutionDomain(const MachineInstr &MI) const override
bool isCoalescableExtInstr(const MachineInstr &MI, Register &SrcReg, Register &DstReg, unsigned &SubIdx) const override
isCoalescableExtInstr - Return true if the instruction is a "coalescable" extension instruction.
void loadStoreTileReg(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, unsigned Opc, Register Reg, int FrameIdx, bool isKill=false) const
void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg) const override
When getMachineCombinerPatterns() finds potential patterns, this function generates the instructions ...
bool hasReassociableOperands(const MachineInstr &Inst, const MachineBasicBlock *MBB) const override
bool analyzeBranchPredicate(MachineBasicBlock &MBB, TargetInstrInfo::MachineBranchPredicate &MBP, bool AllowModify=false) const override
static bool isDataInvariant(MachineInstr &MI)
Returns true if the instruction has no behavior (specified or otherwise) that is based on the value o...
unsigned getUndefRegClearance(const MachineInstr &MI, unsigned OpNum, const TargetRegisterInfo *TRI) const override
Inform the BreakFalseDeps pass how many idle instructions we would like before certain undef register...
MachineInstr * foldMemoryOperandImpl(MachineFunction &MF, MachineInstr &MI, ArrayRef< unsigned > Ops, int FrameIndex, MachineInstr *&CopyMI, LiveIntervals *LIS=nullptr, VirtRegMap *VRM=nullptr) const override
Fold a load or store of the specified stack slot into the specified machine instruction for the speci...
void breakPartialRegDependency(MachineInstr &MI, unsigned OpNum, const TargetRegisterInfo *TRI) const override
void buildClearRegister(Register Reg, MachineBasicBlock &MBB, MachineBasicBlock::iterator Iter, DebugLoc &DL, bool AllowSideEffects=true) const override
Register isLoadFromStackSlot(const MachineInstr &MI, int &FrameIndex) const override
int64_t getFrameAdjustment(const MachineInstr &I) const
Returns the stack pointer adjustment that happens inside the frame setup..destroy sequence (e....
bool hasHighOperandLatency(const TargetSchedModel &SchedModel, const MachineRegisterInfo *MRI, const MachineInstr &DefMI, unsigned DefIdx, const MachineInstr &UseMI, unsigned UseIdx) const override
bool isSafeToMoveRegClassDefs(const TargetRegisterClass *RC) const override
uint16_t getExecutionDomainCustom(const MachineInstr &MI) const
bool isHighLatencyDef(int opc) const override
void buildOutlinedFrame(MachineBasicBlock &MBB, MachineFunction &MF, const outliner::OutlinedFunction &OF) const override
bool foldImmediate(MachineInstr &UseMI, MachineInstr &DefMI, Register Reg, MachineRegisterInfo *MRI) const override
foldImmediate - 'Reg' is known to be defined by a move immediate instruction, try to fold the immedia...
unsigned removeBranch(MachineBasicBlock &MBB, int *BytesRemoved=nullptr) const override
unsigned getFMA3OpcodeToCommuteOperands(const MachineInstr &MI, unsigned SrcOpIdx1, unsigned SrcOpIdx2, const X86InstrFMA3Group &FMA3Group) const
Returns an adjusted FMA opcode that must be used in FMA instruction that performs the same computatio...
bool preservesZeroValueInReg(const MachineInstr *MI, const Register NullValueReg, const TargetRegisterInfo *TRI) const override
unsigned getPartialRegUpdateClearance(const MachineInstr &MI, unsigned OpNum, const TargetRegisterInfo *TRI) const override
Inform the BreakFalseDeps pass how many idle instructions we would like before a partial register upd...
X86MachineFunctionInfo - This class is derived from MachineFunction and contains private X86 target-s...
Register getGlobalBaseReg() const
int getTCReturnAddrDelta() const
void setGlobalBaseReg(Register Reg)
bool getUsesRedZone() const
const TargetRegisterClass * constrainRegClassToNonRex2(const TargetRegisterClass *RC) const
const X86RegisterInfo * getRegisterInfo() const override
const X86FrameLowering * getFrameLowering() const override
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
@ C
The default llvm calling convention, compatible with C.
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
@ X86
Windows x64, Windows Itanium (IA-64)
X86II - This namespace holds all of the target specific flags that instruction info tracks.
bool isKMergeMasked(uint64_t TSFlags)
bool hasNewDataDest(uint64_t TSFlags)
@ MO_GOT_ABSOLUTE_ADDRESS
MO_GOT_ABSOLUTE_ADDRESS - On a symbol operand, this represents a relocation of: SYMBOL_LABEL + [.
@ MO_INDNTPOFF
MO_INDNTPOFF - On a symbol operand this indicates that the immediate is the absolute address of the G...
@ MO_GOTNTPOFF
MO_GOTNTPOFF - On a symbol operand this indicates that the immediate is the offset of the GOT entry w...
@ MO_GOTTPOFF
MO_GOTTPOFF - On a symbol operand this indicates that the immediate is the offset of the GOT entry wi...
@ MO_GOTPCREL
MO_GOTPCREL - On a symbol operand this indicates that the immediate is offset to the GOT entry for th...
@ EVEX
EVEX - Specifies that this instruction use EVEX form which provides syntax support up to 32 512-bit r...
@ SSEDomainShift
Execution domain for SSE instructions.
bool canUseApxExtendedReg(const MCInstrDesc &Desc)
bool isPseudo(uint64_t TSFlags)
bool isKMasked(uint64_t TSFlags)
int getMemoryOperandNo(uint64_t TSFlags)
unsigned getOperandBias(const MCInstrDesc &Desc)
Compute whether all of the def operands are repeated in the uses and therefore should be skipped.
Define some predicates that are used for node matching.
CondCode getCondFromBranch(const MachineInstr &MI)
CondCode getCondFromCFCMov(const MachineInstr &MI)
CondCode getCondFromMI(const MachineInstr &MI)
Return the condition code of the instruction.
int getFirstAddrOperandIdx(const MachineInstr &MI)
Return the index of the instruction's first address operand, if it has a memory reference,...
unsigned getSwappedVCMPImm(unsigned Imm)
Get the VCMP immediate if the opcodes are swapped.
CondCode GetOppositeBranchCondition(CondCode CC)
GetOppositeBranchCondition - Return the inverse of the specified cond, e.g.
unsigned getSwappedVPCOMImm(unsigned Imm)
Get the VPCOM immediate if the opcodes are swapped.
bool isX87Instruction(MachineInstr &MI)
Check if the instruction is X87 instruction.
unsigned getNonNDVariant(unsigned Opc)
unsigned getVPCMPImmForCond(ISD::CondCode CC)
Get the VPCMP immediate for the given condition.
std::pair< CondCode, bool > getX86ConditionCode(CmpInst::Predicate Predicate)
Return a pair of condition code for the given predicate and whether the instruction operands should b...
CondCode getCondFromSETCC(const MachineInstr &MI)
unsigned getSwappedVPCMPImm(unsigned Imm)
Get the VPCMP immediate if the opcodes are swapped.
CondCode getCondFromCCMP(const MachineInstr &MI)
int getCCMPCondFlagsFromCondCode(CondCode CC)
int getCondSrcNoFromDesc(const MCInstrDesc &MCID)
Return the source operand # for condition code by MCID.
const Constant * getConstantFromPool(const MachineInstr &MI, unsigned OpNo)
Find any constant pool entry associated with a specific instruction operand.
unsigned getMOVriOpcode(bool Use64BitReg, int64_t Imm)
Return a MOVri opcode for materializing Imm into a 32- or 64-bit GPR.
unsigned getCMovOpcode(unsigned RegBytes, bool HasMemoryOperand=false, bool HasNDD=false)
Return a cmov opcode for the given register size in bytes, and operand type.
unsigned getNFVariant(unsigned Opc)
unsigned getVectorRegisterWidth(const MCOperandInfo &Info)
Get the width of the vector register operand.
CondCode getCondFromCMov(const MachineInstr &MI)
initializer< Ty > init(const Ty &Val)
InstrType
Represents how an instruction should be mapped by the outliner.
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
static bool isAddMemInstrWithRelocation(const MachineInstr &MI)
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
LLVM_ABI bool isNullConstant(SDValue V)
Returns true if V is a constant integer zero.
RegState
Flags to represent properties of register accesses.
@ Implicit
Not emitted register (e.g. carry, or temporary result).
@ Kill
The last use of a register.
@ Undef
Value of the register doesn't matter.
@ Define
Register definition.
static bool isMem(const MachineInstr &MI, unsigned Op)
constexpr RegState getKillRegState(bool B)
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
bool isAligned(Align Lhs, uint64_t SizeInBytes)
Checks that SizeInBytes is a multiple of the alignment.
MCRegister getX86SubSuperRegister(MCRegister Reg, unsigned Size, bool High=false)
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
void append_range(Container &C, Range &&R)
Wrapper function to append range R to container C.
static const MachineInstrBuilder & addRegReg(const MachineInstrBuilder &MIB, Register Reg1, bool isKill1, unsigned SubReg1, Register Reg2, bool isKill2, unsigned SubReg2)
addRegReg - This function is used to add a memory reference of the form: [Reg + Reg].
static const MachineInstrBuilder & addFrameReference(const MachineInstrBuilder &MIB, int FI, int Offset=0, bool mem=true)
addFrameReference - This function is used to add a reference to the base of an abstract object on the...
constexpr RegState getDeadRegState(bool B)
constexpr int popcount(T Value) noexcept
Count the number of set bits in a value.
bool isNonFoldableWithSameMask(unsigned RegOp)
const X86FoldTableEntry * lookupBroadcastFoldTable(unsigned RegOp, unsigned OpNum)
int countr_zero(T Val)
Count number of 0's from the least significant bit to the most stopping at the first 1.
const X86InstrFMA3Group * getFMA3Group(unsigned Opcode, uint64_t TSFlags)
Returns a reference to a group of FMA3 opcodes to where the given Opcode is included.
auto reverse(ContainerTy &&C)
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
const X86FoldTableEntry * lookupTwoAddrFoldTable(unsigned RegOp)
constexpr uint64_t alignTo(uint64_t Size, Align A)
Returns a multiple of A needed to store Size bytes.
bool is_sorted(R &&Range, Compare C)
Wrapper function around std::is_sorted to check if elements in a range R are sorted with respect to a...
constexpr RegState getDefRegState(bool B)
constexpr bool isUInt(uint64_t x)
Checks if an unsigned integer fits into the given bit width.
RegState getRegState(const MachineOperand &RegOp)
Get all register state flags from machine operand RegOp.
static bool isMemInstrWithGOTPCREL(const MachineInstr &MI)
static const MachineInstrBuilder & addOffset(const MachineInstrBuilder &MIB, int Offset)
auto lower_bound(R &&Range, T &&Value)
Provide wrappers to std::lower_bound which take ranges instead of having to pass begin/end explicitly...
@ Sub
Subtraction of integers.
RelativeUniformCounterPtr ValuesPtrExpr VTableAddr Count
MaybeAlign getStackAlign(const CallBase &I, unsigned Index)
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
const X86FoldTableEntry * lookupUnfoldTable(unsigned MemOp)
constexpr unsigned BitWidth
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
bool matchBroadcastSize(const X86FoldTableEntry &Entry, unsigned BroadcastBits)
std::pair< MachineOperand, DIExpression * > ParamLoadedValue
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
const X86FoldTableEntry * lookupFoldTable(unsigned RegOp, unsigned OpNum)
static const MachineInstrBuilder & addRegOffset(const MachineInstrBuilder &MIB, Register Reg, bool isKill, int Offset)
addRegOffset - This function is used to add a memory reference of the form [Reg + Offset],...
constexpr RegState getUndefRegState(bool B)
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
This struct is a compact representation of a valid (non-zero power of two) alignment.
MVT getSimpleVT() const
Return the SimpleValueType held in the specified simple EVT.
Used to describe addressing mode similar to ExtAddrMode in CodeGenPrepare.
This represents a simple continuous liveness interval for a value.
std::vector< MachineInstr * > Kills
Kills - List of MachineInstruction's which are the last use of this virtual register (kill it) in the...
This class contains a discriminated union of information about pointers in memory operands,...
static LLVM_ABI MachinePointerInfo getGOT(MachineFunction &MF)
Return a MachinePointerInfo record that refers to a GOT entry.
X86AddressMode - This struct holds a generalized full x86 address mode.
enum llvm::X86AddressMode::@202116273335065351270200035056227005202106004277 BaseType
This class is used to group {132, 213, 231} forms of FMA opcodes together.
unsigned get213Opcode() const
Returns the 213 form of FMA opcode.
unsigned get231Opcode() const
Returns the 231 form of FMA opcode.
bool isIntrinsic() const
Returns true iff the group of FMA opcodes holds intrinsic opcodes.
unsigned get132Opcode() const
Returns the 132 form of FMA opcode.
An individual sequence of instructions to be replaced with a call to an outlined function.
The information necessary to create an outlined function for some class of candidate.