#define GET_GICOMBINER_DEPS
#include "AArch64GenPostLegalizeGILowering.inc"
#undef GET_GICOMBINER_DEPS

#define DEBUG_TYPE "aarch64-postlegalizer-lowering"

#define GET_GICOMBINER_TYPES
#include "AArch64GenPostLegalizeGILowering.inc"
#undef GET_GICOMBINER_TYPES
// Represents a pseudo instruction which replaces a G_SHUFFLE_VECTOR.
struct ShuffleVectorPseudo {
  ShuffleVectorPseudo(unsigned Opc, Register Dst,
                      std::initializer_list<SrcOp> SrcOps)
      : Opc(Opc), Dst(Dst), SrcOps(SrcOps) {}
  ShuffleVectorPseudo() = default;
  assert(MI.getOpcode() == TargetOpcode::G_FCONSTANT);

  if (DstSize != 16 && DstSize != 32 && DstSize != 64)

  assert(MI.getOpcode() == TargetOpcode::G_FCONSTANT);
  const APFloat &ImmValAPF = MI.getOperand(1).getFPImm()->getValueAPF();

  MI.eraseFromParent();
std::optional<std::pair<bool, uint64_t>> getExtMask(ArrayRef<int> M,

  // Look for the first non-undef element.
  auto FirstRealElt = find_if(M, [](int Elt) { return Elt >= 0; });
  if (FirstRealElt == M.end())

  APInt ExpectedElt = APInt(MaskBits, *FirstRealElt + 1, false, true);

  // Every following real element must be the successor of the previous one.
      [&ExpectedElt](int Elt) { return Elt != ExpectedElt++ && Elt >= 0; }))

  bool ReverseExt = false;

  return std::make_pair(ReverseExt, Imm);
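// Worked example (editor's sketch, not from the source): for two v8s8
// inputs, the mask <3, 4, 5, 6, 7, 8, 9, 10> ascends consecutively from
// its first real element, so the shuffle is an EXT reading a contiguous
// 8-byte window of the concatenated sources starting at byte 3, i.e.
// Imm = 3 with ReverseExt = false. Undef (-1) lanes may appear anywhere,
// since the successor check above skips negative elements.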
                                             int NumInputElements) {
  if (M.size() != static_cast<size_t>(NumInputElements))
    return std::nullopt;

  int NumLHSMatch = 0, NumRHSMatch = 0;
  int LastLHSMismatch = -1, LastRHSMismatch = -1;
  for (int Idx = 0; Idx < NumInputElements; ++Idx) {
    // Count lanes copying the LHS (identity) and lanes copying the
    // corresponding RHS lane, remembering the last lane that did not.
    M[Idx] == Idx ? ++NumLHSMatch : LastLHSMismatch = Idx;
    M[Idx] == Idx + NumInputElements ? ++NumRHSMatch : LastRHSMismatch = Idx;
  }

  const int NumNeededToMatch = NumInputElements - 1;
  if (NumLHSMatch == NumNeededToMatch)
    return std::make_pair(true, LastLHSMismatch);
  if (NumRHSMatch == NumNeededToMatch)
    return std::make_pair(false, LastRHSMismatch);
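// Worked example (editor's sketch, not from the source): with
// NumInputElements = 4, the mask <0, 1, 6, 3> matches the identity in
// every lane except lane 2, which reads element 6 (lane 2 of the RHS), so
// this returns {DstIsLeft = true, DstLane = 2} and the shuffle can become
// a single lane-to-lane INS.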
             ShuffleVectorPseudo &MatchInfo) {
  assert(MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);

  unsigned NumElts = Ty.getNumElements();

  for (unsigned LaneSize : {64U, 32U, 16U}) {
    if (isREVMask(ShuffleMask, EltSize, NumElts, LaneSize)) {
      unsigned Opcode;
      if (LaneSize == 64U)
        Opcode = AArch64::G_REV64;
      else if (LaneSize == 32U)
        Opcode = AArch64::G_REV32;
      else
        Opcode = AArch64::G_BSWAP;
      MatchInfo = ShuffleVectorPseudo(Opcode, Dst, {Src});
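// Worked example (editor's sketch, not from the source): for v8s16, the
// mask <3, 2, 1, 0, 7, 6, 5, 4> reverses the 16-bit elements within each
// 64-bit lane, so isREVMask fires with LaneSize = 64 and the shuffle
// lowers to REV64. The 16-bit-lane case is exactly a byte swap of every
// 16-bit lane, which is why it is encoded as G_BSWAP and handled
// specially in applyShuffleVectorPseudo below.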
             ShuffleVectorPseudo &MatchInfo) {
  assert(MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
  unsigned WhichResult;
  unsigned OperandOrder;

  if (!isTRNMask(ShuffleMask, NumElts, WhichResult, OperandOrder))
    return false;
  unsigned Opc = (WhichResult == 0) ? AArch64::G_TRN1 : AArch64::G_TRN2;
  Register V1 = MI.getOperand(OperandOrder == 0 ? 1 : 2).getReg();
  Register V2 = MI.getOperand(OperandOrder == 0 ? 2 : 1).getReg();
  MatchInfo = ShuffleVectorPseudo(Opc, Dst, {V1, V2});
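// Worked example (editor's sketch, not from the source): for two v8s8
// inputs, <0, 8, 2, 10, 4, 12, 6, 14> transposes the even lanes of both
// sources (TRN1) and <1, 9, 3, 11, 5, 13, 7, 15> the odd lanes (TRN2);
// OperandOrder swaps V1/V2 when the mask names the second source first.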
             ShuffleVectorPseudo &MatchInfo) {
  assert(MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
  unsigned WhichResult;

  if (!isUZPMask(ShuffleMask, NumElts, WhichResult))
    return false;
  unsigned Opc = (WhichResult == 0) ? AArch64::G_UZP1 : AArch64::G_UZP2;

  MatchInfo = ShuffleVectorPseudo(Opc, Dst, {V1, V2});
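// Worked example (editor's sketch, not from the source):
// <0, 2, 4, 6, 8, 10, 12, 14> keeps the even-indexed lanes of the
// concatenated sources (UZP1); <1, 3, 5, 7, 9, 11, 13, 15> keeps the
// odd-indexed lanes (UZP2).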
             ShuffleVectorPseudo &MatchInfo) {
  assert(MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
  unsigned WhichResult;
  unsigned OperandOrder;

  if (!isZIPMask(ShuffleMask, NumElts, WhichResult, OperandOrder))
    return false;
  unsigned Opc = (WhichResult == 0) ? AArch64::G_ZIP1 : AArch64::G_ZIP2;
  Register V1 = MI.getOperand(OperandOrder == 0 ? 1 : 2).getReg();
  Register V2 = MI.getOperand(OperandOrder == 0 ? 2 : 1).getReg();
  MatchInfo = ShuffleVectorPseudo(Opc, Dst, {V1, V2});
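// Worked example (editor's sketch, not from the source):
// <0, 8, 1, 9, 2, 10, 3, 11> interleaves the low halves of two v8s8
// sources (ZIP1), while <4, 12, 5, 13, 6, 14, 7, 15> interleaves the
// high halves (ZIP2).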
                                 ShuffleVectorPseudo &MatchInfo) {

  // Match a G_DUP of a value that was inserted into an undef vector.
  auto *InsMI = getOpcodeDef(TargetOpcode::G_INSERT_VECTOR_ELT,
                             MI.getOperand(1).getReg(), MRI);

  // The vector being inserted into must be undef.
  if (!getOpcodeDef(TargetOpcode::G_IMPLICIT_DEF, InsMI->getOperand(1).getReg(),
                    MRI))
    return false;

  MatchInfo = ShuffleVectorPseudo(AArch64::G_DUP, MI.getOperand(0).getReg(),
                                  {InsMI->getOperand(2).getReg()});
                              ShuffleVectorPseudo &MatchInfo) {
  assert(Lane >= 0 && "Expected non-negative lane?");

  auto *BuildVecMI = getOpcodeDef(TargetOpcode::G_BUILD_VECTOR,
      MI.getOperand(Lane < NumElements ? 1 : 2).getReg(), MRI);

  if (NumElements <= Lane)

  Register Reg = BuildVecMI->getOperand(Lane + 1).getReg();

  MatchInfo =
      ShuffleVectorPseudo(AArch64::G_DUP, MI.getOperand(0).getReg(), {Reg});
              ShuffleVectorPseudo &MatchInfo) {
  assert(MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);

  int Lane = *MaybeLane;

  if (matchDupFromInsertVectorElt(Lane, MI, MRI, MatchInfo))
    return true;
  if (matchDupFromBuildVector(Lane, MI, MRI, MatchInfo))
    return true;
  unsigned NumElts = Ty.getNumElements();

  // Check that the mask is a rotation of a single source vector.
  unsigned ExpectedElt = M[0];
  for (unsigned I = 1; I < NumElts; ++I) {
    // Increment the expected index; if it wraps, follow it back to zero.
    ++ExpectedElt;
    if (ExpectedElt == NumElts)
      ExpectedElt = 0;

    if (ExpectedElt != static_cast<unsigned>(M[I]))
      return false;
  }
              ShuffleVectorPseudo &MatchInfo) {
  assert(MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);

  auto Mask = MI.getOperand(3).getShuffleMask();

  // Single-source case: V2 is undef and the mask rotates a single vector.
      !isSingletonExtMask(Mask, DstTy))

    MatchInfo = ShuffleVectorPseudo(AArch64::G_EXT, Dst, {V1, V1, Imm});

  std::tie(ReverseExt, Imm) = *ExtInfo;

  MatchInfo = ShuffleVectorPseudo(AArch64::G_EXT, Dst, {V1, V2, Imm});
                               ShuffleVectorPseudo &MatchInfo) {

  if (MatchInfo.Opc == TargetOpcode::G_BSWAP) {
    // A REV16 of 8-bit elements is a bswap of 16-bit lanes: bitcast to a
    // 16-bit element type, bswap, and bitcast back.
    assert(MatchInfo.SrcOps.size() == 1);
                              : LLT::fixed_vector(8, 16);
    auto BS1 = MIRBuilder.buildInstr(TargetOpcode::G_BITCAST, {BSTy},
                                     MatchInfo.SrcOps[0]);
    auto BS2 = MIRBuilder.buildInstr(MatchInfo.Opc, {BSTy}, {BS1});
    MIRBuilder.buildInstr(TargetOpcode::G_BITCAST, {MatchInfo.Dst}, {BS2});
  } else
    MIRBuilder.buildInstr(MatchInfo.Opc, {MatchInfo.Dst}, MatchInfo.SrcOps);
  MI.eraseFromParent();
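// Editor's sketch of the MIR emitted by the G_BSWAP path above (not from
// the source): for a 128-bit shuffle it is roughly
//   %bc:_(<8 x s16>)  = G_BITCAST %src(<16 x s8>)
//   %bs:_(<8 x s16>)  = G_BSWAP %bc
//   %dst:_(<16 x s8>) = G_BITCAST %bs
// i.e. swapping the two bytes of every 16-bit lane, which is exactly what
// a REV16 of 8-bit elements does.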
  // An EXT by 0 bytes is just a copy of the first source.
  if (MatchInfo.SrcOps[2].getImm() == 0)
    MIRBuilder.buildCopy(MatchInfo.Dst, MatchInfo.SrcOps[0]);
  else {
    auto Cst = MIRBuilder.buildConstant(LLT::scalar(32),
                                        MatchInfo.SrcOps[2].getImm());
    MIRBuilder.buildInstr(MatchInfo.Opc, {MatchInfo.Dst},
                          {MatchInfo.SrcOps[0], MatchInfo.SrcOps[1], Cst});
  }
  MI.eraseFromParent();
452 "Expected 128bit vector in applyFullRev");
454 auto Cst = MIRBuilder.buildConstant(
LLT::scalar(32), 8);
455 auto Rev = MIRBuilder.buildInstr(AArch64::G_REV64, {DstTy}, {Src});
456 MIRBuilder.buildInstr(AArch64::G_EXT, {Dst}, {Rev, Rev, Cst});
457 MI.eraseFromParent();
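// Why REV64 + EXT #8 is a full 128-bit reversal (editor's note): REV64
// reverses the elements inside each 64-bit half, and EXT with a byte
// offset of 8 on {Rev, Rev} swaps the two halves. E.g. for v16s8 lanes
// 0..15:
//   after REV64: <7,6,5,4,3,2,1,0, 15,14,13,12,11,10,9,8>
//   after EXT#8: <15,14,13,12,11,10,9,8, 7,6,5,4,3,2,1,0>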
  assert(MI.getOpcode() == TargetOpcode::G_INSERT_VECTOR_ELT);

  Builder.setInstrAndDebugLoc(Insert);

  // Spill the full vector to a stack temporary.
  auto StackTemp = Builder.buildFrameIndex(FramePtrTy, FrameIdx);

  Builder.buildStore(Insert.getOperand(1), StackTemp, PtrInfo, Align(8));

  // Mask the index so the element store stays inside the stack slot; this
  // relies on the element count being a power of 2.
         "Expected a power-of-2 vector size");

  auto EltSize = Builder.buildConstant(IdxTy, EltTy.getSizeInBytes());

  Register EltPtr =
      Builder.buildPtrAdd(MRI.getType(StackTemp.getReg(0)), StackTemp, Mul)
          .getReg(0);

  Builder.buildStore(Insert.getElementReg(), EltPtr, PtrInfo, Align(1));

  // Reload the whole vector.
  Builder.buildLoad(Insert.getReg(0), StackTemp, PtrInfo, Align(8));
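// Editor's note: this is the standard store/reload lowering for an insert
// at a non-constant index: spill the vector, compute
// FrameIndex + (Idx & (NumElts - 1)) * sizeof(Elt), store the scalar
// there, and reload the whole vector. The index masking (rather than a
// compare and branch) is what makes an out-of-range index safe.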
              std::tuple<Register, int, Register, int> &MatchInfo) {
  assert(MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);

  auto DstIsLeftAndDstLane = isINSMask(ShuffleMask, NumElts);
  if (!DstIsLeftAndDstLane)
    return false;

  std::tie(DstIsLeft, DstLane) = *DstIsLeftAndDstLane;

  int SrcLane = ShuffleMask[DstLane];
  if (SrcLane >= NumElts) {

  MatchInfo = std::make_tuple(DstVec, DstLane, SrcVec, SrcLane);
              std::tuple<Register, int, Register, int> &MatchInfo) {
  Builder.setInstrAndDebugLoc(MI);

  int DstLane, SrcLane;
  std::tie(DstVec, DstLane, SrcVec, SrcLane) = MatchInfo;
  auto SrcCst = Builder.buildConstant(LLT::scalar(64), SrcLane);
  auto Extract = Builder.buildExtractVectorElement(ScalarTy, SrcVec, SrcCst);
  auto DstCst = Builder.buildConstant(LLT::scalar(64), DstLane);
  Builder.buildInsertVectorElement(Dst, DstVec, Extract, DstCst);
  MI.eraseFromParent();
  assert(Ty.isVector() && "vector shift count is not a vector type");

  int64_t ElementBits = Ty.getScalarSizeInBits();
  return Cnt >= 1 && Cnt <= ElementBits;
  assert(MI.getOpcode() == TargetOpcode::G_ASHR ||
         MI.getOpcode() == TargetOpcode::G_LSHR);

  unsigned Opc = MI.getOpcode();
  assert(Opc == TargetOpcode::G_ASHR || Opc == TargetOpcode::G_LSHR);
  unsigned NewOpc =
      Opc == TargetOpcode::G_ASHR ? AArch64::G_VASHR : AArch64::G_VLSHR;

  MIB.buildInstr(NewOpc, {MI.getOperand(0)}, {MI.getOperand(1)}).addImm(Imm);
  MI.eraseFromParent();
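// Example (editor's sketch, not from the source): a legalized
//   %r:_(<4 x s32>) = G_ASHR %x, %splat(<4 x s32>)  ; splat of 16
// becomes
//   %r:_(<4 x s32>) = G_VASHR %x, 16
// matching the immediate forms of SSHR/USHR. isVShiftRImm above enforces
// 1 <= Cnt <= ElementBits, the encodable range for right shifts.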
std::optional<std::pair<uint64_t, CmpInst::Predicate>>

  unsigned Size = Ty.getSizeInBits();
  assert((Size == 32 || Size == 64) && "Expected 32 or 64 bit compare only?");

  uint64_t OriginalC = ValAndVReg->Value.getZExtValue();

  // Each predicate rewrite below bails out at the wrap-around boundary of
  // its constant, e.g. for the signed-less-than case:
      (Size == 32 && static_cast<int32_t>(C) == INT32_MIN))

  assert(C != 0 && "C should not be zero here!");

  if ((Size == 32 && static_cast<int32_t>(C) == INT32_MAX) ||

  if ((Size == 32 && static_cast<uint32_t>(C) == UINT32_MAX) ||

  // Only keep the rewritten constant if it is no more expensive to
  // materialize than the original one.
  if (NumberOfInstrToLoadImm(OriginalC) > NumberOfInstrToLoadImm(C))
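// Worked example (editor's sketch, not from the source): AArch64
// arithmetic immediates are 12 bits, optionally shifted left by 12.
// "icmp uge %x, 4097" needs an extra instruction to materialize 4097, but
// since (x >= c) == (x > c - 1) for unsigned c != 0, it can be rewritten
// as "icmp ugt %x, 4096", and 4096 (= 1 << 12) encodes directly into the
// CMP immediate field.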
bool matchAdjustICmpImmAndPred(
    std::pair<uint64_t, CmpInst::Predicate> &MatchInfo) {
  assert(MI.getOpcode() == TargetOpcode::G_ICMP);

  if (auto MaybeNewImmAndPred = tryAdjustICmpImmAndPred(RHS, Pred, MRI)) {
    MatchInfo = *MaybeNewImmAndPred;

void applyAdjustICmpImmAndPred(
    MachineInstr &MI, std::pair<uint64_t, CmpInst::Predicate> &MatchInfo,

  RHS.setReg(Cst->getOperand(0).getReg());
  MI.getOperand(1).setPredicate(MatchInfo.second);
                  std::pair<unsigned, int> &MatchInfo) {
  assert(MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);

  const LLT DstTy = MRI.getType(MI.getOperand(0).getReg());

  if (*LaneIdx >= SrcTy.getNumElements())

  // Pick the DUPLANE variant matching the source element count and size.
  switch (SrcTy.getNumElements()) {
  case 2:
    if (ScalarSize == 64)
      Opc = AArch64::G_DUPLANE64;
    else if (ScalarSize == 32)
      Opc = AArch64::G_DUPLANE32;
    break;
  case 4:
    if (ScalarSize == 32)
      Opc = AArch64::G_DUPLANE32;
    else if (ScalarSize == 16)
      Opc = AArch64::G_DUPLANE16;
    break;
  case 8:
    if (ScalarSize == 8)
      Opc = AArch64::G_DUPLANE8;
    else if (ScalarSize == 16)
      Opc = AArch64::G_DUPLANE16;
    break;
  case 16:
    if (ScalarSize == 8)
      Opc = AArch64::G_DUPLANE8;
    break;
  }

  MatchInfo.first = Opc;
  MatchInfo.second = *LaneIdx;
  assert(MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);

  B.setInstrAndDebugLoc(MI);
  auto Lane = B.buildConstant(LLT::scalar(64), MatchInfo.second);

  // DUPLANE indexes into a 128-bit register, so widen a 64-bit source by
  // concatenating it with an undef half.
  if (SrcTy.getSizeInBits() == 64) {
    auto Undef = B.buildUndef(SrcTy);
    DupSrc = B.buildConcatVectors(SrcTy.multiplyElements(2),
                                  {Src1Reg, Undef.getReg(0)})
                 .getReg(0);
  }
  B.buildInstr(MatchInfo.first, {MI.getOperand(0).getReg()}, {DupSrc, Lane});
  MI.eraseFromParent();
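// Editor's sketch of the emitted MIR for a 64-bit source (not from the
// source file):
//   %wide:_(<4 x s32>) = G_CONCAT_VECTORS %src(<2 x s32>), %undef(<2 x s32>)
//   %dst:_(<2 x s32>)  = G_DUPLANE32 %wide, %lane(s64)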
  Register Src1Reg = Unmerge.getReg(Unmerge.getNumOperands() - 1);

  if (SrcTy.getSizeInBits() != 128 && SrcTy.getSizeInBits() != 64)
    return false;

  return SrcTy.isVector() && !SrcTy.isScalable() &&
         Unmerge.getNumOperands() == (unsigned)SrcTy.getNumElements() + 1;

  Register Src1Reg = Unmerge.getReg(Unmerge.getNumOperands() - 1);

  assert((SrcTy.isVector() && !SrcTy.isScalable()) &&
         "Expected a fixed length vector");

  // Replace the unmerge with one extract per element.
  for (int I = 0; I < SrcTy.getNumElements(); ++I)
    B.buildExtractVectorElementConstant(Unmerge.getReg(I), Src1Reg, I);
  MI.eraseFromParent();
  assert(MI.getOpcode() == TargetOpcode::G_BUILD_VECTOR);

  B.setInstrAndDebugLoc(MI);
  B.buildInstr(AArch64::G_DUP, {MI.getOperand(0).getReg()},
               {MI.getOperand(1).getReg()});
  MI.eraseFromParent();
    if (MI.getOpcode() == TargetOpcode::G_SEXT_INREG)
      return true;
    if (MI.getOpcode() != TargetOpcode::G_AND)
      return false;

    // Masks corresponding to zero-extends of 8, 16 and 32 bits.
    return (Mask == 0xFF || Mask == 0xFFFF || Mask == 0xFFFFFFFF);

  if (IsSupportedExtend(*Def))
    return 1;

  unsigned Opc = Def->getOpcode();
  if (Opc != TargetOpcode::G_SHL && Opc != TargetOpcode::G_ASHR &&
      Opc != TargetOpcode::G_LSHR)

  uint64_t ShiftAmt = MaybeShiftAmt->Value.getZExtValue();

  // An extend-plus-shift form can fold both when the shift is small.
  if (IsSupportedExtend(*ShiftLHS))
    return (ShiftAmt <= 4) ? 2 : 1;

  if ((ShiftSize == 32 && ShiftAmt <= 31) ||
      (ShiftSize == 64 && ShiftAmt <= 63))
    return 1;
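// Editor's summary of the scoring: CMP can fold a shift (lsl/asr/lsr) or
// an extend (the and-masks 0xFF/0xFFFF/0xFFFFFFFF, or G_SEXT_INREG) of
// its operand into the instruction. A supported extend scores 1, an
// extend plus a shift of 1..4 scores 2 (the extended-register form), and
// a plain in-range shift scores 1. trySwapICmpOperands compares the two
// sides' scores and swaps the compare (and its predicate) to put the more
// foldable value on the right.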
  assert(MI.getOpcode() == TargetOpcode::G_ICMP);

  // For a CMN, compare against the negated operand instead.
  return isCMN(Def, Pred, MRI) ? Def->getOperand(2).getReg() : Reg;

  MI.getOperand(2).setReg(RHS);
  MI.getOperand(3).setReg(LHS);
  assert(MI.getOpcode() == TargetOpcode::G_FCMP);

  // Only 16-bit (with full fp16), 32-bit and 64-bit elements are supported.
  if (EltSize == 16 && !ST.hasFullFP16())
    return false;
  if (EltSize != 16 && EltSize != 32 && EltSize != 64)
    return false;

  assert(MI.getOpcode() == TargetOpcode::G_FCMP);

  bool Invert = false;

  auto Cmp = getVectorFCMP(CC, LHS, RHS, NoNans, MRI);

  auto Cmp2 = getVectorFCMP(CC2, LHS, RHS, NoNans, MRI);
  auto Cmp2Dst = Cmp2(MIB);
  auto Cmp1Dst = Cmp(MIB);

  MI.eraseFromParent();
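// Editor's note: changeVectorFCMPPredToAArch64CC returns a second
// condition CC2 for predicates with no single NEON encoding, e.g.
// ONE = OGT || OLT, so both compares are materialized and OR'ed; Invert
// handles the unordered predicates (e.g. UNO as the inverse of ORD) by
// negating the combined result.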
  for (unsigned I = 0; I < GBuildVec->getNumSources(); ++I) {
    if (!ConstVal.has_value())

  LLT DstTy = MRI.getType(GBuildVec->getReg(0));
  Register DstReg = B.buildUndef(DstTy).getReg(0);

  for (unsigned I = 0; I < GBuildVec->getNumSources(); ++I) {
    Register SrcReg = GBuildVec->getSourceReg(I);

    DstReg =
        B.buildInsertVectorElement(DstTy, DstReg, SrcReg, IdxReg).getReg(0);
  }

  B.buildCopy(GBuildVec->getReg(0), DstReg);
  GBuildVec->eraseFromParent();
  assert(MI.getOpcode() == TargetOpcode::G_STORE);

  assert(MI.getOpcode() == TargetOpcode::G_STORE);

  MI.getOperand(0).setReg(SrcReg);
  assert(MI.getOpcode() == TargetOpcode::G_SEXT_INREG);

  assert(MI.getOpcode() == TargetOpcode::G_SEXT_INREG);
  B.setInstrAndDebugLoc(MI);

  Helper.lower(MI, 0, LLT());
  if (Unmerge.getNumDefs() != 2)

  if (!LowestVal || LowestVal->Value.getZExtValue() != DstTy.getSizeInBytes())

  MatchInfo = ExtSrc1;

  MI.getOperand(0).setReg(MI.getOperand(1).getReg());
  MI.getOperand(1).setReg(Dst1);
  MI.getOperand(2).setReg(SrcReg);
  assert(MI.getOpcode() == TargetOpcode::G_MUL &&
         "Expected a G_MUL instruction");

  Helper.fewerElementsVector(
class AArch64PostLegalizerLoweringImpl : public Combiner {
protected:
  const CombinerHelper Helper;
  const AArch64PostLegalizerLoweringImplRuleConfig &RuleConfig;
  const AArch64Subtarget &STI;

public:
  AArch64PostLegalizerLoweringImpl(
      MachineFunction &MF, CombinerInfo &CInfo, const TargetPassConfig *TPC,
      GISelCSEInfo *CSEInfo,
      const AArch64PostLegalizerLoweringImplRuleConfig &RuleConfig,
      const AArch64Subtarget &STI);

  static const char *getName() { return "AArch64PostLegalizerLowering"; }

  bool tryCombineAll(MachineInstr &I) const override;

private:
#define GET_GICOMBINER_CLASS_MEMBERS
#include "AArch64GenPostLegalizeGILowering.inc"
#undef GET_GICOMBINER_CLASS_MEMBERS
};

#define GET_GICOMBINER_IMPL
#include "AArch64GenPostLegalizeGILowering.inc"
#undef GET_GICOMBINER_IMPL
AArch64PostLegalizerLoweringImpl::AArch64PostLegalizerLoweringImpl(
    const AArch64PostLegalizerLoweringImplRuleConfig &RuleConfig,
    : Combiner(MF, CInfo, TPC, /*KB=*/nullptr, CSEInfo),
      Helper(Observer, B, /*IsPreLegalize=*/true), RuleConfig(RuleConfig),
#define GET_GICOMBINER_CONSTRUCTOR_INITS
#include "AArch64GenPostLegalizeGILowering.inc"
#undef GET_GICOMBINER_CONSTRUCTOR_INITS
  AArch64PostLegalizerLowering();

  StringRef getPassName() const override {
    return "AArch64PostLegalizerLowering";
  }

  AArch64PostLegalizerLoweringImplRuleConfig RuleConfig;

void AArch64PostLegalizerLowering::getAnalysisUsage(AnalysisUsage &AU) const {

AArch64PostLegalizerLowering::AArch64PostLegalizerLowering()

  if (!RuleConfig.parseCommandLineOption())
    report_fatal_error("Invalid rule identifier");

bool AArch64PostLegalizerLowering::runOnMachineFunction(MachineFunction &MF) {

  auto *TPC = &getAnalysis<TargetPassConfig>();

                     F.hasOptSize(), F.hasMinSize());
  // Lowering combines run once; they are not iterated to a fixed point.
  CInfo.MaxIterations = 1;

  CInfo.EnableFullDCE = false;
  AArch64PostLegalizerLoweringImpl Impl(MF, CInfo, TPC, /*CSEInfo=*/nullptr,

  return Impl.combineMachineInstrs();

char AArch64PostLegalizerLowering::ID = 0;

INITIALIZE_PASS_BEGIN(AArch64PostLegalizerLowering, DEBUG_TYPE,
                      "Lower AArch64 MachineInstrs after legalization", false,
                      false)
INITIALIZE_PASS_DEPENDENCY(TargetPassConfig)
INITIALIZE_PASS_END(AArch64PostLegalizerLowering, DEBUG_TYPE,
                    "Lower AArch64 MachineInstrs after legalization", false,
                    false)

FunctionPass *llvm::createAArch64PostLegalizerLowering() {
  return new AArch64PostLegalizerLowering();
}