51#define GET_GICOMBINER_DEPS
52#include "AArch64GenPostLegalizeGILowering.inc"
53#undef GET_GICOMBINER_DEPS
55#define DEBUG_TYPE "aarch64-postlegalizer-lowering"
61#define GET_GICOMBINER_TYPES
62#include "AArch64GenPostLegalizeGILowering.inc"
63#undef GET_GICOMBINER_TYPES
70struct ShuffleVectorPseudo {
75 std::initializer_list<SrcOp> SrcOps)
76 :
Opc(
Opc), Dst(Dst), SrcOps(SrcOps){};
77 ShuffleVectorPseudo() =
default;
82std::optional<std::pair<bool, uint64_t>> getExtMask(
ArrayRef<int> M,
85 auto FirstRealElt =
find_if(M, [](
int Elt) {
return Elt >= 0; });
86 if (FirstRealElt == M.end())
91 APInt ExpectedElt =
APInt(MaskBits, *FirstRealElt + 1,
false,
true);
97 [&ExpectedElt](
int Elt) { return Elt != ExpectedElt++ && Elt >= 0; }))
107 bool ReverseExt =
false;
119 return std::make_pair(ReverseExt, Imm);
131 int NumInputElements) {
132 if (M.size() !=
static_cast<size_t>(NumInputElements))
134 int NumLHSMatch = 0, NumRHSMatch = 0;
135 int LastLHSMismatch = -1, LastRHSMismatch = -1;
136 for (
int Idx = 0; Idx < NumInputElements; ++Idx) {
142 M[Idx] == Idx ? ++NumLHSMatch : LastLHSMismatch = Idx;
143 M[Idx] == Idx + NumInputElements ? ++NumRHSMatch : LastRHSMismatch = Idx;
145 const int NumNeededToMatch = NumInputElements - 1;
146 if (NumLHSMatch == NumNeededToMatch)
147 return std::make_pair(
true, LastLHSMismatch);
148 if (NumRHSMatch == NumNeededToMatch)
149 return std::make_pair(
false, LastRHSMismatch);
156 ShuffleVectorPseudo &MatchInfo) {
157 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
168 unsigned NumElts = Ty.getNumElements();
171 for (
unsigned LaneSize : {64U, 32U, 16U}) {
172 if (
isREVMask(ShuffleMask, EltSize, NumElts, LaneSize)) {
175 Opcode = AArch64::G_REV64;
176 else if (LaneSize == 32U)
177 Opcode = AArch64::G_REV32;
179 Opcode = AArch64::G_BSWAP;
181 MatchInfo = ShuffleVectorPseudo(Opcode, Dst, {Src});
192 ShuffleVectorPseudo &MatchInfo) {
193 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
194 unsigned WhichResult;
195 unsigned OperandOrder;
199 if (!
isTRNMask(ShuffleMask, NumElts, WhichResult, OperandOrder))
201 unsigned Opc = (WhichResult == 0) ? AArch64::G_TRN1 : AArch64::G_TRN2;
202 Register V1 =
MI.getOperand(OperandOrder == 0 ? 1 : 2).getReg();
203 Register V2 =
MI.getOperand(OperandOrder == 0 ? 2 : 1).getReg();
204 MatchInfo = ShuffleVectorPseudo(
Opc, Dst, {
V1, V2});
214 ShuffleVectorPseudo &MatchInfo) {
215 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
216 unsigned WhichResult;
220 if (!
isUZPMask(ShuffleMask, NumElts, WhichResult))
222 unsigned Opc = (WhichResult == 0) ? AArch64::G_UZP1 : AArch64::G_UZP2;
225 MatchInfo = ShuffleVectorPseudo(
Opc, Dst, {
V1, V2});
230 ShuffleVectorPseudo &MatchInfo) {
231 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
232 unsigned WhichResult;
233 unsigned OperandOrder;
237 if (!
isZIPMask(ShuffleMask, NumElts, WhichResult, OperandOrder))
239 unsigned Opc = (WhichResult == 0) ? AArch64::G_ZIP1 : AArch64::G_ZIP2;
240 Register V1 =
MI.getOperand(OperandOrder == 0 ? 1 : 2).getReg();
241 Register V2 =
MI.getOperand(OperandOrder == 0 ? 2 : 1).getReg();
242 MatchInfo = ShuffleVectorPseudo(
Opc, Dst, {
V1, V2});
249 ShuffleVectorPseudo &MatchInfo) {
268 auto *InsMI =
getOpcodeDef(TargetOpcode::G_INSERT_VECTOR_ELT,
269 MI.getOperand(1).getReg(), MRI);
273 if (!
getOpcodeDef(TargetOpcode::G_IMPLICIT_DEF, InsMI->getOperand(1).getReg(),
281 MatchInfo = ShuffleVectorPseudo(AArch64::G_DUP,
MI.getOperand(0).getReg(),
282 {InsMI->getOperand(2).getReg()});
289 ShuffleVectorPseudo &MatchInfo) {
290 assert(Lane >= 0 &&
"Expected positive lane?");
296 MI.getOperand(Lane < NumElements ? 1 : 2).getReg(), MRI);
298 if (NumElements <= Lane)
303 Register Reg = BuildVecMI->getOperand(Lane + 1).getReg();
305 ShuffleVectorPseudo(AArch64::G_DUP,
MI.getOperand(0).getReg(), {Reg});
310 ShuffleVectorPseudo &MatchInfo) {
311 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
315 int Lane = *MaybeLane;
319 if (matchDupFromInsertVectorElt(Lane,
MI, MRI, MatchInfo))
321 if (matchDupFromBuildVector(Lane,
MI, MRI, MatchInfo))
329 unsigned NumElts = Ty.getNumElements();
338 unsigned ExpectedElt = M[0];
339 for (
unsigned I = 1;
I < NumElts; ++
I) {
343 if (ExpectedElt == NumElts)
348 if (ExpectedElt !=
static_cast<unsigned>(M[
I]))
356 ShuffleVectorPseudo &MatchInfo) {
357 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
362 auto Mask =
MI.getOperand(3).getShuffleMask();
369 !isSingletonExtMask(Mask, DstTy))
372 Imm = Mask[0] * ExtFactor;
373 MatchInfo = ShuffleVectorPseudo(AArch64::G_EXT, Dst, {
V1,
V1, Imm});
377 std::tie(ReverseExt, Imm) = *ExtInfo;
381 MatchInfo = ShuffleVectorPseudo(AArch64::G_EXT, Dst, {
V1, V2, Imm});
388 ShuffleVectorPseudo &MatchInfo) {
390 if (MatchInfo.Opc == TargetOpcode::G_BSWAP) {
391 assert(MatchInfo.SrcOps.size() == 1);
399 auto BS1 = MIRBuilder.
buildInstr(TargetOpcode::G_BITCAST, {BSTy},
400 MatchInfo.SrcOps[0]);
401 auto BS2 = MIRBuilder.
buildInstr(MatchInfo.Opc, {BSTy}, {BS1});
402 MIRBuilder.
buildInstr(TargetOpcode::G_BITCAST, {MatchInfo.Dst}, {BS2});
404 MIRBuilder.
buildInstr(MatchInfo.Opc, {MatchInfo.Dst}, MatchInfo.SrcOps);
405 MI.eraseFromParent();
413 if (MatchInfo.SrcOps[2].getImm() == 0)
414 MIRBuilder.
buildCopy(MatchInfo.Dst, MatchInfo.SrcOps[0]);
418 MatchInfo.SrcOps[2].getImm());
419 MIRBuilder.
buildInstr(MatchInfo.Opc, {MatchInfo.Dst},
420 {MatchInfo.SrcOps[0], MatchInfo.SrcOps[1], Cst});
422 MI.eraseFromParent();
430 "Expected 128bit vector in applyFullRev");
433 auto Rev = MIRBuilder.
buildInstr(AArch64::G_REV64, {DstTy}, {Src});
434 MIRBuilder.
buildInstr(AArch64::G_EXT, {Dst}, {Rev, Rev, Cst});
435 MI.eraseFromParent();
439 assert(
MI.getOpcode() == TargetOpcode::G_INSERT_VECTOR_ELT);
449 Builder.setInstrAndDebugLoc(Insert);
453 LLT EltTy = MRI.
getType(Insert.getElementReg());
454 LLT IdxTy = MRI.
getType(Insert.getIndexReg());
467 auto StackTemp = Builder.buildFrameIndex(FramePtrTy, FrameIdx);
469 Builder.buildStore(Insert.getOperand(1), StackTemp, PtrInfo,
Align(8));
474 "Expected a power-2 vector size");
475 auto Mask = Builder.buildConstant(IdxTy, VecTy.
getNumElements() - 1);
477 auto EltSize = Builder.buildConstant(IdxTy, EltTy.
getSizeInBytes());
480 Builder.buildPtrAdd(MRI.
getType(StackTemp.getReg(0)), StackTemp,
Mul)
484 Builder.buildStore(Insert.getElementReg(), EltPtr, PtrInfo,
Align(1));
486 Builder.buildLoad(Insert.getReg(0), StackTemp, PtrInfo,
Align(8));
487 Insert.eraseFromParent();
502 std::tuple<Register, int, Register, int> &MatchInfo) {
503 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
507 auto DstIsLeftAndDstLane =
isINSMask(ShuffleMask, NumElts);
508 if (!DstIsLeftAndDstLane)
512 std::tie(DstIsLeft, DstLane) = *DstIsLeftAndDstLane;
518 int SrcLane = ShuffleMask[DstLane];
519 if (SrcLane >= NumElts) {
524 MatchInfo = std::make_tuple(DstVec, DstLane, SrcVec, SrcLane);
530 std::tuple<Register, int, Register, int> &MatchInfo) {
531 Builder.setInstrAndDebugLoc(
MI);
535 int DstLane, SrcLane;
536 std::tie(DstVec, DstLane, SrcVec, SrcLane) = MatchInfo;
537 auto SrcCst = Builder.buildConstant(
LLT::integer(64), SrcLane);
538 auto Extract = Builder.buildExtractVectorElement(ScalarTy, SrcVec, SrcCst);
539 auto DstCst = Builder.buildConstant(
LLT::integer(64), DstLane);
540 Builder.buildInsertVectorElement(Dst, DstVec, Extract, DstCst);
541 MI.eraseFromParent();
549 assert(Ty.isVector() &&
"vector shift count is not a vector type");
555 int64_t ElementBits = Ty.getScalarSizeInBits();
556 return Cnt >= 1 && Cnt <= ElementBits;
562 assert(
MI.getOpcode() == TargetOpcode::G_ASHR ||
563 MI.getOpcode() == TargetOpcode::G_LSHR);
572 unsigned Opc =
MI.getOpcode();
573 assert(
Opc == TargetOpcode::G_ASHR ||
Opc == TargetOpcode::G_LSHR);
575 Opc == TargetOpcode::G_ASHR ? AArch64::G_VASHR : AArch64::G_VLSHR;
577 MIB.
buildInstr(NewOpc, {
MI.getOperand(0)}, {
MI.getOperand(1)}).addImm(Imm);
578 MI.eraseFromParent();
635std::optional<std::pair<uint64_t, CmpInst::Predicate>>
641 assert((Ty.getSizeInBits() == 32 || Ty.getSizeInBits() == 64) &&
642 "Expected 32 or 64 bit compare only?");
649 APInt C = ValAndVReg->Value;
671 if (
C.isMinSignedValue())
684 assert(!
C.isZero() &&
"C should not be zero here!");
696 if (
C.isMaxSignedValue())
722 auto NumberOfInstrToLoadImm = [=](
uint64_t Imm) {
728 if (NumberOfInstrToLoadImm(OriginalC) > NumberOfInstrToLoadImm(NewC))
742bool matchAdjustICmpImmAndPred(
744 std::pair<uint64_t, CmpInst::Predicate> &MatchInfo) {
745 assert(
MI.getOpcode() == TargetOpcode::G_ICMP);
749 if (
auto MaybeNewImmAndPred = tryAdjustICmpImmAndPred(
LHS,
RHS, Pred, MRI)) {
750 MatchInfo = *MaybeNewImmAndPred;
756void applyAdjustICmpImmAndPred(
757 MachineInstr &
MI, std::pair<uint64_t, CmpInst::Predicate> &MatchInfo,
765 RHS.setReg(Cst->getOperand(0).getReg());
766 MI.getOperand(1).setPredicate(MatchInfo.second);
771 std::pair<unsigned, int> &MatchInfo) {
772 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
775 const LLT DstTy = MRI.
getType(
MI.getOperand(0).getReg());
782 if (*LaneIdx >= SrcTy.getNumElements())
792 switch (SrcTy.getNumElements()) {
794 if (ScalarSize == 64)
795 Opc = AArch64::G_DUPLANE64;
796 else if (ScalarSize == 32)
797 Opc = AArch64::G_DUPLANE32;
800 if (ScalarSize == 32)
801 Opc = AArch64::G_DUPLANE32;
802 else if (ScalarSize == 16)
803 Opc = AArch64::G_DUPLANE16;
807 Opc = AArch64::G_DUPLANE8;
808 else if (ScalarSize == 16)
809 Opc = AArch64::G_DUPLANE16;
813 Opc = AArch64::G_DUPLANE8;
821 MatchInfo.first =
Opc;
822 MatchInfo.second = *LaneIdx;
828 assert(
MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR);
832 B.setInstrAndDebugLoc(
MI);
833 auto Lane =
B.buildConstant(
LLT::integer(64), MatchInfo.second);
838 if (SrcTy.getSizeInBits() == 64) {
839 auto Undef =
B.buildUndef(SrcTy);
840 DupSrc =
B.buildConcatVectors(SrcTy.multiplyElements(2),
841 {Src1Reg, Undef.getReg(0)})
844 B.buildInstr(MatchInfo.first, {MI.getOperand(0).getReg()}, {DupSrc, Lane});
845 MI.eraseFromParent();
850 Register Src1Reg = Unmerge.getReg(Unmerge.getNumOperands() - 1);
852 if (SrcTy.getSizeInBits() != 128 && SrcTy.getSizeInBits() != 64)
854 return SrcTy.
isVector() && !SrcTy.isScalable() &&
855 (Unmerge.getNumOperands() == (
unsigned)SrcTy.getNumElements() + 1 ||
856 (Unmerge.getNumDefs() == 2 && SrcTy.getSizeInBits() == 128 &&
863 Register Src1Reg = Unmerge.getReg(Unmerge.getNumOperands() - 1);
865 const LLT DstTy = MRI.
getType(Unmerge.getReg(0));
866 assert((SrcTy.isVector() && !SrcTy.isScalable()) &&
867 "Expected a fixed length vector");
870 assert(Unmerge.getNumDefs() == 2);
872 B.buildExtractSubvector(Unmerge.getReg(0), Src1Reg, 0);
874 B.buildExtractSubvector(Unmerge.getReg(1), Src1Reg,
875 SrcTy.getNumElements() / 2);
877 for (
int I = 0;
I < SrcTy.getNumElements(); ++
I)
879 B.buildExtractVectorElementConstant(Unmerge.getReg(
I), Src1Reg,
I);
881 MI.eraseFromParent();
886 assert(
MI.getOpcode() == TargetOpcode::G_BUILD_VECTOR);
898 unsigned NumNonUndef = 0;
905 else if (
Op.getReg() !=
Reg)
911 return Reg && NumNonUndef > 1;
916 B.setInstrAndDebugLoc(
MI);
917 B.buildInstr(AArch64::G_DUP, {
MI.getOperand(0).getReg()}, {Src});
918 MI.eraseFromParent();
927 if (
MI.getOpcode() == TargetOpcode::G_SEXT_INREG)
929 if (
MI.getOpcode() == TargetOpcode::G_AND) {
933 uint64_t Mask = ValAndVReg->Value.getZExtValue();
934 return (Mask == 0xFF || Mask == 0xFFFF || Mask == 0xFFFFFFFF);
945 if (IsSupportedExtend(*Def))
948 unsigned Opc = Def->getOpcode();
949 if (
Opc == TargetOpcode::G_SHL ||
Opc == TargetOpcode::G_LSHR ||
950 Opc == TargetOpcode::G_ASHR) {
954 uint64_t ShiftAmt = MaybeShiftAmt->Value.getZExtValue();
957 if (IsSupportedExtend(*ShiftLHS))
958 return (ShiftAmt <= 4) ? 2 : 1;
959 LLT Ty = MRI.
getType(Def->getOperand(0).getReg());
963 if ((ShiftSize == 32 && ShiftAmt <= 31) ||
964 (ShiftSize == 64 && ShiftAmt <= 63))
975 assert(
MI.getOpcode() == TargetOpcode::G_ICMP);
996 return isCMN(Def, Pred, MRI) ? Def->getOperand(2).getReg() :
Reg;
1016 MI.getOperand(2).setReg(
RHS);
1017 MI.getOperand(3).setReg(
LHS);
1065 assert(
MI.getOpcode() == TargetOpcode::G_FCMP);
1070 if (!DstTy.
isVector() || !ST.hasNEON())
1074 if (EltSize == 16 && !ST.hasFullFP16())
1076 if (EltSize != 16 && EltSize != 32 && EltSize != 64)
1085 assert(
MI.getOpcode() == TargetOpcode::G_FCMP);
1096 bool Invert =
false;
1117 auto Cmp = getVectorFCMP(CC,
LHS,
RHS, NoNans, MRI);
1122 auto Cmp2 = getVectorFCMP(CC2,
LHS,
RHS, NoNans, MRI);
1123 auto Cmp2Dst = Cmp2(MIB);
1124 auto Cmp1Dst = Cmp(MIB);
1130 MI.eraseFromParent();
1138 for (
unsigned I = 0;
I < GBuildVec->getNumSources(); ++
I) {
1142 if (!ConstVal.has_value())
1152 LLT DstTy = MRI.
getType(GBuildVec->getReg(0));
1153 Register DstReg =
B.buildUndef(DstTy).getReg(0);
1155 for (
unsigned I = 0;
I < GBuildVec->getNumSources(); ++
I) {
1156 Register SrcReg = GBuildVec->getSourceReg(
I);
1161 B.buildInsertVectorElement(DstTy, DstReg, SrcReg, IdxReg).getReg(0);
1163 B.buildCopy(GBuildVec->getReg(0), DstReg);
1164 GBuildVec->eraseFromParent();
1169 assert(
MI.getOpcode() == TargetOpcode::G_STORE);
1183 assert(
MI.getOpcode() == TargetOpcode::G_STORE);
1185 MI.getOperand(0).setReg(SrcReg);
1193 assert(
MI.getOpcode() == TargetOpcode::G_SEXT_INREG);
1201 assert(
MI.getOpcode() == TargetOpcode::G_SEXT_INREG);
1202 B.setInstrAndDebugLoc(
MI);
1212 if (Unmerge.getNumDefs() != 2)
1229 if (!LowestVal || LowestVal->Value.getZExtValue() != DstTy.
getSizeInBytes())
1235 MatchInfo = ExtSrc1;
1245 MI.getOperand(0).setReg(
MI.getOperand(1).getReg());
1246 MI.getOperand(1).setReg(Dst1);
1247 MI.getOperand(2).setReg(SrcReg);
1264 assert(
MI.getOpcode() == TargetOpcode::G_MUL &&
1265 "Expected a G_MUL instruction");
1276class AArch64PostLegalizerLoweringImpl :
public Combiner {
1279 const AArch64PostLegalizerLoweringImplRuleConfig &RuleConfig;
1283 AArch64PostLegalizerLoweringImpl(
1285 const AArch64PostLegalizerLoweringImplRuleConfig &RuleConfig,
1288 static const char *
getName() {
return "AArch6400PreLegalizerCombiner"; }
1293#define GET_GICOMBINER_CLASS_MEMBERS
1294#include "AArch64GenPostLegalizeGILowering.inc"
1295#undef GET_GICOMBINER_CLASS_MEMBERS
1298#define GET_GICOMBINER_IMPL
1299#include "AArch64GenPostLegalizeGILowering.inc"
1300#undef GET_GICOMBINER_IMPL
1302AArch64PostLegalizerLoweringImpl::AArch64PostLegalizerLoweringImpl(
1304 const AArch64PostLegalizerLoweringImplRuleConfig &RuleConfig,
1306 :
Combiner(MF, CInfo, nullptr, CSEInfo),
1307 Helper(Observer,
B,
true), RuleConfig(RuleConfig),
1310#include
"AArch64GenPostLegalizeGILowering.inc"
1315bool runPostLegalizerLowering(
1317 const AArch64PostLegalizerLoweringImplRuleConfig &RuleConfig) {
1325 F.hasOptSize(),
F.hasMinSize());
1327 CInfo.MaxIterations = 1;
1330 CInfo.EnableFullDCE =
false;
1331 AArch64PostLegalizerLoweringImpl Impl(MF, CInfo,
nullptr,
1333 return Impl.combineMachineInstrs();
1340 AArch64PostLegalizerLoweringLegacy();
1342 StringRef getPassName()
const override {
1343 return "AArch64PostLegalizerLowering";
1346 bool runOnMachineFunction(MachineFunction &MF)
override;
1347 void getAnalysisUsage(AnalysisUsage &AU)
const override;
1350 AArch64PostLegalizerLoweringImplRuleConfig RuleConfig;
1354void AArch64PostLegalizerLoweringLegacy::getAnalysisUsage(
1361AArch64PostLegalizerLoweringLegacy::AArch64PostLegalizerLoweringLegacy()
1362 : MachineFunctionPass(
ID) {
1363 if (!RuleConfig.parseCommandLineOption())
1367bool AArch64PostLegalizerLoweringLegacy::runOnMachineFunction(
1370 return runPostLegalizerLowering(MF, RuleConfig);
1373char AArch64PostLegalizerLoweringLegacy::ID = 0;
1375 "Lower AArch64 MachineInstrs after legalization",
false,
1378 "Lower AArch64 MachineInstrs after legalization",
false,
1383 std::make_unique<AArch64PostLegalizerLoweringImplRuleConfig>()) {
1384 if (!RuleConfig->parseCommandLineOption())
1397 const bool Changed = runPostLegalizerLowering(MF, *RuleConfig);
1409 return new AArch64PostLegalizerLoweringLegacy();
static bool isVShiftRImm(SDValue Op, EVT VT, bool isNarrow, int64_t &Cnt)
isVShiftRImm - Check if this is a valid build_vector for the immediate operand of a vector shift righ...
static bool isINSMask(ArrayRef< int > M, int NumInputElements, bool &DstIsLeft, int &Anomaly)
static unsigned getCmpOperandFoldingProfit(SDValue Op, bool AllowExtend)
Returns how profitable it is to fold a comparison's operand's shift and/or extension operations.
static bool shouldBeAdjustedToZero(SDValue LHS, const APInt &C, ISD::CondCode &CC)
This file declares the targeting of the Machinelegalizer class for AArch64.
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
#define GET_GICOMBINER_CONSTRUCTOR_INITS
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
This contains common combine transformations that may be used in a combine pass,or by the target else...
Option class for Targets to specify which operations are combined how and when.
This contains the base class for all Combiners generated by TableGen.
This contains common code to allow clients to notify changes to machine instr.
Declares convenience wrapper classes for interpreting MachineInstr instances as specific generic oper...
Contains matchers for matching SSA Machine Instructions.
This file declares the MachineIRBuilder class.
Promote Memory to Register
static MCRegister getReg(const MCDisassembler *D, unsigned RC, unsigned RegNo)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
static StringRef getName(Value *V)
PreservedAnalyses run(MachineFunction &MF, MachineFunctionAnalysisManager &MFAM)
~AArch64PostLegalizerLoweringPass()
AArch64PostLegalizerLoweringPass()
Class for arbitrary precision integers.
uint64_t getZExtValue() const
Get zero extended value.
unsigned logBase2() const
Represent the analysis usage information of a pass.
LLVM_ABI void setPreservesCFG()
This function should be called by the pass, iff they do not:
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Represents analyses that only rely on functions' control flow.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
@ ICMP_SLT
signed less than
@ ICMP_SLE
signed less or equal
@ ICMP_UGE
unsigned greater or equal
@ ICMP_UGT
unsigned greater than
@ ICMP_SGT
signed greater than
@ ICMP_ULT
unsigned less than
@ FCMP_ORD
0 1 1 1 True if ordered (no nans)
@ ICMP_SGE
signed greater or equal
@ ICMP_ULE
unsigned less or equal
@ FCMP_UNO
1 0 0 0 True if unordered: isnan(X) | isnan(Y)
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
FunctionPass class - This class is used to implement most global optimizations.
Abstract class that contains various methods for clients to notify about changes.
virtual void changingInstr(MachineInstr &MI)=0
This instruction is about to be mutated in some way.
virtual void changedInstr(MachineInstr &MI)=0
This instruction was mutated in some way.
LLT changeElementCount(ElementCount EC) const
Return a vector or scalar with the same element type and the new element count.
constexpr bool isScalableVector() const
Returns true if the LLT is a scalable vector.
constexpr unsigned getScalarSizeInBits() const
constexpr uint16_t getNumElements() const
Returns the number of elements in a vector LLT.
constexpr bool isVector() const
static constexpr LLT pointer(unsigned AddressSpace, unsigned SizeInBits)
Get a low-level pointer in the given address space.
constexpr TypeSize getSizeInBits() const
Returns the total size of the type. Must only be called on sized types.
constexpr ElementCount getElementCount() const
static constexpr LLT fixed_vector(unsigned NumElements, unsigned ScalarSizeInBits)
Get a low-level fixed-width vector of some number of elements and element width.
static LLT integer(unsigned SizeInBits)
constexpr TypeSize getSizeInBytes() const
Returns the total size of the type in bytes, i.e.
LLT getElementType() const
Returns the vector's element type. Only valid for vector types.
LLVM_ABI LegalizeResult lower(MachineInstr &MI, unsigned TypeIdx, LLT Ty)
Legalize an instruction by splitting it into simpler parts, hopefully understood by the target.
LLVM_ABI LegalizeResult fewerElementsVector(MachineInstr &MI, unsigned TypeIdx, LLT NarrowTy)
Legalize a vector instruction by splitting into multiple components, each acting on the same scalar t...
An RAII based helper class to modify MachineFunctionProperties when running pass.
LLVM_ABI int CreateStackObject(uint64_t Size, Align Alignment, bool isSpillSlot, const AllocaInst *Alloca=nullptr, uint8_t ID=0)
Create a new statically sized stack object, returning a nonnegative identifier to represent it.
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
Function & getFunction()
Return the LLVM function that this machine code represents.
const MachineFunctionProperties & getProperties() const
Get the function properties.
Helper class to build MachineInstr.
MachineInstrBuilder buildNot(const DstOp &Dst, const SrcOp &Src0)
Build and insert a bitwise not, NegOne = G_CONSTANT -1 Res = G_OR Op0, NegOne.
MachineInstrBuilder buildInstr(unsigned Opcode)
Build and insert <empty> = Opcode <empty>.
void setInstrAndDebugLoc(MachineInstr &MI)
Set the insertion point to before MI, and set the debug loc to MI's loc.
MachineRegisterInfo * getMRI()
Getter for MRI.
MachineInstrBuilder buildOr(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_OR Op0, Op1.
MachineInstrBuilder buildCopy(const DstOp &Res, const SrcOp &Op)
Build and insert Res = COPY Op.
virtual MachineInstrBuilder buildConstant(const DstOp &Res, const ConstantInt &Val)
Build and insert Res = G_CONSTANT Val.
Register getReg(unsigned Idx) const
Get the register for the operand index.
Representation of each machine instruction.
const MachineOperand & getOperand(unsigned i) const
MachineOperand class - Representation of each machine instruction operand.
Register getReg() const
getReg - Returns the register number.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLVM_ABI bool hasOneNonDBGUse(Register RegNo) const
hasOneNonDBGUse - Return true if there is exactly one non-Debug use of the specified register.
LLVM_ABI MachineInstr * getVRegDef(Register Reg) const
getVRegDef - Return the machine instr that defines the specified virtual register or null if none is ...
bool use_nodbg_empty(Register RegNo) const
use_nodbg_empty - Return true if there are no non-Debug instructions using the specified register.
LLT getType(Register Reg) const
Get the low-level type of Reg or LLT{} if Reg is not a generic (target independent) virtual register.
LLVM_ABI Register cloneVirtualRegister(Register VReg, StringRef Name="")
Create and return a new virtual register in the function with the same attributes as the given regist...
LLVM_ABI void replaceRegWith(Register FromReg, Register ToReg)
replaceRegWith - Replace all instances of FromReg with ToReg in the machine function.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
PreservedAnalyses & preserveSet()
Mark an analysis set as preserved.
Wrapper class representing virtual and physical registers.
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
constexpr LeafTy divideCoefficientBy(ScalarTy RHS) const
We do not provide the '/' operator here because division for polynomial types does not work in the sa...
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
void changeVectorFCMPPredToAArch64CC(const CmpInst::Predicate P, AArch64CC::CondCode &CondCode, AArch64CC::CondCode &CondCode2, bool &Invert)
Find the AArch64 condition codes necessary to represent P for a vector floating point comparison.
bool isCMN(const MachineInstr *MaybeSub, const CmpInst::Predicate &Pred, const MachineRegisterInfo &MRI)
std::optional< int64_t > getAArch64VectorSplatScalar(const MachineInstr &MI, const MachineRegisterInfo &MRI)
static bool isLegalCmpImmed(const APInt &C)
isLegalCmpImmed -
void expandMOVImm(uint64_t Imm, unsigned BitSize, SmallVectorImpl< ImmInsnModel > &Insn)
Expand a MOVi32imm or MOVi64imm pseudo instruction to one or more real move-immediate instructions to...
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
@ C
The default llvm calling convention, compatible with C.
operand_type_match m_Reg()
SpecificConstantMatch m_ZeroInt()
Convenience matchers for specific integer values.
ImplicitDefMatch m_GImplicitDef()
bool mi_match(Reg R, const MachineRegisterInfo &MRI, Pattern &&P)
UnaryOp_match< SrcTy, TargetOpcode::G_TRUNC > m_GTrunc(const SrcTy &Src)
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
LLVM_ABI bool isBuildVectorAllZeros(const MachineInstr &MI, const MachineRegisterInfo &MRI, bool AllowUndef=false)
Return true if the specified instruction is a G_BUILD_VECTOR or G_BUILD_VECTOR_TRUNC where all of the...
LLVM_ABI MachineInstr * getOpcodeDef(unsigned Opcode, Register Reg, const MachineRegisterInfo &MRI)
See if Reg is defined by an single def instruction that is Opcode.
bool isZIPMask(ArrayRef< int > M, unsigned NumElts, unsigned &WhichResultOut, unsigned &OperandOrderOut)
Return true for zip1 or zip2 masks of the form: <0, 8, 1, 9, 2, 10, 3, 11> (WhichResultOut = 0,...
@ Undef
Value of the register doesn't matter.
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
AnalysisManager< MachineFunction > MachineFunctionAnalysisManager
LLVM_ABI MachineInstr * getDefIgnoringCopies(Register Reg, const MachineRegisterInfo &MRI)
Find the def instruction for Reg, folding away any trivial copies.
LLVM_ABI PreservedAnalyses getMachineFunctionPassPreservedAnalyses()
Returns the minimum set of Analyses that all machine function passes must preserve.
FunctionPass * createAArch64PostLegalizerLowering()
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
bool isUZPMask(ArrayRef< int > M, unsigned NumElts, unsigned &WhichResultOut)
Return true for uzp1 or uzp2 masks of the form: <0, 2, 4, 6, 8, 10, 12, 14> or <1,...
bool isREVMask(ArrayRef< int > M, unsigned EltSize, unsigned NumElts, unsigned BlockSize)
isREVMask - Check if a vector shuffle corresponds to a REV instruction with the specified blocksize.
LLVM_ABI std::optional< ValueAndVReg > getAnyConstantVRegValWithLookThrough(Register VReg, const MachineRegisterInfo &MRI, bool LookThroughInstrs=true, bool LookThroughAnyExt=false)
If VReg is defined by a statically evaluable chain of instructions rooted on a G_CONSTANT or G_FCONST...
LLVM_ABI bool isBuildVectorAllOnes(const MachineInstr &MI, const MachineRegisterInfo &MRI, bool AllowUndef=false)
Return true if the specified instruction is a G_BUILD_VECTOR or G_BUILD_VECTOR_TRUNC where all of the...
LLVM_ABI void getSelectionDAGFallbackAnalysisUsage(AnalysisUsage &AU)
Modify analysis usage so it preserves passes required for the SelectionDAG fallback.
DWARFExpression::Operation Op
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
LLVM_ABI std::optional< ValueAndVReg > getIConstantVRegValWithLookThrough(Register VReg, const MachineRegisterInfo &MRI, bool LookThroughInstrs=true)
If VReg is defined by a statically evaluable chain of instructions rooted on a G_CONSTANT returns its...
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
bool isTRNMask(ArrayRef< int > M, unsigned NumElts, unsigned &WhichResultOut, unsigned &OperandOrderOut)
Return true for trn1 or trn2 masks of the form: <0, 8, 2, 10, 4, 12, 6, 14> (WhichResultOut = 0,...
LLVM_ABI int getSplatIndex(ArrayRef< int > Mask)
If all non-negative Mask elements are the same value, return that value.
LLVM_ABI void reportFatalUsageError(Error Err)
Report a fatal error that does not indicate a bug in LLVM.
Implement std::hash so that hash_code can be used in STL containers.
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
This struct is a compact representation of a valid (non-zero power of two) alignment.
@ SinglePass
Enables Observer-based DCE and additional heuristics that retry combining defined and used instructio...
This class contains a discriminated union of information about pointers in memory operands,...
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.