53#define DEBUG_TYPE "loop-utils"
71 "Must start with an empty predecessors list!");
76 bool IsDedicatedExit =
true;
78 if (L->contains(PredBB)) {
85 IsDedicatedExit =
false;
88 assert(!InLoopPredecessors.
empty() &&
"Must have *some* loop predecessor!");
95 BB, InLoopPredecessors,
".loopexit", DT, LI, MSSAU, PreserveLCSSA);
99 dbgs() <<
"WARNING: Can't create a dedicated exit block for loop: "
102 LLVM_DEBUG(
dbgs() <<
"LoopSimplify: Creating dedicated exit block "
103 << NewExitBB->getName() <<
"\n");
110 for (
auto *BB : L->blocks())
113 if (L->contains(SuccBB))
117 if (!Visited.
insert(SuccBB).second)
120 Changed |= RewriteExit(SuccBB);
130 for (
auto *
Block : L->getBlocks())
133 for (
auto &Inst : *
Block) {
134 auto Users = Inst.users();
137 return !L->contains(
Use->getParent());
224 for (
unsigned i = 1, ie = LoopID->
getNumOperands(); i < ie; ++i) {
227 if (
Node->getNumOperands() == 2) {
253std::optional<ElementCount>
255 std::optional<int> Width =
260 TheLoop,
"llvm.loop.vectorize.scalable.enable");
269 const char *InheritOptionsExceptPrefix,
bool AlwaysNew) {
278 bool InheritAllAttrs = !InheritOptionsExceptPrefix;
279 bool InheritSomeAttrs =
280 InheritOptionsExceptPrefix && InheritOptionsExceptPrefix[0] !=
'\0';
285 if (InheritAllAttrs || InheritSomeAttrs) {
289 auto InheritThisAttribute = [InheritSomeAttrs,
290 InheritOptionsExceptPrefix](
MDNode *
Op) {
291 if (!InheritSomeAttrs)
295 if (
Op->getNumOperands() == 0)
303 return !AttrName.
starts_with(InheritOptionsExceptPrefix);
306 if (InheritThisAttribute(
Op))
316 bool HasAnyFollowup =
false;
317 for (
StringRef OptionName : FollowupOptions) {
322 HasAnyFollowup =
true;
331 if (!AlwaysNew && !HasAnyFollowup)
345 return FollowupLoopID;
359 if (IsVectorBody && IsEpilogue)
360 return "vectorized epilogue ";
362 return "vectorized ";
372 std::optional<int>
Count =
393 std::optional<int>
Count =
408 std::optional<bool>
Enable =
414 std::optional<ElementCount> VectorizeWidth =
416 std::optional<int> InterleaveCount =
421 if (
Enable ==
true && VectorizeWidth && VectorizeWidth->isScalar() &&
422 InterleaveCount == 1)
431 if ((VectorizeWidth && VectorizeWidth->isScalar()) && InterleaveCount == 1)
434 if ((VectorizeWidth && VectorizeWidth->isVector()) || InterleaveCount > 1)
467 const Loop *CurLoop) {
476 AddRegionToWorklist(
N);
478 for (
size_t I = 0;
I < Worklist.
size();
I++) {
480 AddRegionToWorklist(Child);
488 assert(LatchIdx != -1 &&
"LatchBlock is not a case in this PHINode");
492 if (U !=
Cond && U != IncV)
return false;
495 if (U !=
Cond && U != PN)
return false;
502 assert((!DT || L->isLCSSAForm(*DT)) &&
"Expected LCSSA!");
503 auto *Preheader = L->getLoopPreheader();
504 assert(Preheader &&
"Preheader should exist!");
506 std::unique_ptr<MemorySSAUpdater> MSSAU;
508 MSSAU = std::make_unique<MemorySSAUpdater>(MSSA);
526 "Preheader must end with a side-effect-free terminator");
528 "Preheader must have a single successor");
556 auto *ExitBlock = L->getUniqueExitBlock();
559 assert(ExitBlock &&
"Should have a unique exit block!");
560 assert(L->hasDedicatedExits() &&
"Loop should have dedicated exits!");
562 Builder.CreateCondBr(Builder.getFalse(), L->getHeader(), ExitBlock);
568 for (
PHINode &
P : ExitBlock->phis()) {
573 P.setIncomingBlock(PredIndex, Preheader);
577 P.removeIncomingValueIf([](
unsigned Idx) {
return Idx != 0; },
580 assert((
P.getNumIncomingValues() == 1 &&
581 P.getIncomingBlock(PredIndex) == Preheader) &&
582 "Should have exactly one value and that's from the preheader!");
596 Builder.SetInsertPoint(Preheader->getTerminator());
597 Builder.CreateBr(ExitBlock);
599 Preheader->getTerminator()->eraseFromParent();
601 assert(L->hasNoExitBlocks() &&
602 "Loop should have either zero or one exit blocks.");
604 Builder.SetInsertPoint(OldTerm);
605 Builder.CreateUnreachable();
606 Preheader->getTerminator()->eraseFromParent();
616 MSSAU->removeBlocks(DeadBlockSet);
634 for (
auto *
Block : L->blocks())
639 if (L->contains(Usr->getParent()))
645 "Unexpected user in reachable block");
656 DVR.getDebugLoc().get());
660 DVR.removeFromParent();
675 ExitBlock->getFirstInsertionPt();
676 assert(InsertDbgValueBefore != ExitBlock->end() &&
677 "There should be a non-PHI instruction in exit block, else these "
678 "instructions will have no parent.");
685 ExitBlock->insertDbgRecordBefore(DVR, InsertDbgValueBefore);
690 for (
auto *
Block : L->blocks())
691 Block->dropAllReferences();
705 BB->eraseFromParent();
712 if (
Loop *ParentLoop = L->getParentLoop()) {
714 assert(
I != ParentLoop->end() &&
"Couldn't find loop");
715 ParentLoop->removeChildLoop(
I);
718 assert(
I != LI->
end() &&
"Couldn't find loop");
727 auto *Latch = L->getLoopLatch();
728 assert(Latch &&
"multiple latches not yet supported");
729 auto *Header = L->getHeader();
730 Loop *OutermostLoop = L->getOutermostLoop();
735 std::unique_ptr<MemorySSAUpdater> MSSAU;
737 MSSAU = std::make_unique<MemorySSAUpdater>(MSSA);
750 if (L->isLoopExiting(Latch)) {
755 const unsigned ExitIdx = L->contains(BI->getSuccessor(0)) ? 1 : 0;
756 BasicBlock *ExitBB = BI->getSuccessor(ExitIdx);
759 Header->removePredecessor(Latch,
true);
762 auto *NewBI = Builder.CreateBr(ExitBB);
765 NewBI->copyMetadata(*BI, {LLVMContext::MD_dbg,
766 LLVMContext::MD_annotation});
768 BI->eraseFromParent();
779 auto *BackedgeBB =
SplitEdge(Latch, Header, &DT, &LI, MSSAU.get());
783 true, &DTU, MSSAU.get());
795 if (OutermostLoop != L)
809 if (!LatchBR || !L->isLoopExiting(Latch))
814 "At least one edge out of the latch must go to the header");
827 D.L->getHeader()->getParent()->printAsOperand(OS,
false);
828 return OS <<
" " << *
D.L;
838 if (!ExitingBranch) {
839 LLVM_DEBUG(
dbgs() <<
"estimateLoopTripCount: Failed to find exiting "
840 <<
"latch branch of required form in " <<
DbgLoop(L)
850 LLVM_DEBUG(
dbgs() <<
"estimateLoopTripCount: Failed to extract branch "
851 <<
"weights for " <<
DbgLoop(L) <<
"\n");
860 LLVM_DEBUG(
dbgs() <<
"estimateLoopTripCount: Failed because of zero exit "
861 <<
"probability for " <<
DbgLoop(L) <<
"\n");
870 if (ExitCount >= std::numeric_limits<unsigned>::max())
871 return std::numeric_limits<unsigned>::max();
875 LLVM_DEBUG(
dbgs() <<
"estimateLoopTripCount: Estimated trip count of " << TC
876 <<
" for " <<
DbgLoop(L) <<
"\n");
880std::optional<unsigned>
882 unsigned *EstimatedLoopInvocationWeight) {
915 if (EstimatedLoopInvocationWeight) {
916 uint64_t LoopWeight = 0, ExitWeight = 0;
923 *EstimatedLoopInvocationWeight = ExitWeight;
941 if (std::optional<unsigned> TC =
945 <<
"count of " << *TC
946 << (*TC == 0 ?
" (returning std::nullopt)" :
"")
947 <<
" for " <<
DbgLoop(L) <<
"\n");
948 return *TC == 0 ? std::nullopt : TC;
956 Loop *L,
unsigned EstimatedTripCount,
957 std::optional<unsigned> EstimatedloopInvocationWeight) {
977 if (!EstimatedloopInvocationWeight)
982 unsigned BackedgeTakenWeight = 0;
984 if (EstimatedTripCount != 0) {
985 LatchExitWeight = *EstimatedloopInvocationWeight;
986 BackedgeTakenWeight = (EstimatedTripCount - 1) * LatchExitWeight;
991 std::swap(BackedgeTakenWeight, LatchExitWeight);
1004 bool FirstTargetIsLoop = LatchBranch->
getSuccessor(0) == L->getHeader();
1012 bool FirstTargetIsLoop = LatchBranch->
getSuccessor(0) == L->getHeader();
1018 bool ForFirstTarget) {
1022 uint64_t Denominator = Weight0 + Weight1;
1023 if (Denominator == 0)
1025 if (!ForFirstTarget)
1031 assert(Src != Dst &&
"Passed in same source as destination");
1044 "Missing weights in branch_weights");
1050 Numerator += Weight;
1058 if (
Total == 0 ||
Total > std::numeric_limits<uint32_t>::max())
1065 bool ForFirstTarget) {
1068 if (!ForFirstTarget)
1082 const SCEV *InnerLoopBECountSC = SE.
getExitCount(InnerLoop, InnerLoopLatch);
1103 return Intrinsic::vector_reduce_add;
1105 return Intrinsic::vector_reduce_mul;
1107 return Intrinsic::vector_reduce_and;
1109 return Intrinsic::vector_reduce_or;
1111 return Intrinsic::vector_reduce_xor;
1116 return Intrinsic::vector_reduce_fadd;
1118 return Intrinsic::vector_reduce_fmul;
1120 return Intrinsic::vector_reduce_smax;
1122 return Intrinsic::vector_reduce_smin;
1124 return Intrinsic::vector_reduce_umax;
1126 return Intrinsic::vector_reduce_umin;
1129 return Intrinsic::vector_reduce_fmax;
1132 return Intrinsic::vector_reduce_fmin;
1134 return Intrinsic::vector_reduce_fmaximum;
1136 return Intrinsic::vector_reduce_fminimum;
1138 return Intrinsic::vector_reduce_fmax;
1140 return Intrinsic::vector_reduce_fmin;
1148 case Intrinsic::umin:
1149 return Intrinsic::vector_reduce_umin;
1150 case Intrinsic::umax:
1151 return Intrinsic::vector_reduce_umax;
1152 case Intrinsic::smin:
1153 return Intrinsic::vector_reduce_smin;
1154 case Intrinsic::smax:
1155 return Intrinsic::vector_reduce_smax;
1162 case Intrinsic::vector_reduce_fadd:
1163 return Instruction::FAdd;
1164 case Intrinsic::vector_reduce_fmul:
1165 return Instruction::FMul;
1166 case Intrinsic::vector_reduce_add:
1167 return Instruction::Add;
1168 case Intrinsic::vector_reduce_mul:
1169 return Instruction::Mul;
1170 case Intrinsic::vector_reduce_and:
1171 return Instruction::And;
1172 case Intrinsic::vector_reduce_or:
1173 return Instruction::Or;
1174 case Intrinsic::vector_reduce_xor:
1175 return Instruction::Xor;
1176 case Intrinsic::vector_reduce_smax:
1177 case Intrinsic::vector_reduce_smin:
1178 case Intrinsic::vector_reduce_umax:
1179 case Intrinsic::vector_reduce_umin:
1180 return Instruction::ICmp;
1181 case Intrinsic::vector_reduce_fmax:
1182 case Intrinsic::vector_reduce_fmin:
1183 return Instruction::FCmp;
1194 case Instruction::Add:
1195 return Intrinsic::vector_reduce_add;
1196 case Instruction::Mul:
1197 return Intrinsic::vector_reduce_mul;
1198 case Instruction::And:
1199 return Intrinsic::vector_reduce_and;
1200 case Instruction::Or:
1201 return Intrinsic::vector_reduce_or;
1202 case Instruction::Xor:
1203 return Intrinsic::vector_reduce_xor;
1204 case Instruction::FAdd:
1205 return Intrinsic::vector_reduce_fadd;
1206 case Instruction::FMul:
1207 return Intrinsic::vector_reduce_fmul;
1216 case Intrinsic::vector_reduce_umin:
1217 return Intrinsic::umin;
1218 case Intrinsic::vector_reduce_umax:
1219 return Intrinsic::umax;
1220 case Intrinsic::vector_reduce_smin:
1221 return Intrinsic::smin;
1222 case Intrinsic::vector_reduce_smax:
1223 return Intrinsic::smax;
1224 case Intrinsic::vector_reduce_fmin:
1225 return Intrinsic::minnum;
1226 case Intrinsic::vector_reduce_fmax:
1227 return Intrinsic::maxnum;
1228 case Intrinsic::vector_reduce_fminimum:
1229 return Intrinsic::minimum;
1230 case Intrinsic::vector_reduce_fmaximum:
1231 return Intrinsic::maximum;
1240 return Intrinsic::umin;
1242 return Intrinsic::umax;
1244 return Intrinsic::smin;
1246 return Intrinsic::smax;
1249 return Intrinsic::minnum;
1252 return Intrinsic::maxnum;
1254 return Intrinsic::minimum;
1256 return Intrinsic::maximum;
1258 return Intrinsic::minimumnum;
1260 return Intrinsic::maximumnum;
1266 case Intrinsic::vector_reduce_smax:
1268 case Intrinsic::vector_reduce_smin:
1270 case Intrinsic::vector_reduce_umax:
1272 case Intrinsic::vector_reduce_umin:
1274 case Intrinsic::vector_reduce_fmax:
1276 case Intrinsic::vector_reduce_fmin:
1308 if (Ty->isIntOrIntVectorTy() ||
1313 return Builder.CreateIntrinsic(Ty, Id, {
Left,
Right},
nullptr,
1317 Value *Cmp = Builder.CreateCmp(Pred,
Left,
Right,
"rdx.minmax.cmp");
1333 Value *Result = Acc;
1334 for (
unsigned ExtractIdx = 0; ExtractIdx != VF; ++ExtractIdx) {
1336 Builder.CreateExtractElement(Src, Builder.getInt32(ExtractIdx));
1338 if (
Op != Instruction::ICmp &&
Op != Instruction::FCmp) {
1352 unsigned RdxOpcode,
Value *Acc,
1355 Type *EltTy = VTy->getElementType();
1356 Function *
F = Builder.GetInsertBlock()->getParent();
1360 unsigned MinElts = VTy->getElementCount().getKnownMinValue();
1361 Value *NumElts = Builder.CreateVScale(IdxTy);
1362 NumElts = Builder.CreateMul(NumElts, ConstantInt::get(IdxTy, MinElts));
1364 BasicBlock *EntryBB = Builder.GetInsertBlock();
1367 nullptr,
"rdx.exit");
1370 Builder.SetInsertPoint(EntryBB);
1371 Builder.CreateBr(LoopBB);
1373 Builder.SetInsertPoint(LoopBB);
1374 PHINode *
IV = Builder.CreatePHI(IdxTy, 2,
"rdx.iv");
1375 PHINode *AccPhi = Builder.CreatePHI(EltTy, 2,
"rdx.acc");
1376 IV->addIncoming(ConstantInt::get(IdxTy, 0), EntryBB);
1379 Value *Elt = Builder.CreateExtractElement(Vec,
IV);
1384 Builder.CreateNUWAdd(
IV, ConstantInt::get(IdxTy, 1),
"rdx.next");
1385 IV->addIncoming(NextIV, LoopBB);
1388 Value *
Done = Builder.CreateICmpEQ(NextIV, NumElts,
"rdx.done");
1389 Builder.CreateCondBr(
Done, ExitBB, LoopBB);
1408 Builder.SetInsertPoint(ExitBB, ExitBB->
begin());
1422 "Reduction emission only supported for pow2 vectors!");
1430 auto BuildShuffledOp = [&Builder, &
Op,
1432 Value *&TmpVec) ->
void {
1433 Value *Shuf = Builder.CreateShuffleVector(TmpVec, ShuffleMask,
"rdx.shuf");
1434 if (
Op != Instruction::ICmp &&
Op != Instruction::FCmp) {
1444 Value *TmpVec = Src;
1447 for (
unsigned stride = 1; stride < VF; stride <<= 1) {
1450 for (
unsigned j = 0; j < VF; j += stride << 1) {
1451 ShuffleMask[j] = j + stride;
1453 BuildShuffledOp(ShuffleMask, TmpVec);
1457 for (
unsigned i = VF; i != 1; i >>= 1) {
1459 for (
unsigned j = 0; j != i / 2; ++j)
1460 ShuffleMask[j] = i / 2 + j;
1463 std::fill(&ShuffleMask[i / 2], ShuffleMask.end(), -1);
1464 BuildShuffledOp(ShuffleMask, TmpVec);
1468 return Builder.CreateExtractElement(TmpVec, Builder.getInt32(0));
1473 Value *NewVal =
nullptr;
1478 for (
auto *U : OrigPhi->
users()) {
1482 assert(
SI &&
"One user of the original phi should be a select");
1484 if (
SI->getTrueValue() == OrigPhi)
1485 NewVal =
SI->getFalseValue();
1487 assert(
SI->getFalseValue() == OrigPhi &&
1488 "At least one input to the select should be the original Phi");
1489 NewVal =
SI->getTrueValue();
1494 Src->getType()->isVectorTy() ? Builder.CreateOrReduce(Src) : Src;
1498 return Builder.CreateSelect(
AnyOf, NewVal, InitVal,
"rdx.select");
1503 bool Negative =
false;
1507 case Intrinsic::vector_reduce_add:
1508 case Intrinsic::vector_reduce_mul:
1509 case Intrinsic::vector_reduce_or:
1510 case Intrinsic::vector_reduce_xor:
1511 case Intrinsic::vector_reduce_and:
1512 case Intrinsic::vector_reduce_fadd:
1513 case Intrinsic::vector_reduce_fmul: {
1516 Flags.noSignedZeros());
1518 case Intrinsic::vector_reduce_umax:
1519 case Intrinsic::vector_reduce_umin:
1520 case Intrinsic::vector_reduce_smin:
1521 case Intrinsic::vector_reduce_smax: {
1525 case Intrinsic::vector_reduce_fmax:
1526 case Intrinsic::vector_reduce_fmaximum:
1529 case Intrinsic::vector_reduce_fmin:
1530 case Intrinsic::vector_reduce_fminimum: {
1531 bool PropagatesNaN = RdxID == Intrinsic::vector_reduce_fminimum ||
1532 RdxID == Intrinsic::vector_reduce_fmaximum;
1534 return (!Flags.noNaNs() && !PropagatesNaN)
1546 "nnan, nsz is expected to be set for FP min/max reduction.");
1554 auto getIdentity = [&]() {
1556 Builder.getFastMathFlags());
1583 return Builder.CreateFAddReduce(getIdentity(), Src);
1585 return Builder.CreateFMulReduce(getIdentity(), Src);
1595 "AnyOf and FindIV reductions are not supported.");
1599 "No VPIntrinsic for this reduction");
1602 Value *
Ops[] = {Iden, Src, Mask, EVL};
1603 return Builder.CreateIntrinsic(EltTy, VPID,
Ops);
1609 "Unexpected reduction kind");
1610 assert(Src->getType()->isVectorTy() &&
"Expected a vector type");
1611 assert(!Start->getType()->isVectorTy() &&
"Expected a scalar type");
1613 return B.CreateFAddReduce(Start, Src);
1620 "Unexpected reduction kind");
1621 assert(Src->getType()->isVectorTy() &&
"Expected a vector type");
1622 assert(!Start->getType()->isVectorTy() &&
"Expected a scalar type");
1627 "No VPIntrinsic for this reduction");
1629 Value *
Ops[] = {Start, Src, Mask, EVL};
1630 return Builder.CreateIntrinsic(EltTy, VPID,
Ops);
1634 bool IncludeWrapFlags) {
1642 const unsigned Opcode = Intersection->getOpcode();
1643 VecOp->copyIRFlags(Intersection, IncludeWrapFlags);
1644 for (
auto *V : VL) {
1648 if (OpValue ==
nullptr || Opcode == Instr->getOpcode())
1649 VecOp->andIRFlags(V);
1713 while (!WorkList.
empty()) {
1716 if (!L->contains(Curr))
1722 for (
const auto *U : Curr->
users()) {
1724 if (Visited.
insert(UI).second)
1750 BasicBlock *Preheader = L->getLoopPreheader();
1760 L->getExitingBlocks(ExitingBlocks);
1762 L->getUniqueExitBlocks(ExitBlocks);
1763 if (ExitBlocks.
size() != 1 || ExitingBlocks.
size() != 1)
1769 Value *Incoming =
P->getIncomingValueForBlock(ExitingBlocks[0]);
1775 for (
const RewritePhi &Phi : RewritePhiSet) {
1776 unsigned i = Phi.Ith;
1777 if (Phi.PN ==
P && (Phi.PN)->getIncomingValue(i) == Incoming) {
1785 if (!L->hasLoopInvariantOperands(
I))
1791 for (
auto *BB : L->blocks())
1793 return I.mayHaveSideEffects();
1807 if (!L->getLoopPreheader())
1809 if (Phi->getParent() != L->getHeader())
1821 assert(L->isRecursivelyLCSSAForm(*DT, *LI) &&
1822 "Caller did not preserve LCSSA!");
1825 L->getUniqueExitBlocks(ExitBlocks);
1849 for (
unsigned i = 0; i != NumPreds; ++i) {
1862 if (!L->contains(Inst))
1879 if (!isa<PHINode>(U) && !isa<BinaryOperator>(U))
1881 BinaryOperator *B = dyn_cast<BinaryOperator>(U);
1882 if (B && B != ID.getInductionBinOp())
1894 PHINode *Phi = dyn_cast<PHINode>(U);
1895 if (Phi != PN && !checkIsIndPhi(Phi, L, SE, ID))
1900 if (
B !=
ID.getInductionBinOp())
1914 !Rewriter.isSafeToExpand(ExitValue)) {
1923 if (AddRec->getLoop() == L)
1924 ExitValue = AddRec->evaluateAtIteration(ExitCount, *SE);
1927 !Rewriter.isSafeToExpand(ExitValue))
1941 bool HighCost = Rewriter.isHighCostExpansion(
1953 &*Inst->
getParent()->getFirstInsertionPt() : Inst;
1954 RewritePhiSet.
emplace_back(PN, i, ExitValue, InsertPt, HighCost);
1965 int NumReplaced = 0;
1968 for (
const RewritePhi &Phi : RewritePhiSet) {
1975 !LoopCanBeDel && Phi.HighCost)
1978 Value *ExitVal = Rewriter.expandCodeFor(
1979 Phi.ExpansionSCEV, Phi.PN->getType(), Phi.ExpansionPoint);
1981 LLVM_DEBUG(
dbgs() <<
"rewriteLoopExitValues: AfterLoopVal = " << *ExitVal
1983 <<
" LoopVal = " << *(Phi.ExpansionPoint) <<
"\n");
1990 if (
auto *EVL = LI->
getLoopFor(ExitInsn->getParent()))
1992 assert(EVL->contains(L) &&
"LCSSA breach detected!");
2020 Rewriter.clearInsertPoint();
2027template <
typename RangeT>
2037 assert(PreOrderLoops.
empty() &&
"Must start with an empty preorder walk.");
2039 "Must start with an empty preorder walk worklist.");
2043 PreOrderWorklist.
append(L->begin(), L->end());
2045 }
while (!PreOrderWorklist.
empty());
2047 Worklist.
insert(std::move(PreOrderLoops));
2048 PreOrderLoops.
clear();
2052template <
typename RangeT>
2075 PL->addChildLoop(&New);
2112 Value *Start =
nullptr, *End =
nullptr;
2132 const SCEV *Recur = LowAR->getStepRecurrence(SE);
2133 if (Recur == HighAR->getStepRecurrence(SE) &&
2134 HighAR->getLoop() == OuterLoop && LowAR->getLoop() == OuterLoop) {
2139 const SCEV *NewHigh =
2142 LLVM_DEBUG(
dbgs() <<
"LAA: Expanded RT check for range to include "
2143 "outer loop in order to permit hoisting\n");
2153 << *Stride <<
'\n');
2160 Start = Exp.expandCodeFor(
Low, PtrArithTy,
Loc);
2161 End = Exp.expandCodeFor(
High, PtrArithTy,
Loc);
2164 Start = Builder.CreateFreeze(Start, Start->getName() +
".fr");
2165 End = Builder.CreateFreeze(End, End->getName() +
".fr");
2168 Stride ? Exp.expandCodeFor(Stride, Stride->getType(),
Loc) :
nullptr;
2170 return {Start, End, StrideVal};
2182 transform(PointerChecks, std::back_inserter(ChecksWithBounds),
2188 return std::make_pair(
First, Second);
2191 return ChecksWithBounds;
2200 auto ExpandedChecks =
2207 Value *MemoryRuntimeCheck =
nullptr;
2209 for (
const auto &[
A,
B] : ExpandedChecks) {
2213 assert((
A.Start->getType()->getPointerAddressSpace() ==
2214 B.End->getType()->getPointerAddressSpace()) &&
2215 (
B.Start->getType()->getPointerAddressSpace() ==
2216 A.End->getType()->getPointerAddressSpace()) &&
2217 "Trying to bounds check pointers with different address spaces");
2229 Value *IsConflict = ChkBuilder.
CreateAnd(Cmp0, Cmp1,
"found.conflict");
2230 if (
A.StrideToCheck) {
2232 A.StrideToCheck, ConstantInt::get(
A.StrideToCheck->getType(), 0),
2234 IsConflict = ChkBuilder.
CreateOr(IsConflict, IsNegativeStride);
2236 if (
B.StrideToCheck) {
2238 B.StrideToCheck, ConstantInt::get(
B.StrideToCheck->getType(), 0),
2240 IsConflict = ChkBuilder.
CreateOr(IsConflict, IsNegativeStride);
2242 if (MemoryRuntimeCheck) {
2244 ChkBuilder.
CreateOr(MemoryRuntimeCheck, IsConflict,
"conflict.rdx");
2246 MemoryRuntimeCheck = IsConflict;
2249 Exp.eraseDeadInstructions(MemoryRuntimeCheck);
2250 return MemoryRuntimeCheck;
2262 const SCEV *visitPtrToIntExpr(
const SCEVPtrToIntExpr *
E) {
2263 const SCEV *
Op =
visit(
E->getOperand());
2264 if (
E->getType() == DL.getAddressType(
E->getOperand()->getType()))
2265 return SE.getPtrToAddrExpr(
Op);
2266 return Op ==
E->getOperand() ?
E : SE.getPtrToIntExpr(
Op,
E->getType());
2279 Value *MemoryRuntimeCheck =
nullptr;
2281 auto &SE = *Expander.
getSE();
2287 for (
const auto &[SrcStart, SinkStart, AccessSize, NeedsFreeze] : Checks) {
2288 Type *Ty = SinkStart->getType();
2290 auto *VFTimesICTimesSize =
2291 ChkBuilder.
CreateMul(GetVF(ChkBuilder, Ty->getScalarSizeInBits()),
2292 ConstantInt::get(Ty, IC * AccessSize));
2293 const SCEV *SinkStartRewritten = Rewriter.visit(SinkStart);
2294 const SCEV *SrcStartRewritten = Rewriter.visit(SrcStart);
2296 SE.getMinusSCEV(SinkStartRewritten, SrcStartRewritten), Ty,
Loc);
2300 Value *IsConflict = SeenCompares.
lookup({Diff, VFTimesICTimesSize});
2305 ChkBuilder.
CreateICmpULT(Diff, VFTimesICTimesSize,
"diff.check");
2306 SeenCompares.
insert({{Diff, VFTimesICTimesSize}, IsConflict});
2310 if (MemoryRuntimeCheck) {
2312 ChkBuilder.
CreateOr(MemoryRuntimeCheck, IsConflict,
"conflict.rdx");
2314 MemoryRuntimeCheck = IsConflict;
2318 return MemoryRuntimeCheck;
2321std::optional<IVConditionInfo>
2340 WorkList.
append(CondI->op_begin(), CondI->op_end());
2344 while (!WorkList.
empty()) {
2346 if (!
I || !L.contains(
I))
2355 if (LI->isVolatile() || LI->isAtomic())
2362 AccessesToCheck.
push_back(MemUse->getDefiningAccess());
2370 WorkList.
append(
I->op_begin(),
I->op_end());
2373 if (InstToDuplicate.
empty())
2377 L.getExitingBlocks(ExitingBlocks);
2378 auto HasNoClobbersOnPath =
2379 [&L, &
AA, &AccessedLocs, &ExitingBlocks, &InstToDuplicate,
2382 -> std::optional<IVConditionInfo> {
2394 while (!WorkList.
empty()) {
2396 if (!L.contains(Current))
2398 const auto &SeenIns = Seen.
insert(Current);
2399 if (!SeenIns.second)
2402 Info.PathIsNoop &=
all_of(
2403 *Current, [](
Instruction &
I) {
return !
I.mayHaveSideEffects(); });
2409 if (Seen.
size() < 2)
2417 while (!AccessesToCheck.
empty()) {
2419 auto SeenI = SeenAccesses.
insert(Current);
2436 AA.getModRefInfo(CurrentDef->getMemoryInst(),
Loc));
2441 for (
Use &U : Current->
uses())
2452 if (Info.PathIsNoop) {
2453 for (
auto *Exiting : ExitingBlocks) {
2457 if (L.contains(Succ))
2460 Info.PathIsNoop &= Succ->phis().empty() &&
2461 (!Info.ExitForPath || Info.ExitForPath == Succ);
2462 if (!Info.PathIsNoop)
2464 assert((!Info.ExitForPath || Info.ExitForPath == Succ) &&
2465 "cannot have multiple exit blocks");
2466 Info.ExitForPath = Succ;
2470 if (!Info.ExitForPath)
2471 Info.PathIsNoop =
false;
2473 Info.InstToDuplicate = std::move(InstToDuplicate);
2479 if (TI->getSuccessor(0) == TI->getSuccessor(1))
2482 if (
auto Info = HasNoClobbersOnPath(TI->getSuccessor(0), L.getHeader(),
2487 if (
auto Info = HasNoClobbersOnPath(TI->getSuccessor(1), L.getHeader(),
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
AMDGPU Register Bank Select
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
This is the interface for LLVM's primary stateless and local alias analysis.
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
#define LLVM_EXPORT_TEMPLATE
This file defines the DenseSet and SmallDenseSet classes.
This is the interface for a simple mod/ref and alias analysis over globals.
ManagedStatic< HTTPClientCleanup > Cleanup
Module.h This file contains the declarations for the Module class.
iv Induction Variable Users
static cl::opt< ReplaceExitVal > ReplaceExitValue("replexitval", cl::Hidden, cl::init(OnlyCheapRepl), cl::desc("Choose the strategy to replace exit value in IndVarSimplify"), cl::values(clEnumValN(NeverRepl, "never", "never replace exit value"), clEnumValN(OnlyCheapRepl, "cheap", "only replace exit value when the cost is cheap"), clEnumValN(UnusedIndVarInLoop, "unusedindvarinloop", "only replace exit value when it is an unused " "induction variable in the loop and has cheap replacement cost"), clEnumValN(NoHardUse, "noharduse", "only replace exit values when loop def likely dead"), clEnumValN(AlwaysRepl, "always", "always replace exit value whenever possible")))
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
static cl::opt< bool, true > HoistRuntimeChecks("hoist-runtime-checks", cl::Hidden, cl::desc("Hoist inner loop runtime memory checks to outer loop if possible"), cl::location(VectorizerParams::HoistRuntimeChecks), cl::init(true))
static bool hasHardUserWithinLoop(const Loop *L, const Instruction *I)
static CondBrInst * getExpectedExitLoopLatchBranch(Loop *L)
Checks if L has an exiting latch branch.
static const char * LLVMLoopDisableLICM
static PointerBounds expandBounds(const RuntimeCheckingPtrGroup *CG, Loop *TheLoop, Instruction *Loc, SCEVExpander &Exp, bool HoistRuntimeChecks)
Expand code for the lower and upper bound of the pointer group CG in TheLoop.
static bool canLoopBeDeleted(Loop *L, SmallVector< RewritePhi, 8 > &RewritePhiSet)
static const char * LLVMLoopDisableNonforced
static MDNode * createStringMetadata(Loop *TheLoop, StringRef Name, unsigned V)
Create MDNode for input string.
static std::optional< unsigned > estimateLoopTripCount(Loop *L)
static bool checkIsIndPhi(PHINode *Phi, Loop *L, ScalarEvolution *SE, InductionDescriptor &ID)
Checks if it is safe to call InductionDescriptor::isInductionPHI for Phi, and returns true if this Ph...
This file exposes an interface to building/using memory SSA to walk memory instructions using a use/d...
#define INITIALIZE_PASS_DEPENDENCY(depName)
This file provides a priority worklist.
This file contains the declarations for profiling metadata utility functions.
const SmallVectorImpl< MachineOperand > & Cond
static void visit(BasicBlock &Start, std::function< bool(BasicBlock *)> op)
This is the interface for a SCEV-based alias analysis.
This file defines the make_scope_exit function, which executes user-defined cleanup logic at scope ex...
This file implements a set that has insertion order iteration characteristics.
This file defines the SmallPtrSet class.
This file defines the SmallVector class.
Virtual Register Rewriter
static const uint32_t IV[8]
A wrapper pass to provide the legacy pass manager access to a suitably prepared AAResults object.
static APFloat getLargest(const fltSemantics &Sem, bool Negative=false)
Returns the largest finite number in the given semantics.
Class for arbitrary precision integers.
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
static APInt getMinValue(unsigned numBits)
Gets minimum unsigned value of APInt for a specific bit width.
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Represent the analysis usage information of a pass.
LLVM_ABI AnalysisUsage & addRequiredID(const void *ID)
AnalysisUsage & addPreservedID(const void *ID)
AnalysisUsage & addRequired()
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Legacy wrapper pass to provide the BasicAAResult object.
LLVM Basic Block Representation.
iterator begin()
Instruction iterator methods.
static BasicBlock * Create(LLVMContext &Context, const Twine &Name="", Function *Parent=nullptr, BasicBlock *InsertBefore=nullptr)
Creates a new BasicBlock.
InstListType::iterator iterator
Instruction iterators...
LLVM_ABI LLVMContext & getContext() const
Get the context in which this basic block lives.
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction; assumes that the block is well-formed.
static LLVM_ABI BranchProbability getBranchProbability(uint64_t Numerator, uint64_t Denominator)
static BranchProbability getUnknown()
uint32_t getNumerator() const
static BranchProbability getZero()
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
@ ICMP_SLT
signed less than
@ ICMP_SLE
signed less or equal
@ FCMP_OLT
0 1 0 0 True if ordered and less than
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
@ ICMP_UGT
unsigned greater than
@ ICMP_SGT
signed greater than
@ ICMP_ULT
unsigned less than
@ ICMP_SGE
signed greater or equal
Conditional Branch instruction.
BasicBlock * getSuccessor(unsigned i) const
static LLVM_ABI Constant * getIntrinsicIdentity(Intrinsic::ID, Type *Ty)
static LLVM_ABI Constant * getBinOpIdentity(unsigned Opcode, Type *Ty, bool AllowRHSConstant=false, bool NSZ=false)
Return the identity constant for a binary opcode.
static LLVM_ABI ConstantFP * getQNaN(Type *Ty, bool Negative=false, APInt *Payload=nullptr)
static LLVM_ABI ConstantFP * getInfinity(Type *Ty, bool Negative=false)
This is the shared class of boolean and integer constants.
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
int64_t getSExtValue() const
Return the constant as a 64-bit integer value after it has been sign extended as appropriate for the ...
A parsed version of the target data layout string in and methods for querying it.
Record of a variable value-assignment, aka a non instruction representation of the dbg....
Identifies a unique instance of a variable.
ValueT lookup(const_arg_type_t< KeyT > Val) const
Return the entry for the specified key, or a default constructed value if no such entry exists.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
iterator_range< iterator > children()
void applyUpdates(ArrayRef< UpdateType > Updates)
Inform the dominator tree about a sequence of CFG edge insertions and deletions and perform a batch u...
static constexpr UpdateKind Delete
static constexpr UpdateKind Insert
DomTreeNodeBase< NodeT > * getNode(const NodeT *BB) const
getNode - return the (Post)DominatorTree node for the specified basic block.
Legacy analysis pass which computes a DominatorTree.
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
LLVM_ABI bool isReachableFromEntry(const Use &U) const
Provide an overload for a Use.
static constexpr ElementCount get(ScalarTy MinVal, bool Scalable)
Convenience struct for specifying and reasoning about fast-math flags.
bool noSignedZeros() const
void applyUpdates(ArrayRef< UpdateT > Updates)
Submit updates to all available trees.
Legacy wrapper pass to provide the GlobalsAAResult object.
Common base class shared among various IRBuilders.
Value * CreateICmpULT(Value *LHS, Value *RHS, const Twine &Name="")
Value * CreateFreeze(Value *V, const Twine &Name="")
Value * CreateAnd(Value *LHS, Value *RHS, const Twine &Name="")
Value * CreateICmpSLT(Value *LHS, Value *RHS, const Twine &Name="")
void SetInsertPoint(BasicBlock *TheBB)
This specifies that created instructions should be appended to the end of the specified block.
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="", bool IsDisjoint=false)
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
A struct for saving information about induction variables.
static LLVM_ABI bool isInductionPHI(PHINode *Phi, const Loop *L, ScalarEvolution *SE, InductionDescriptor &D, ArrayRef< const SCEVPredicate * > NoWrapPreds={}, const SCEV *Expr=nullptr, SmallVectorImpl< Instruction * > *CastsToIgnore=nullptr)
Returns true if Phi is an induction in the loop L.
InstSimplifyFolder - Use InstructionSimplify to fold operations to existing values.
LLVM_ABI unsigned getNumSuccessors() const LLVM_READONLY
Return the number of successors that this instruction has.
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
LLVM_ABI BasicBlock * getSuccessor(unsigned Idx) const LLVM_READONLY
Return the specified successor. This instruction must be a terminator.
LLVM_ABI bool mayHaveSideEffects() const LLVM_READONLY
Return true if the instruction may have side effects.
This is an important class for using LLVM in a threaded context.
bool contains(const LoopT *L) const
Return true if the specified loop is contained within in this loop.
typename std::vector< Loop * >::const_iterator iterator
BlockT * getLoopLatch() const
If there is a single latch block for this loop, return it.
BlockT * getHeader() const
void addBasicBlockToLoop(BlockT *NewBB, LoopInfoBase< BlockT, LoopT > &LI)
This method is used by other analyses to update loop information.
void addChildLoop(LoopT *NewChild)
Add the specified loop to be a child of this loop.
LoopT * getParentLoop() const
Return the parent loop if it exists or nullptr for top level loops.
void addTopLevelLoop(LoopT *New)
This adds the specified loop to the collection of top-level loops.
void removeBlock(BlockT *BB)
This method completely removes BB from all data structures, including all of the Loop objects it is n...
LoopT * AllocateLoop(ArgsTy &&...Args)
LoopT * removeLoop(iterator I)
This removes the specified top-level loop from this loop info object.
LoopT * getLoopFor(const BlockT *BB) const
Return the inner most loop that BB lives in.
void destroy(LoopT *L)
Destroy a loop that has been removed from the LoopInfo nest.
The legacy pass manager's analysis pass to compute loop information.
bool replacementPreservesLCSSAForm(Instruction *From, Value *To)
Returns true if replacing From with To everywhere is guaranteed to preserve LCSSA form.
LLVM_ABI void erase(Loop *L)
Update LoopInfo after removing the last backedge from a loop.
Represents a single loop in the control flow graph.
void setLoopID(MDNode *LoopID) const
Set the llvm.loop loop id metadata for this loop.
MDNode * getLoopID() const
Return the llvm.loop loop id metadata node for this loop if it is present.
LLVM_ABI void replaceOperandWith(unsigned I, Metadata *New)
Replace a specific operand.
const MDOperand & getOperand(unsigned I) const
ArrayRef< MDOperand > operands() const
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
unsigned getNumOperands() const
Return number of MDNode operands.
LLVMContext & getContext() const
Tracking metadata reference owned by Metadata.
LLVM_ABI StringRef getString() const
static LLVM_ABI MDString * get(LLVMContext &Context, StringRef Str)
BasicBlock * getBlock() const
Representation for a specific memory location.
static LLVM_ABI MemoryLocation get(const LoadInst *LI)
Return a location with information about the memory reference by the given instruction.
Legacy analysis pass which computes MemorySSA.
Encapsulates MemorySSA, including all data associated with memory accesses.
LLVM_ABI void verifyMemorySSA(VerificationLevel=VerificationLevel::Fast) const
Verify that MemorySSA is self consistent (IE definitions dominate all uses, uses appear in the right ...
MemoryUseOrDef * getMemoryAccess(const Instruction *I) const
Given a memory Mod/Ref'ing instruction, get the MemorySSA access associated with it.
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
void setIncomingValue(unsigned i, Value *V)
BasicBlock * getIncomingBlock(unsigned i) const
Return incoming basic block number i.
Value * getIncomingValue(unsigned i) const
Return incoming value number x.
int getBasicBlockIndex(const BasicBlock *BB) const
Return the first index of the specified basic block in the value list for this PHI.
unsigned getNumIncomingValues() const
Return the number of incoming edges.
PassRegistry - This class manages the registration and intitialization of the pass subsystem as appli...
static LLVM_ABI PointerType * get(Type *ElementType, unsigned AddressSpace)
This constructs a pointer to an object of the specified type in a numbered address space.
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
bool insert(const T &X)
Insert a new element into the PriorityWorklist.
static bool isAnyOfRecurrenceKind(RecurKind Kind)
Returns true if the recurrence kind is of the form select(cmp(),x,y) where one of (x,...
static bool isFindRecurrenceKind(RecurKind Kind)
static bool isMinMaxRecurrenceKind(RecurKind Kind)
Returns true if the recurrence kind is any min/max kind.
A global registry used in conjunction with static constructors to make pluggable components (like tar...
Legacy wrapper pass to provide the SCEVAAResult object.
This class uses information about analyze scalars to rewrite expressions in canonical form.
ScalarEvolution * getSE()
LLVM_ABI Value * expandCodeFor(SCEVUse SH, Type *Ty, BasicBlock::iterator I)
Insert code to directly compute the specified SCEV expression into the program.
LLVM_ABI void eraseDeadInstructions(Value *Root)
Remove inserted instructions that are dead, e.g.
This visitor recursively visits a SCEV expression and re-writes it.
This class represents an analyzed expression in the program.
LLVM_ABI Type * getType() const
Return the LLVM type of this SCEV expression.
The main scalar evolution driver.
LLVM_ABI bool isKnownNonNegative(const SCEV *S)
Test if the given expression is known to be non-negative.
LLVM_ABI bool isLoopEntryGuardedByCond(const Loop *L, CmpPredicate Pred, const SCEV *LHS, const SCEV *RHS)
Test whether entry to the loop is protected by a conditional between LHS and RHS.
LLVM_ABI const SCEV * getSCEVAtScope(const SCEV *S, const Loop *L)
Return a SCEV expression for the specified value at the specified scope in the program.
const SCEV * getZero(Type *Ty)
Return a SCEV for the constant 0 of a specific type.
LLVM_ABI const SCEV * getConstant(ConstantInt *V)
LLVM_ABI const SCEV * getSCEV(Value *V)
Return a SCEV expression for the full generality of the specified expression.
LLVM_ABI void forgetLoop(const Loop *L)
This method should be called by the client when it has changed a loop in a way that may effect Scalar...
LLVM_ABI bool isLoopInvariant(const SCEV *S, const Loop *L)
Return true if the value of the given SCEV is unchanging in the specified loop.
LLVM_ABI LoopDisposition getLoopDisposition(const SCEV *S, const Loop *L)
Return the "disposition" of the given SCEV with respect to the given loop.
LLVM_ABI bool isSCEVable(Type *Ty) const
Test if values of the given type are analyzable within the SCEV framework.
LLVM_ABI void forgetValue(Value *V)
This method should be called by the client when it has changed a value in a way that may effect its v...
LLVM_ABI void forgetBlockAndLoopDispositions(Value *V=nullptr)
Called when the client has changed the disposition of values in a loop or block.
LoopDisposition
An enum describing the relationship between a SCEV and a loop.
@ LoopInvariant
The SCEV is loop-invariant.
LLVM_ABI bool isAvailableAtLoopEntry(const SCEV *S, const Loop *L)
Determine if the SCEV can be evaluated at loop's entry.
LLVM_ABI const SCEV * getExitCount(const Loop *L, const BasicBlock *ExitingBlock, ExitCountKind Kind=Exact)
Return the number of times the backedge executes before the given exit would be taken; if not exactly...
LLVM_ABI const SCEV * applyLoopGuards(const SCEV *Expr, const Loop *L)
Try to apply information from loop guards for L to Expr.
This class represents the LLVM 'select' instruction.
Implements a dense probed hash-table based set with some number of buckets stored inline.
A version of PriorityWorklist that selects small size optimized data structures for the vector and ma...
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
bool contains(ConstPtrType Ptr) const
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
A SetVector that performs no allocations if smaller than a certain size.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
reference emplace_back(ArgTypes &&... Args)
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Represent a constant reference to a string, i.e.
bool starts_with(StringRef Prefix) const
Check if this string starts with the given Prefix.
Provides information about what library functions are available for the current target.
Value handle that tracks a Value across RAUW.
The instances of the Type class are immutable: once they are created, they are never changed.
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
bool isIntegerTy() const
True if this is an instance of IntegerType.
A Use represents the edge between a Value definition and its users.
static LLVM_ABI Intrinsic::ID getForIntrinsic(Intrinsic::ID Id)
The llvm.vp.
static LLVM_ABI bool isVPReduction(Intrinsic::ID ID)
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
iterator_range< user_iterator > users()
iterator_range< use_iterator > uses()
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
std::pair< iterator, bool > insert(const ValueT &V)
An efficient, type-erasing, non-owning reference to a callable.
const ParentTy * getParent() const
This class implements an extremely fast bulk output stream that can only output to a stream.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Abstract Attribute helper functions.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
std::enable_if_t< detail::IsValidPointer< X, Y >::value, X * > extract_or_null(Y &&MD)
Extract a Value from Metadata, allowing null.
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
LLVM_ABI Value * createSimpleReduction(IRBuilderBase &B, Value *Src, RecurKind RdxKind)
Create a reduction of the given vector.
LLVM_ABI std::optional< ElementCount > getOptionalElementCountLoopAttribute(const Loop *TheLoop)
Find a combination of metadata ("llvm.loop.vectorize.width" and "llvm.loop.vectorize....
LLVM_ABI BranchProbability getBranchProbability(CondBrInst *B, bool ForFirstTarget)
Based on branch weight metadata, return either:
@ Low
Lower the current thread's priority such that it does not affect foreground tasks significantly.
LLVM_ABI Value * addRuntimeChecks(Instruction *Loc, Loop *TheLoop, const SmallVectorImpl< RuntimePointerCheck > &PointerChecks, SCEVExpander &Expander, bool HoistRuntimeChecks=false)
Add code that checks at runtime if the accessed arrays in PointerChecks overlap.
auto find(R &&Range, const T &Val)
Provide wrappers to std::find which take ranges instead of having to pass begin/end explicitly.
void fill(R &&Range, T &&Value)
Provide wrappers to std::fill which take ranges instead of having to pass begin/end explicitly.
cl::opt< bool > ProfcheckDisableMetadataFixes
LLVM_ABI std::optional< unsigned > getLoopEstimatedTripCount(Loop *L, unsigned *EstimatedLoopInvocationWeight=nullptr)
Return either:
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI Intrinsic::ID getMinMaxReductionIntrinsicOp(Intrinsic::ID RdxID)
Returns the min/max intrinsic used when expanding a min/max reduction.
LLVM_ABI bool getBooleanLoopAttribute(const Loop *TheLoop, StringRef Name)
Returns true if Name is applied to TheLoop and enabled.
LLVM_ABI bool isKnownNonPositiveInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE)
Returns true if we can prove that S is defined and always non-positive in loop L.
LLVM_ABI std::optional< bool > getOptionalBoolLoopAttribute(const Loop *TheLoop, StringRef Name)
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
LLVM_ABI void setExplicitlyUnknownBranchWeightsIfProfiled(Instruction &I, StringRef PassName, const Function *F=nullptr)
Like setExplicitlyUnknownBranchWeights(...), but only sets unknown branch weights in the new instruct...
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
void appendReversedLoopsToWorklist(RangeT &&, SmallPriorityWorklist< Loop *, 4 > &)
Utility that implements appending of loops onto a worklist given a range.
auto successors(const MachineBasicBlock *BB)
LLVM_ABI void initializeLoopPassPass(PassRegistry &)
Manually defined generic "LoopPass" dependency initialization.
constexpr from_range_t from_range
LLVM_ABI bool formLCSSARecursively(Loop &L, const DominatorTree &DT, const LoopInfo *LI, ScalarEvolution *SE)
Put a loop nest into LCSSA form.
LLVM_ABI Value * getReductionIdentity(Intrinsic::ID RdxID, Type *Ty, FastMathFlags FMF)
Given information about an @llvm.vector.reduce.
LLVM_ABI std::optional< MDNode * > makeFollowupLoopID(MDNode *OrigLoopID, ArrayRef< StringRef > FollowupAttrs, const char *InheritOptionsAttrsPrefix="", bool AlwaysNew=false)
Create a new loop identifier for a loop created from a loop transformation.
LLVM_ABI unsigned getArithmeticReductionInstruction(Intrinsic::ID RdxID)
Returns the arithmetic instruction opcode used when expanding a reduction.
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
std::pair< const RuntimeCheckingPtrGroup *, const RuntimeCheckingPtrGroup * > RuntimePointerCheck
A memcheck which made up of a pair of grouped pointers.
LLVM_ABI char & LoopSimplifyID
LLVM_ABI Value * createMinMaxOp(IRBuilderBase &Builder, RecurKind RK, Value *Left, Value *Right)
Returns a Min/Max operation corresponding to MinMaxRecurrenceKind.
LLVM_ABI SmallVector< BasicBlock *, 16 > collectChildrenInLoop(DominatorTree *DT, DomTreeNode *N, const Loop *CurLoop)
Does a BFS from a given node to all of its children inside a given loop.
LLVM_ABI void addStringMetadataToLoop(Loop *TheLoop, const char *MDString, unsigned V=0)
Set input string into loop metadata by keeping other values intact.
LLVM_ABI bool cannotBeMaxInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE, bool Signed)
Returns true if S is defined and never is equal to signed/unsigned max.
LLVM_ABI void setBranchWeights(Instruction &I, ArrayRef< uint32_t > Weights, bool IsExpected, bool ElideAllZero=false)
Create a new branch_weights metadata node and add or overwrite a prof metadata reference to instructi...
DomTreeNodeBase< BasicBlock > DomTreeNode
constexpr T divideNearest(U Numerator, V Denominator)
Returns (Numerator / Denominator) rounded by round-half-up.
LLVM_ABI TransformationMode hasVectorizeTransformation(const Loop *L)
auto dyn_cast_or_null(const Y &Val)
OutputIt transform(R &&Range, OutputIt d_first, UnaryFunction F)
Wrapper function around std::transform to apply a function to a range and store the result elsewhere.
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI bool isInstructionTriviallyDead(Instruction *I, const TargetLibraryInfo *TLI=nullptr)
Return true if the result produced by the instruction is not used, and the instruction will return.
LLVM_ABI SmallVector< Instruction *, 8 > findDefsUsedOutsideOfLoop(Loop *L)
Returns the instructions that use values defined in the loop.
auto reverse(ContainerTy &&C)
LLVM_ABI constexpr Intrinsic::ID getReductionIntrinsicID(RecurKind RK)
Returns the llvm.vector.reduce intrinsic that corresponds to the recurrence kind.
LLVM_ABI bool isMustProgress(const Loop *L)
Return true if this loop can be assumed to make progress.
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
LLVM_ABI void setBranchProbability(CondBrInst *B, BranchProbability P, bool ForFirstTarget)
Set branch weight metadata for B to indicate that P and 1 - P are the probabilities of control flowin...
bool isModSet(const ModRefInfo MRI)
LLVM_ABI TransformationMode hasUnrollAndJamTransformation(const Loop *L)
LLVM_ABI void deleteDeadLoop(Loop *L, DominatorTree *DT, ScalarEvolution *SE, LoopInfo *LI, MemorySSA *MSSA=nullptr)
This function deletes dead loops.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
LLVM_ABI bool hasDisableAllTransformsHint(const Loop *L)
Look for the loop attribute that disables all transformation heuristic.
LLVM_TEMPLATE_ABI void appendLoopsToWorklist(RangeT &&, SmallPriorityWorklist< Loop *, 4 > &)
Utility that implements appending of loops onto a worklist given a range.
LLVM_ABI cl::opt< unsigned > SCEVCheapExpansionBudget
FunctionAddr VTableAddr Count
LLVM_ABI Value * getShuffleReduction(IRBuilderBase &Builder, Value *Src, unsigned Op, TargetTransformInfo::ReductionShuffle RS, RecurKind MinMaxKind=RecurKind::None)
Generates a vector reduction using shufflevectors to reduce the value.
LLVM_ABI TransformationMode hasUnrollTransformation(const Loop *L)
LLVM_ABI BranchProbability getLoopProbability(Loop *L)
Based on branch weight metadata, return either:
LLVM_ABI TransformationMode hasDistributeTransformation(const Loop *L)
LLVM_ABI void breakLoopBackedge(Loop *L, DominatorTree &DT, ScalarEvolution &SE, LoopInfo &LI, MemorySSA *MSSA)
Remove the backedge of the specified loop.
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
LLVM_ABI void getLoopAnalysisUsage(AnalysisUsage &AU)
Helper to consistently add the set of standard passes to a loop pass's AnalysisUsage.
LLVM_ABI void propagateIRFlags(Value *I, ArrayRef< Value * > VL, Value *OpValue=nullptr, bool IncludeWrapFlags=true)
Get the intersection (logical and) of all of the potential IR flags of each scalar operation (VL) tha...
LLVM_ABI bool isKnownPositiveInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE)
Returns true if we can prove that S is defined and always positive in loop L.
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
LLVM_ABI unsigned changeToUnreachable(Instruction *I, bool PreserveLCSSA=false, DomTreeUpdater *DTU=nullptr, MemorySSAUpdater *MSSAU=nullptr)
Insert an unreachable instruction before the specified instruction, making it and the rest of the cod...
RNSuccIterator< NodeRef, BlockT, RegionT > succ_begin(NodeRef Node)
LLVM_ABI std::optional< int > getOptionalIntLoopAttribute(const Loop *TheLoop, StringRef Name)
Find named metadata for a loop with an integer value.
LLVM_ABI bool setLoopProbability(Loop *L, BranchProbability P)
Set branch weight metadata for the latch of L to indicate that, at the end of any iteration,...
LLVM_ABI BasicBlock * SplitBlockPredecessors(BasicBlock *BB, ArrayRef< BasicBlock * > Preds, const char *Suffix, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, bool PreserveLCSSA=false)
This method introduces at least one new basic block into the function and moves some of the predecess...
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
LLVM_ABI CmpInst::Predicate getMinMaxReductionPredicate(RecurKind RK)
Returns the comparison predicate used when expanding a min/max reduction.
LLVM_ABI TransformationMode hasLICMVersioningTransformation(const Loop *L)
LLVM_ABI bool VerifyMemorySSA
Enables verification of MemorySSA.
TransformationMode
The mode sets how eager a transformation should be applied.
@ TM_Unspecified
The pass can use heuristics to determine whether a transformation should be applied.
@ TM_SuppressedByUser
The transformation must not be applied.
@ TM_ForcedByUser
The transformation was directed by the user, e.g.
@ TM_Disable
The transformation should not be applied.
@ TM_Enable
The transformation should be applied without considering a cost model.
RNSuccIterator< NodeRef, BlockT, RegionT > succ_end(NodeRef Node)
LLVM_ABI bool hasDisableLICMTransformsHint(const Loop *L)
Look for the loop attribute that disables the LICM transformation heuristics.
template LLVM_TEMPLATE_ABI void appendLoopsToWorklist< Loop & >(Loop &L, SmallPriorityWorklist< Loop *, 4 > &Worklist)
LLVM_ABI Intrinsic::ID getReductionForBinop(Instruction::BinaryOps Opc)
Returns the reduction intrinsic id corresponding to the binary operation.
RecurKind
These are the kinds of recurrences that we support.
@ UMin
Unsigned integer min implemented in terms of select(cmp()).
@ FMinimumNum
FP min with llvm.minimumnum semantics.
@ Or
Bitwise or logical OR of integers.
@ FMinimum
FP min with llvm.minimum semantics.
@ FMaxNum
FP max with llvm.maxnum semantics including NaNs.
@ Mul
Product of integers.
@ FSub
Subtraction of floats.
@ FAddChainWithSubs
A chain of fadds and fsubs.
@ AnyOf
AnyOf reduction with select(cmp(),x,y) where one of (x,y) is loop invariant, and both x and y are int...
@ Xor
Bitwise or logical XOR of integers.
@ FMax
FP max implemented in terms of select(cmp()).
@ FMaximum
FP max with llvm.maximum semantics.
@ FMulAdd
Sum of float products with llvm.fmuladd(a * b + sum).
@ SMax
Signed integer max implemented in terms of select(cmp()).
@ And
Bitwise or logical AND of integers.
@ SMin
Signed integer min implemented in terms of select(cmp()).
@ FMin
FP min implemented in terms of select(cmp()).
@ FMinNum
FP min with llvm.minnum semantics including NaNs.
@ Sub
Subtraction of integers.
@ AddChainWithSubs
A chain of adds and subs.
@ FMaximumNum
FP max with llvm.maximumnum semantics.
@ UMax
Unsigned integer max implemented in terms of select(cmp()).
LLVM_ABI Value * getRecurrenceIdentity(RecurKind K, Type *Tp, FastMathFlags FMF)
Given information about an recurrence kind, return the identity for the @llvm.vector....
LLVM_ABI BasicBlock * SplitBlock(BasicBlock *Old, BasicBlock::iterator SplitPt, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, const Twine &BBName="")
Split the specified block at the specified instruction.
LLVM_ABI bool formDedicatedExitBlocks(Loop *L, DominatorTree *DT, LoopInfo *LI, MemorySSAUpdater *MSSAU, bool PreserveLCSSA)
Ensure that all exit blocks of the loop are dedicated exits.
DWARFExpression::Operation Op
raw_ostream & operator<<(raw_ostream &OS, const APFixedPoint &FX)
LLVM_ABI bool isKnownNegativeInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE)
Returns true if we can prove that S is defined and always negative in loop L.
LLVM_ABI StringRef getLoopVectorizeKindPrefix(const Loop *L)
Return a short prefix describing the loop's vectorizer origin based on the llvm.loop....
constexpr unsigned BitWidth
ValueMap< const Value *, WeakTrackingVH > ValueToValueMapTy
LLVM_ABI Value * expandReductionViaLoop(IRBuilderBase &Builder, Value *Vec, unsigned RdxOpcode, Value *Acc, DominatorTree *DT=nullptr, LoopInfo *LI=nullptr)
Expand a scalable vector reduction into a runtime loop that applies RdxOpcode element by element,...
LLVM_ABI bool setLoopEstimatedTripCount(Loop *L, unsigned EstimatedTripCount, std::optional< unsigned > EstimatedLoopInvocationWeight=std::nullopt)
Set llvm.loop.estimated_trip_count with the value EstimatedTripCount in the loop metadata of L.
LLVM_ABI bool extractBranchWeights(const MDNode *ProfileData, SmallVectorImpl< uint32_t > &Weights)
Extract branch weights from MD_prof metadata.
LLVM_ABI const char * LLVMLoopEstimatedTripCount
Profile-based loop metadata that should be accessed only by using llvm::getLoopEstimatedTripCount and...
LLVM_ABI bool hasIterationCountInvariantInParent(Loop *L, ScalarEvolution &SE)
Check inner loop (L) backedge count is known to be invariant on all iterations of its outer loop.
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
static cl::opt< unsigned > MSSAThreshold("simple-loop-unswitch-memoryssa-threshold", cl::desc("Max number of memory uses to explore during " "partial unswitching analysis"), cl::init(100), cl::Hidden)
LLVM_ABI bool isAlmostDeadIV(PHINode *IV, BasicBlock *LatchBlock, Value *Cond)
Return true if the induction variable IV in a Loop whose latch is LatchBlock would become dead if the...
auto predecessors(const MachineBasicBlock *BB)
LLVM_ABI int rewriteLoopExitValues(Loop *L, LoopInfo *LI, TargetLibraryInfo *TLI, ScalarEvolution *SE, const TargetTransformInfo *TTI, SCEVExpander &Rewriter, DominatorTree *DT, ReplaceExitVal ReplaceExitValue, SmallVector< WeakTrackingVH, 16 > &DeadInsts)
If the final value of any expressions that are recurrent in the loop can be computed,...
LLVM_ABI Value * createOrderedReduction(IRBuilderBase &B, RecurKind RdxKind, Value *Src, Value *Start)
Create an ordered reduction intrinsic using the given recurrence kind RdxKind.
LLVM_ABI Value * addDiffRuntimeChecks(Instruction *Loc, ArrayRef< PointerDiffInfo > Checks, SCEVExpander &Expander, function_ref< Value *(IRBuilderBase &, unsigned)> GetVF, unsigned IC)
LLVM_ABI RecurKind getMinMaxReductionRecurKind(Intrinsic::ID RdxID)
Returns the recurence kind used when expanding a min/max reduction.
LLVM_ABI BasicBlock * SplitEdge(BasicBlock *From, BasicBlock *To, DominatorTree *DT=nullptr, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, const Twine &BBName="")
Split the edge connecting the specified blocks, and return the newly created basic block between From...
LLVM_ABI std::optional< IVConditionInfo > hasPartialIVCondition(const Loop &L, unsigned MSSAThreshold, const MemorySSA &MSSA, AAResults &AA)
Check if the loop header has a conditional branch that is not loop-invariant, because it involves loa...
static auto filterDbgVars(iterator_range< simple_ilist< DbgRecord >::iterator > R)
Filter the DbgRecord range to DbgVariableRecord types only and downcast.
LLVM_ABI Value * createAnyOfReduction(IRBuilderBase &B, Value *Src, Value *InitVal, PHINode *OrigPhi)
Create a reduction of the given vector Src for a reduction of kind RecurKind::AnyOf.
LLVM_ABI bool cannotBeMinInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE, bool Signed)
Returns true if S is defined and never is equal to signed/unsigned min.
LLVM_ABI bool isKnownNonNegativeInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE)
Returns true if we can prove that S is defined and always non-negative in loop L.
LLVM_ABI Value * getOrderedReduction(IRBuilderBase &Builder, Value *Acc, Value *Src, unsigned Op, RecurKind MinMaxKind=RecurKind::None)
Generates an ordered vector reduction using extracts to reduce the value.
LLVM_ABI MDNode * findOptionMDForLoopID(MDNode *LoopID, StringRef Name)
Find and return the loop attribute node for the attribute Name in LoopID.
LLVM_ABI Intrinsic::ID getMinMaxReductionIntrinsicID(Intrinsic::ID IID)
Returns the llvm.vector.reduce min/max intrinsic that corresponds to the intrinsic op.
LLVM_ABI Loop * cloneLoop(Loop *L, Loop *PL, ValueToValueMapTy &VM, LoopInfo *LI, LPPassManager *LPM)
Recursively clone the specified loop and all of its children, mapping the blocks with the specified m...
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
IR Values for the lower and upper bounds of a pointer evolution.
TrackingVH< Value > Start
RewritePhi(PHINode *P, unsigned I, const SCEV *Val, Instruction *ExpansionPt, bool H)
const SCEV * ExpansionSCEV
Instruction * ExpansionPoint
Struct to hold information about a partially invariant condition.
unsigned AddressSpace
Address space of the involved pointers.
bool NeedsFreeze
Whether the pointer needs to be frozen after expansion, e.g.
const SCEV * High
The SCEV expression which represents the upper bound of all the pointers in this group.
const SCEV * Low
The SCEV expression which represents the lower bound of all the pointers in this group.