78using namespace jumpthreading;
80#define DEBUG_TYPE "jump-threading"
84STATISTIC(NumDupes,
"Number of branch blocks duplicated to eliminate phi");
88 cl::desc(
"Max block size to duplicate for jump threading"),
93 "jump-threading-implication-search-threshold",
94 cl::desc(
"The number of predecessors to search for a stronger "
95 "condition to use to thread over a weaker condition"),
99 "jump-threading-phi-threshold",
104 "jump-threading-across-loop-headers",
105 cl::desc(
"Allow JumpThreading to thread across loop headers, for testing"),
156 if (TrueWeight + FalseWeight == 0)
164 auto GetPredOutEdge =
166 BasicBlock *PhiBB) -> std::pair<BasicBlock *, BasicBlock *> {
167 auto *PredBB = IncomingBB;
168 auto *SuccBB = PhiBB;
171 BranchInst *PredBr = dyn_cast<BranchInst>(PredBB->getTerminator());
173 return {PredBB, SuccBB};
175 auto *SinglePredBB = PredBB->getSinglePredecessor();
177 return {
nullptr,
nullptr};
181 if (Visited.
count(SinglePredBB))
182 return {
nullptr,
nullptr};
185 PredBB = SinglePredBB;
198 TrueWeight, TrueWeight + FalseWeight)
200 FalseWeight, TrueWeight + FalseWeight));
203 if (!PredOutEdge.first)
211 uint64_t PredTrueWeight, PredFalseWeight;
249 std::make_unique<DomTreeUpdater>(
250 &DT,
nullptr, DomTreeUpdater::UpdateStrategy::Lazy),
251 std::nullopt, std::nullopt);
259#if defined(EXPENSIVE_CHECKS)
261 DominatorTree::VerificationLevel::Full) &&
262 "DT broken after JumpThreading");
266 "PDT broken after JumpThreading");
269 DominatorTree::VerificationLevel::Fast) &&
270 "DT broken after JumpThreading");
274 "PDT broken after JumpThreading");
277 return getPreservedAnalysis();
284 std::unique_ptr<DomTreeUpdater> DTU_,
285 std::optional<BlockFrequencyInfo *> BFI_,
286 std::optional<BranchProbabilityInfo *> BPI_) {
294 DTU = std::move(DTU_);
298 F->
getParent(), Intrinsic::experimental_guard);
299 HasGuards = GuardDecl && !GuardDecl->use_empty();
308 BBDupThreshold = DefaultBBDupThreshold;
313 assert(DTU &&
"DTU isn't passed into JumpThreading before using it.");
314 assert(DTU->hasDomTree() &&
"JumpThreading relies on DomTree to proceed.");
323 bool EverChanged =
false;
327 for (
auto &BB : *
F) {
328 if (Unreachable.
count(&BB))
331 Changed = ChangedSinceLastAnalysisUpdate =
true;
341 if (&BB == &
F->getEntryBlock() || DTU->isBBPendingDeletion(&BB))
348 <<
"' with terminator: " << *BB.getTerminator()
350 LoopHeaders.erase(&BB);
353 Changed = ChangedSinceLastAnalysisUpdate =
true;
359 auto *BI = dyn_cast<BranchInst>(BB.getTerminator());
360 if (BI && BI->isUnconditional()) {
364 BB.getFirstNonPHIOrDbg(
true)->isTerminator() &&
367 !LoopHeaders.count(&BB) && !LoopHeaders.count(Succ) &&
373 Changed = ChangedSinceLastAnalysisUpdate =
true;
377 EverChanged |= Changed;
393 bool Changed =
false;
398 if (
Cond->getParent() == KnownAtEndOfBB)
403 DVR.replaceVariableLocationOp(
Cond, ToVal,
true);
413 Changed |=
I.replaceUsesOfWith(
Cond, ToVal);
415 if (
Cond->use_empty() && !
Cond->mayHaveSideEffects()) {
416 Cond->eraseFromParent();
428 unsigned Threshold) {
429 assert(StopAt->
getParent() == BB &&
"Not an instruction from proper BB?");
434 unsigned PhiCount = 0;
437 if (!isa<PHINode>(&
I)) {
456 if (isa<SwitchInst>(StopAt))
460 if (isa<IndirectBrInst>(StopAt))
471 for (; &*
I != StopAt; ++
I) {
474 if (
Size > Threshold)
479 if (
I->getType()->isTokenTy() &&
I->isUsedOutsideOfBlock(BB))
484 if (
const CallInst *CI = dyn_cast<CallInst>(
I))
485 if (CI->cannotDuplicate() || CI->isConvergent())
499 if (
const CallInst *CI = dyn_cast<CallInst>(
I)) {
500 if (!isa<IntrinsicInst>(CI))
502 else if (!CI->getType()->isVectorTy())
507 return Size > Bonus ?
Size - Bonus : 0;
528 for (
const auto &Edge : Edges)
529 LoopHeaders.insert(Edge.second);
542 if (
UndefValue *U = dyn_cast<UndefValue>(Val))
548 return dyn_cast<ConstantInt>(Val);
567 if (!RecursionSet.
insert(V).second)
573 Result.emplace_back(KC, Pred);
575 return !Result.empty();
581 if (!
I ||
I->getParent() != BB) {
586 using namespace PatternMatch;
600 Result.emplace_back(KC,
P);
603 return !Result.empty();
607 if (
PHINode *PN = dyn_cast<PHINode>(
I)) {
608 for (
unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) {
609 Value *InVal = PN->getIncomingValue(i);
611 Result.emplace_back(KC, PN->getIncomingBlock(i));
614 PN->getIncomingBlock(i),
617 Result.emplace_back(KC, PN->getIncomingBlock(i));
621 return !Result.empty();
625 if (
CastInst *CI = dyn_cast<CastInst>(
I)) {
626 Value *Source = CI->getOperand(0);
634 for (
auto &Val : Vals)
637 Result.emplace_back(Folded, Val.second);
639 return !Result.empty();
643 Value *Source = FI->getOperand(0);
651 return !Result.empty();
655 if (
I->getType()->getPrimitiveSizeInBits() == 1) {
656 using namespace PatternMatch;
684 for (
const auto &LHSVal : LHSVals)
685 if (LHSVal.first == InterestingVal || isa<UndefValue>(LHSVal.first)) {
686 Result.emplace_back(InterestingVal, LHSVal.second);
687 LHSKnownBBs.
insert(LHSVal.second);
689 for (
const auto &RHSVal : RHSVals)
690 if (RHSVal.first == InterestingVal || isa<UndefValue>(RHSVal.first)) {
693 if (!LHSKnownBBs.
count(RHSVal.second))
694 Result.emplace_back(InterestingVal, RHSVal.second);
697 return !Result.empty();
701 if (
I->getOpcode() == Instruction::Xor &&
702 isa<ConstantInt>(
I->getOperand(1)) &&
703 cast<ConstantInt>(
I->getOperand(1))->isOne()) {
710 for (
auto &R : Result)
720 if (
ConstantInt *CI = dyn_cast<ConstantInt>(BO->getOperand(1))) {
726 for (
const auto &LHSVal : LHSVals) {
732 Result.emplace_back(KC, LHSVal.second);
736 return !Result.empty();
740 if (
CmpInst *Cmp = dyn_cast<CmpInst>(
I)) {
743 Type *CmpType = Cmp->getType();
744 Value *CmpLHS = Cmp->getOperand(0);
745 Value *CmpRHS = Cmp->getOperand(1);
748 PHINode *PN = dyn_cast<PHINode>(CmpLHS);
750 PN = dyn_cast<PHINode>(CmpRHS);
754 if (PN && PN->
getParent() == BB && !LoopHeaders.contains(BB)) {
770 if (!isa<Constant>(
RHS))
774 auto LHSInst = dyn_cast<Instruction>(
LHS);
775 if (LHSInst && LHSInst->getParent() == BB)
779 BB, CxtI ? CxtI : Cmp);
783 Result.emplace_back(KC, PredBB);
786 return !Result.empty();
791 if (isa<Constant>(CmpRHS) && !CmpType->
isVectorTy()) {
792 Constant *CmpConst = cast<Constant>(CmpRHS);
794 if (!isa<Instruction>(CmpLHS) ||
795 cast<Instruction>(CmpLHS)->
getParent() != BB) {
802 Result.emplace_back(KC,
P);
805 return !Result.empty();
812 using namespace PatternMatch;
816 if (isa<ConstantInt>(CmpConst) &&
818 if (!isa<Instruction>(AddLHS) ||
819 cast<Instruction>(AddLHS)->
getParent() != BB) {
825 AddLHS,
P, BB, CxtI ? CxtI : cast<Instruction>(CmpLHS));
831 Pred, cast<ConstantInt>(CmpConst)->getValue());
841 Result.emplace_back(ResC,
P);
844 return !Result.empty();
855 for (
const auto &LHSVal : LHSVals) {
860 Result.emplace_back(KC, LHSVal.second);
863 return !Result.empty();
873 if ((TrueVal || FalseVal) &&
876 for (
auto &
C : Conds) {
883 KnownCond = CI->isOne();
885 assert(isa<UndefValue>(
Cond) &&
"Unexpected condition value");
889 KnownCond = (TrueVal !=
nullptr);
893 if (
Constant *Val = KnownCond ? TrueVal : FalseVal)
894 Result.emplace_back(Val,
C.second);
897 return !Result.empty();
906 Result.emplace_back(KC, Pred);
909 return !Result.empty();
919 unsigned MinSucc = 0;
922 unsigned MinNumPreds =
pred_size(TestBB);
926 if (NumPreds < MinNumPreds) {
928 MinNumPreds = NumPreds;
950 if (DTU->isBBPendingDeletion(BB) ||
975 if (
BranchInst *BI = dyn_cast<BranchInst>(Terminator)) {
977 if (BI->isUnconditional())
return false;
978 Condition = BI->getCondition();
979 }
else if (
SwitchInst *SI = dyn_cast<SwitchInst>(Terminator)) {
980 Condition = SI->getCondition();
981 }
else if (
IndirectBrInst *IB = dyn_cast<IndirectBrInst>(Terminator)) {
983 if (IB->getNumSuccessors() == 0)
return false;
984 Condition = IB->getAddress()->stripPointerCasts();
991 bool ConstantFolded =
false;
995 if (
Instruction *
I = dyn_cast<Instruction>(Condition)) {
999 I->replaceAllUsesWith(SimpleVal);
1001 I->eraseFromParent();
1002 Condition = SimpleVal;
1003 ConstantFolded =
true;
1009 auto *FI = dyn_cast<FreezeInst>(Condition);
1010 if (isa<UndefValue>(Condition) ||
1011 (FI && isa<UndefValue>(FI->getOperand(0)) && FI->hasOneUse())) {
1013 std::vector<DominatorTree::UpdateType> Updates;
1019 if (i == BestSucc)
continue;
1026 <<
"' folding undef terminator: " << *BBTerm <<
'\n');
1031 DTU->applyUpdatesPermissive(Updates);
1033 FI->eraseFromParent();
1046 if (
auto *BPI = getBPI())
1047 BPI->eraseBlock(BB);
1051 Instruction *CondInst = dyn_cast<Instruction>(Condition);
1058 return ConstantFolded;
1062 Value *CondWithoutFreeze = CondInst;
1063 if (
auto *FI = dyn_cast<FreezeInst>(CondInst))
1064 CondWithoutFreeze = FI->getOperand(0);
1066 if (
CmpInst *CondCmp = dyn_cast<CmpInst>(CondWithoutFreeze)) {
1070 if (
Constant *CondConst = dyn_cast<Constant>(CondCmp->getOperand(1))) {
1072 LVI->
getPredicateAt(CondCmp->getPredicate(), CondCmp->getOperand(0),
1102 Value *SimplifyValue = CondWithoutFreeze;
1104 if (
CmpInst *CondCmp = dyn_cast<CmpInst>(SimplifyValue))
1105 if (isa<Constant>(CondCmp->getOperand(1)))
1106 SimplifyValue = CondCmp->getOperand(0);
1110 if (
LoadInst *LoadI = dyn_cast<LoadInst>(SimplifyValue))
1115 if (
PHINode *PN = dyn_cast<PHINode>(CondInst))
1116 if (PN->getParent() == BB && isa<BranchInst>(BB->
getTerminator()))
1127 PHINode *PN = dyn_cast<PHINode>(CondWithoutFreeze);
1132 if (CondInst->
getOpcode() == Instruction::Xor &&
1146 if (!BI || !BI->isConditional())
1155 auto *FICond = dyn_cast<FreezeInst>(
Cond);
1156 if (FICond && FICond->hasOneUse())
1157 Cond = FICond->getOperand(0);
1168 auto *PBI = dyn_cast<BranchInst>(CurrentPred->
getTerminator());
1169 if (!PBI || !PBI->isConditional())
1171 if (PBI->getSuccessor(0) != CurrentBB && PBI->getSuccessor(1) != CurrentBB)
1174 bool CondIsTrue = PBI->getSuccessor(0) == CurrentBB;
1175 std::optional<bool> Implication =
1180 if (!Implication && FICond && isa<FreezeInst>(PBI->getCondition())) {
1181 if (cast<FreezeInst>(PBI->getCondition())->getOperand(0) ==
1182 FICond->getOperand(0))
1183 Implication = CondIsTrue;
1187 BasicBlock *KeepSucc = BI->getSuccessor(*Implication ? 0 : 1);
1188 BasicBlock *RemoveSucc = BI->getSuccessor(*Implication ? 1 : 0);
1193 BI->eraseFromParent();
1195 FICond->eraseFromParent();
1198 if (
auto *BPI = getBPI())
1199 BPI->eraseBlock(BB);
1202 CurrentBB = CurrentPred;
1212 if (OpInst->getParent() == BB)
1257 LoadInst *NLoadI = cast<LoadInst>(AvailableVal);
1264 if (AvailableVal == LoadI)
1266 if (AvailableVal->getType() != LoadI->
getType()) {
1269 cast<Instruction>(AvailableVal)->setDebugLoc(LoadI->
getDebugLoc());
1279 if (BBIt != LoadBB->
begin())
1290 AvailablePredsTy AvailablePreds;
1298 if (!PredsScanned.
insert(PredBB).second)
1301 BBIt = PredBB->
end();
1302 unsigned NumScanedInst = 0;
1303 Value *PredAvailable =
nullptr;
1307 "Attempting to CSE volatile or atomic loads");
1317 &BatchAA, &IsLoadCSE, &NumScanedInst);
1322 while (!PredAvailable && SinglePredBB && BBIt == SinglePredBB->
begin() &&
1326 BBIt = SinglePredBB->
end();
1328 Loc, AccessTy, LoadI->
isAtomic(), SinglePredBB, BBIt,
1334 if (!PredAvailable) {
1335 OneUnavailablePred = PredBB;
1340 CSELoads.
push_back(cast<LoadInst>(PredAvailable));
1344 AvailablePreds.emplace_back(PredBB, PredAvailable);
1349 if (AvailablePreds.empty())
return false;
1366 if (PredsScanned.
size() != AvailablePreds.size() &&
1368 for (
auto I = LoadBB->
begin(); &*
I != LoadI; ++
I)
1375 if (PredsScanned.
size() == AvailablePreds.size()+1 &&
1377 UnavailablePred = OneUnavailablePred;
1378 }
else if (PredsScanned.
size() != AvailablePreds.size()) {
1384 for (
const auto &AvailablePred : AvailablePreds)
1385 AvailablePredSet.
insert(AvailablePred.first);
1390 if (isa<IndirectBrInst>(
P->getTerminator()))
1393 if (!AvailablePredSet.
count(
P))
1398 UnavailablePred = splitBlockPreds(LoadBB, PredsToSplit,
"thread-pre-split");
1404 if (UnavailablePred) {
1406 "Can't handle critical edge here!");
1416 AvailablePreds.emplace_back(UnavailablePred, NewVal);
1432 AvailablePredsTy::iterator
I =
1435 assert(
I != AvailablePreds.end() &&
I->first ==
P &&
1436 "Didn't find entry for predecessor!");
1442 Value *&PredV =
I->second;
1445 PredV, LoadI->
getType(),
"",
P->getTerminator()->getIterator());
1450 for (
LoadInst *PredLoadI : CSELoads) {
1468 assert(!PredToDestList.empty());
1480 DestPopularity[
nullptr] = 0;
1482 DestPopularity[SuccBB] = 0;
1484 for (
const auto &PredToDest : PredToDestList)
1485 if (PredToDest.second)
1486 DestPopularity[PredToDest.second]++;
1492 return MostPopular->first;
1502 assert(PredBB &&
"Expected a single predecessor");
1504 if (
Constant *Cst = dyn_cast<Constant>(V)) {
1510 if (!
I || (
I->getParent() != BB &&
I->getParent() != PredBB)) {
1516 if (
PHI->getParent() == PredBB)
1517 return dyn_cast<Constant>(
PHI->getIncomingValueForBlock(PredPredBB));
1522 if (
CmpInst *CondCmp = dyn_cast<CmpInst>(V)) {
1523 if (CondCmp->getParent() == BB) {
1544 if (LoopHeaders.count(BB))
1556 "computeValueKnownInPredecessors returned true with no values");
1559 for (
const auto &PredValue : PredValues) {
1561 <<
"': FOUND condition = " << *PredValue.first
1562 <<
" for pred '" << PredValue.second->getName() <<
"'.\n";
1577 for (
const auto &PredValue : PredValues) {
1579 if (!SeenPreds.insert(Pred).second)
1585 if (isa<UndefValue>(Val))
1588 assert(isa<ConstantInt>(Val) &&
"Expecting a constant integer");
1589 DestBB = BI->getSuccessor(cast<ConstantInt>(Val)->
isZero());
1591 assert(isa<ConstantInt>(Val) &&
"Expecting a constant integer");
1592 DestBB = SI->findCaseValue(cast<ConstantInt>(Val))->getCaseSuccessor();
1595 &&
"Unexpected terminator");
1596 assert(isa<BlockAddress>(Val) &&
"Expecting a constant blockaddress");
1597 DestBB = cast<BlockAddress>(Val)->getBasicBlock();
1601 if (PredToDestList.
empty()) {
1605 if (OnlyDest != DestBB)
1606 OnlyDest = MultipleDestSentinel;
1610 OnlyVal = MultipleVal;
1622 if (PredToDestList.
empty())
1628 if (OnlyDest && OnlyDest != MultipleDestSentinel) {
1630 bool SeenFirstBranchToOnlyDest =
false;
1631 std::vector <DominatorTree::UpdateType> Updates;
1634 if (SuccBB == OnlyDest && !SeenFirstBranchToOnlyDest) {
1635 SeenFirstBranchToOnlyDest =
true;
1637 SuccBB->removePredecessor(BB,
true);
1647 Term->eraseFromParent();
1648 DTU->applyUpdatesPermissive(Updates);
1649 if (
auto *BPI = getBPI())
1650 BPI->eraseBlock(BB);
1654 if (
auto *CondInst = dyn_cast<Instruction>(
Cond)) {
1655 if (CondInst->use_empty() && !CondInst->mayHaveSideEffects())
1656 CondInst->eraseFromParent();
1664 else if (OnlyVal && OnlyVal != MultipleVal)
1677 if (MostPopularDest == MultipleDestSentinel) {
1682 [&](
const std::pair<BasicBlock *, BasicBlock *> &PredToDest) {
1683 return LoopHeaders.contains(PredToDest.second);
1686 if (PredToDestList.
empty())
1695 for (
const auto &PredToDest : PredToDestList)
1696 if (PredToDest.second == MostPopularDest) {
1709 if (!MostPopularDest)
1738 if (PredBr->isUnconditional()) {
1739 PredBBs[0] = PredBB;
1763 if (!isa<PHINode>(BB->
front()))
1800 "computeValueKnownInPredecessors returned true with no values");
1804 unsigned NumTrue = 0, NumFalse = 0;
1805 for (
const auto &XorOpValue : XorOpValues) {
1806 if (isa<UndefValue>(XorOpValue.first))
1809 if (cast<ConstantInt>(XorOpValue.first)->isZero())
1817 if (NumTrue > NumFalse)
1819 else if (NumTrue != 0 || NumFalse != 0)
1825 for (
const auto &XorOpValue : XorOpValues) {
1826 if (XorOpValue.first != SplitVal && !isa<UndefValue>(XorOpValue.first))
1829 BlocksToFoldInto.
push_back(XorOpValue.second);
1834 if (BlocksToFoldInto.
size() ==
1835 cast<PHINode>(BB->
front()).getNumIncomingValues()) {
1873 Value *
IV = PN.getIncomingValueForBlock(OldPred);
1882 PN.addIncoming(
IV, NewPred);
1898 if (LoopHeaders.erase(SinglePred))
1899 LoopHeaders.insert(BB);
1952 for (
Use &U :
I.uses()) {
1955 if (UserPN->getIncomingBlock(U) == BB)
1957 }
else if (
User->getParent() == BB)
1973 if (UsesToRename.
empty() && DbgValues.
empty() && DbgVariableRecords.
empty())
1975 LLVM_DEBUG(
dbgs() <<
"JT: Renaming non-local uses of: " <<
I <<
"\n");
1984 while (!UsesToRename.
empty())
1986 if (!DbgValues.
empty() || !DbgVariableRecords.
empty()) {
1990 DbgVariableRecords.
clear();
2011 auto RetargetDbgValueIfPossible = [&](
Instruction *NewInst) ->
bool {
2012 auto DbgInstruction = dyn_cast<DbgValueInst>(NewInst);
2013 if (!DbgInstruction)
2017 for (
auto DbgOperand : DbgInstruction->location_ops()) {
2018 auto DbgOperandInstruction = dyn_cast<Instruction>(DbgOperand);
2019 if (!DbgOperandInstruction)
2022 auto I = ValueMapping.
find(DbgOperandInstruction);
2023 if (
I != ValueMapping.
end()) {
2025 std::pair<Value *, Value *>(DbgOperand,
I->second));
2029 for (
auto &[OldOp, MappedOp] : OperandsToRemap)
2030 DbgInstruction->replaceVariableLocationOp(OldOp, MappedOp);
2038 for (
auto *
Op : DVR->location_ops()) {
2043 auto I = ValueMapping.
find(OpInst);
2044 if (
I != ValueMapping.
end())
2045 OperandsToRemap.
insert({OpInst,
I->second});
2048 for (
auto &[OldOp, MappedOp] : OperandsToRemap)
2049 DVR->replaceVariableLocationOp(OldOp, MappedOp);
2057 for (;
PHINode *PN = dyn_cast<PHINode>(BI); ++BI) {
2060 ValueMapping[PN] = NewPN;
2075 RetargetDbgVariableRecordIfPossible(&DVR);
2081 for (; BI != BE; ++BI) {
2083 New->setName(BI->getName());
2084 New->insertInto(NewBB, NewBB->
end());
2085 ValueMapping[&*BI] = New;
2088 CloneAndRemapDbgInfo(New, &*BI);
2090 if (RetargetDbgValueIfPossible(New))
2094 for (
unsigned i = 0, e = New->getNumOperands(); i != e; ++i)
2095 if (
Instruction *Inst = dyn_cast<Instruction>(New->getOperand(i))) {
2097 if (
I != ValueMapping.
end())
2098 New->setOperand(i,
I->second);
2104 if (BE != RangeBB->
end() && BE->hasDbgRecords()) {
2110 RetargetDbgVariableRecordIfPossible(&DVR);
2168 if (LoopHeaders.count(PredBB))
2178 unsigned ZeroCount = 0;
2179 unsigned OneCount = 0;
2185 if (isa<IndirectBrInst>(
P->getTerminator()))
2187 if (
ConstantInt *CI = dyn_cast_or_null<ConstantInt>(
2192 }
else if (CI->isOne()) {
2201 if (ZeroCount == 1) {
2202 PredPredBB = ZeroPred;
2203 }
else if (OneCount == 1) {
2204 PredPredBB = OnePred;
2214 <<
"' - would thread to self!\n");
2220 if (LoopHeaders.count(BB) || LoopHeaders.count(SuccBB)) {
2222 bool BBIsHeader = LoopHeaders.count(BB);
2223 bool SuccIsHeader = LoopHeaders.count(SuccBB);
2224 dbgs() <<
" Not threading across "
2225 << (BBIsHeader ?
"loop header BB '" :
"block BB '")
2226 << BB->
getName() <<
"' to dest "
2227 << (SuccIsHeader ?
"loop header BB '" :
"block BB '")
2229 <<
"' - it might create an irreducible loop!\n";
2243 if (BBCost > BBDupThreshold || PredBBCost > BBDupThreshold ||
2244 BBCost + PredBBCost > BBDupThreshold) {
2246 <<
"' - Cost is too high: " << PredBBCost
2247 <<
" for PredBB, " << BBCost <<
"for BB\n");
2264 bool HasProfile = doesBlockHaveProfileData(BB);
2265 auto *BFI = getOrCreateBFI(HasProfile);
2266 auto *BPI = getOrCreateBPI(BFI !=
nullptr);
2278 assert(BPI &&
"It's expected BPI to exist along with BFI");
2279 auto NewBBFreq = BFI->getBlockFreq(PredPredBB) *
2280 BPI->getEdgeProbability(PredPredBB, PredBB);
2281 BFI->setBlockFreq(NewBB, NewBBFreq);
2293 BPI->copyEdgeProbabilities(PredBB, NewBB);
2310 DTU->applyUpdatesPermissive(
2335 <<
"' - would thread to self!\n");
2341 if (LoopHeaders.count(BB) || LoopHeaders.count(SuccBB)) {
2343 bool BBIsHeader = LoopHeaders.count(BB);
2344 bool SuccIsHeader = LoopHeaders.count(SuccBB);
2345 dbgs() <<
" Not threading across "
2346 << (BBIsHeader ?
"loop header BB '" :
"block BB '") << BB->
getName()
2347 <<
"' to dest " << (SuccIsHeader ?
"loop header BB '" :
"block BB '")
2348 << SuccBB->
getName() <<
"' - it might create an irreducible loop!\n";
2355 if (JumpThreadCost > BBDupThreshold) {
2357 <<
"' - Cost is too high: " << JumpThreadCost <<
"\n");
2371 assert(SuccBB != BB &&
"Don't create an infinite loop");
2373 assert(!LoopHeaders.count(BB) && !LoopHeaders.count(SuccBB) &&
2374 "Don't thread across loop headers");
2377 bool HasProfile = doesBlockHaveProfileData(BB);
2378 auto *BFI = getOrCreateBFI(HasProfile);
2379 auto *BPI = getOrCreateBPI(BFI !=
nullptr);
2383 if (PredBBs.
size() == 1)
2384 PredBB = PredBBs[0];
2387 <<
" common predecessors.\n");
2388 PredBB = splitBlockPreds(BB, PredBBs,
".thr_comm");
2393 <<
"' to '" << SuccBB->
getName()
2394 <<
", across block:\n " << *BB <<
"\n");
2405 assert(BPI &&
"It's expected BPI to exist along with BFI");
2407 BFI->getBlockFreq(PredBB) * BPI->getEdgeProbability(PredBB, BB);
2408 BFI->setBlockFreq(NewBB, NewBBFreq);
2448 updateBlockFreqAndEdgeWeight(PredBB, BB, NewBB, SuccBB, BFI, BPI, HasProfile);
2459 const char *Suffix) {
2465 auto *BFI = getBFI();
2467 auto *BPI = getOrCreateBPI(
true);
2468 for (
auto *Pred : Preds)
2469 FreqMap.
insert(std::make_pair(
2470 Pred, BFI->getBlockFreq(Pred) * BPI->getEdgeProbability(Pred, BB)));
2476 std::string NewName = std::string(Suffix) +
".split-lp";
2482 std::vector<DominatorTree::UpdateType> Updates;
2483 Updates.reserve((2 * Preds.size()) + NewBBs.
size());
2484 for (
auto *NewBB : NewBBs) {
2491 NewBBFreq += FreqMap.
lookup(Pred);
2494 BFI->setBlockFreq(NewBB, NewBBFreq);
2497 DTU->applyUpdatesPermissive(Updates);
2501bool JumpThreadingPass::doesBlockHaveProfileData(
BasicBlock *BB) {
2512void JumpThreadingPass::updateBlockFreqAndEdgeWeight(
BasicBlock *PredBB,
2519 assert(((BFI && BPI) || (!BFI && !BFI)) &&
2520 "Both BFI & BPI should either be set or unset");
2524 "It's expected to have BFI/BPI when profile info exists");
2530 auto BBOrigFreq =
BFI->getBlockFreq(BB);
2531 auto NewBBFreq =
BFI->getBlockFreq(NewBB);
2533 auto BBNewFreq = BBOrigFreq - NewBBFreq;
2534 BFI->setBlockFreq(BB, BBNewFreq);
2540 auto SuccFreq = (Succ == SuccBB)
2541 ? BB2SuccBBFreq - NewBBFreq
2543 BBSuccFreq.
push_back(SuccFreq.getFrequency());
2549 if (MaxBBSuccFreq == 0)
2551 {1, static_cast<unsigned>(BBSuccFreq.size())});
2598 if (BBSuccProbs.
size() >= 2 && HasProfile) {
2600 for (
auto Prob : BBSuccProbs)
2615 assert(!PredBBs.
empty() &&
"Can't handle an empty set");
2620 if (LoopHeaders.count(BB)) {
2622 <<
"' into predecessor block '" << PredBBs[0]->getName()
2623 <<
"' - it might create an irreducible loop!\n");
2629 if (DuplicationCost > BBDupThreshold) {
2631 <<
"' - Cost is too high: " << DuplicationCost <<
"\n");
2636 std::vector<DominatorTree::UpdateType> Updates;
2638 if (PredBBs.
size() == 1)
2639 PredBB = PredBBs[0];
2642 <<
" common predecessors.\n");
2643 PredBB = splitBlockPreds(BB, PredBBs,
".thr_comm");
2650 <<
"' into end of '" << PredBB->
getName()
2651 <<
"' to eliminate branch on phi. Cost: "
2652 << DuplicationCost <<
" block is:" << *BB <<
"\n");
2672 for (;
PHINode *PN = dyn_cast<PHINode>(BI); ++BI)
2676 for (; BI != BB->
end(); ++BI) {
2678 New->insertInto(PredBB, OldPredBranch->
getIterator());
2681 for (
unsigned i = 0, e = New->getNumOperands(); i != e; ++i)
2682 if (
Instruction *Inst = dyn_cast<Instruction>(New->getOperand(i))) {
2684 if (
I != ValueMapping.
end())
2685 New->setOperand(i,
I->second);
2697 ValueMapping[&*BI] =
IV;
2698 if (!New->mayHaveSideEffects()) {
2699 New->eraseFromParent();
2706 ValueMapping[&*BI] = New;
2710 New->setName(BI->getName());
2712 New->cloneDebugInfoFrom(&*BI);
2714 for (
unsigned i = 0, e = New->getNumOperands(); i != e; ++i)
2715 if (
BasicBlock *SuccBB = dyn_cast<BasicBlock>(New->getOperand(i)))
2736 if (
auto *BPI = getBPI())
2738 DTU->applyUpdatesPermissive(Updates);
2769 BI->applyMergedLocation(PredTerm->
getDebugLoc(), SI->getDebugLoc());
2770 BI->copyMetadata(*SI, {LLVMContext::MD_prof});
2778 (TrueWeight + FalseWeight) != 0) {
2781 TrueWeight, TrueWeight + FalseWeight));
2783 FalseWeight, TrueWeight + FalseWeight));
2785 if (
auto *BPI = getBPI())
2789 if (
auto *BFI = getBFI()) {
2790 if ((TrueWeight + FalseWeight) == 0) {
2795 TrueWeight, TrueWeight + FalseWeight);
2796 auto NewBBFreq = BFI->getBlockFreq(Pred) * PredToNewBBProb;
2797 BFI->setBlockFreq(NewBB, NewBBFreq);
2801 SI->eraseFromParent();
2807 PHINode *Phi = dyn_cast<PHINode>(BI); ++BI)
2809 Phi->addIncoming(Phi->getIncomingValueForBlock(Pred), NewBB);
2813 PHINode *CondPHI = dyn_cast<PHINode>(SI->getCondition());
2815 if (!CondPHI || CondPHI->
getParent() != BB)
2865 if (!SI || SI->getParent() != Pred || !SI->hasOneUse())
2877 CondRHS, Pred, BB, CondCmp);
2880 CondRHS, Pred, BB, CondCmp);
2881 if ((LHSRes || RHSRes) && LHSRes != RHSRes) {
2917 if (LoopHeaders.count(BB))
2921 PHINode *PN = dyn_cast<PHINode>(BI); ++BI) {
2924 [](
Value *V) { return !isa<ConstantInt>(V); }))
2928 using namespace PatternMatch;
2931 if (SI->getParent() != BB)
2935 return Cond &&
Cond == V &&
Cond->getType()->isIntegerTy(1) && !IsAndOr;
2939 for (
Use &U : PN->uses()) {
2940 if (
ICmpInst *Cmp = dyn_cast<ICmpInst>(U.getUser())) {
2943 if (Cmp->getParent() == BB && Cmp->hasOneUse() &&
2944 isa<ConstantInt>(Cmp->getOperand(1 - U.getOperandNo())))
2945 if (
SelectInst *SelectI = dyn_cast<SelectInst>(Cmp->user_back()))
2946 if (isUnfoldCandidate(SelectI, Cmp->use_begin()->get())) {
2950 }
else if (
SelectInst *SelectI = dyn_cast<SelectInst>(U.getUser())) {
2952 if (isUnfoldCandidate(SelectI, U.get())) {
2971 NewPN->
addIncoming(SI->getTrueValue(), Term->getParent());
2974 SI->replaceAllUsesWith(NewPN);
2975 SI->eraseFromParent();
2977 std::vector<DominatorTree::UpdateType> Updates;
2987 DTU->applyUpdatesPermissive(Updates);
3013 using namespace PatternMatch;
3035 if (
auto *BI = dyn_cast<BranchInst>(Parent->getTerminator()))
3056 bool TrueDestIsSafe =
false;
3057 bool FalseDestIsSafe =
false;
3062 TrueDestIsSafe =
true;
3067 FalseDestIsSafe =
true;
3070 if (!TrueDestIsSafe && !FalseDestIsSafe)
3073 BasicBlock *PredUnguardedBlock = TrueDestIsSafe ? TrueDest : FalseDest;
3074 BasicBlock *PredGuardedBlock = FalseDestIsSafe ? TrueDest : FalseDest;
3080 if (
Cost > BBDupThreshold)
3085 BB, PredGuardedBlock, AfterGuard, GuardedMapping, *DTU);
3086 assert(GuardedBlock &&
"Could not create the guarded block?");
3091 BB, PredUnguardedBlock, Guard, UnguardedMapping, *DTU);
3092 assert(UnguardedBlock &&
"Could not create the unguarded block?");
3094 << GuardedBlock->
getName() <<
"\n");
3099 for (
auto BI = BB->
begin(); &*BI != AfterGuard; ++BI)
3100 if (!isa<PHINode>(&*BI))
3107 if (!Inst->use_empty()) {
3109 NewPN->
addIncoming(UnguardedMapping[Inst], UnguardedBlock);
3110 NewPN->
addIncoming(GuardedMapping[Inst], GuardedBlock);
3113 Inst->replaceAllUsesWith(NewPN);
3115 Inst->dropDbgRecords();
3116 Inst->eraseFromParent();
3131template <
typename AnalysisT>
3132typename AnalysisT::Result *JumpThreadingPass::runExternalAnalysis() {
3133 assert(FAM &&
"Can't run external analysis without FunctionAnalysisManager");
3138 if (!ChangedSinceLastAnalysisUpdate) {
3139 assert(!DTU->hasPendingUpdates() &&
3140 "Lost update of 'ChangedSinceLastAnalysisUpdate'?");
3144 ChangedSinceLastAnalysisUpdate =
false;
3146 auto PA = getPreservedAnalysis();
3156 assert(DTU->getDomTree().verify(DominatorTree::VerificationLevel::Fast));
3157 assert((!DTU->hasPostDomTree() ||
3158 DTU->getPostDomTree().verify(
3172 assert(FAM &&
"Can't create BPI without FunctionAnalysisManager");
3180 assert(FAM &&
"Can't create BFI without FunctionAnalysisManager");
3190 auto *Res = getBPI();
3195 BPI = runExternalAnalysis<BranchProbabilityAnalysis>();
3201 auto *Res = getBFI();
3206 BFI = runExternalAnalysis<BlockFrequencyAnalysis>();
ReachingDefAnalysis InstSet & ToRemove
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static const Function * getParent(const Value *V)
BlockVerifier::State From
This file contains the declarations for the subclasses of Constant, which represent the different fla...
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
This file defines the DenseMap class.
This is the interface for a simple mod/ref and alias analysis over globals.
This file provides various utilities for inspecting and working with the control flow graph in LLVM I...
Module.h This file contains the declarations for the Module class.
This header defines various interfaces for pass management in LLVM.
This defines the Use class.
static unsigned getBestDestForJumpOnUndef(BasicBlock *BB)
GetBestDestForBranchOnUndef - If we determine that the specified block ends in an undefined jump,...
static cl::opt< unsigned > PhiDuplicateThreshold("jump-threading-phi-threshold", cl::desc("Max PHIs in BB to duplicate for jump threading"), cl::init(76), cl::Hidden)
static bool replaceFoldableUses(Instruction *Cond, Value *ToVal, BasicBlock *KnownAtEndOfBB)
static cl::opt< unsigned > BBDuplicateThreshold("jump-threading-threshold", cl::desc("Max block size to duplicate for jump threading"), cl::init(6), cl::Hidden)
static cl::opt< bool > ThreadAcrossLoopHeaders("jump-threading-across-loop-headers", cl::desc("Allow JumpThreading to thread across loop headers, for testing"), cl::init(false), cl::Hidden)
static unsigned getJumpThreadDuplicationCost(const TargetTransformInfo *TTI, BasicBlock *BB, Instruction *StopAt, unsigned Threshold)
Return the cost of duplicating a piece of this block from first non-phi and before StopAt instruction...
static void addPHINodeEntriesForMappedBlock(BasicBlock *PHIBB, BasicBlock *OldPred, BasicBlock *NewPred, ValueToValueMapTy &ValueMap)
addPHINodeEntriesForMappedBlock - We're adding 'NewPred' as a new predecessor to the PHIBB block.
static BasicBlock * findMostPopularDest(BasicBlock *BB, const SmallVectorImpl< std::pair< BasicBlock *, BasicBlock * > > &PredToDestList)
findMostPopularDest - The specified list contains multiple possible threadable destinations.
static Constant * getKnownConstant(Value *Val, ConstantPreference Preference)
getKnownConstant - Helper method to determine if we can thread over a terminator with the given value...
static cl::opt< unsigned > ImplicationSearchThreshold("jump-threading-implication-search-threshold", cl::desc("The number of predecessors to search for a stronger " "condition to use to thread over a weaker condition"), cl::init(3), cl::Hidden)
static bool isOpDefinedInBlock(Value *Op, BasicBlock *BB)
Return true if Op is an instruction defined in the given block.
static void updatePredecessorProfileMetadata(PHINode *PN, BasicBlock *BB)
static bool hasAddressTakenAndUsed(BasicBlock *BB)
See the comments on JumpThreadingPass.
static bool isZero(Value *V, const DataLayout &DL, DominatorTree *DT, AssumptionCache *AC)
This file implements a map that provides insertion order iteration.
This file provides utility analysis objects describing memory locations.
This file contains the declarations for profiling metadata utility functions.
const SmallVectorImpl< MachineOperand > & Cond
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file defines the SmallPtrSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
static const uint32_t IV[8]
A manager for alias analyses.
A container for analyses that lazily runs them and caches their results.
void invalidate(IRUnitT &IR, const PreservedAnalyses &PA)
Invalidate cached analyses for an IR unit.
PassT::Result * getCachedResult(IRUnitT &IR) const
Get the cached result of an analysis pass for a given IR unit.
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
LLVM Basic Block Representation.
iterator begin()
Instruction iterator methods.
iterator_range< const_phi_iterator > phis() const
Returns a range that iterates over the phis in the basic block.
const_iterator getFirstInsertionPt() const
Returns an iterator to the first instruction in this block that is suitable for inserting a non-PHI i...
DbgMarker * createMarker(Instruction *I)
Attach a DbgMarker to the given instruction.
bool hasAddressTaken() const
Returns true if there are any uses of this basic block other than direct branches,...
InstListType::const_iterator const_iterator
const Instruction & front() const
static BasicBlock * Create(LLVMContext &Context, const Twine &Name="", Function *Parent=nullptr, BasicBlock *InsertBefore=nullptr)
Creates a new BasicBlock.
void moveAfter(BasicBlock *MovePos)
Unlink this basic block from its current function and insert it right after MovePos in the function M...
bool hasNPredecessors(unsigned N) const
Return true if this block has exactly N predecessors.
const BasicBlock * getSinglePredecessor() const
Return the predecessor of this block if it has a single predecessor block.
const Function * getParent() const
Return the enclosing method, or null if none.
const DataLayout & getDataLayout() const
Get the data layout of the module this basic block belongs to.
DbgMarker * getMarker(InstListType::iterator It)
Return the DbgMarker for the position given by It, so that DbgRecords can be inserted there.
InstListType::iterator iterator
Instruction iterators...
LLVMContext & getContext() const
Get the context in which this basic block lives.
bool isLandingPad() const
Return true if this basic block is a landing pad.
bool isEHPad() const
Return true if this basic block is an exception handling block.
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
void removePredecessor(BasicBlock *Pred, bool KeepOneInputPHIs=false)
Update PHI nodes in this BasicBlock before removal of predecessor Pred.
This class is a wrapper over an AAResults, and it is intended to be used only when there are no IR ch...
void disableDominatorTree()
Disable the use of the dominator tree during alias analysis queries.
The address of a basic block.
static BlockAddress * get(Function *F, BasicBlock *BB)
Return a BlockAddress for the specified function and basic block.
Analysis pass which computes BlockFrequencyInfo.
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Conditional or Unconditional Branch instruction.
bool isConditional() const
unsigned getNumSuccessors() const
static BranchInst * Create(BasicBlock *IfTrue, InsertPosition InsertBefore=nullptr)
BasicBlock * getSuccessor(unsigned i) const
bool isUnconditional() const
Value * getCondition() const
Analysis pass which computes BranchProbabilityInfo.
Analysis providing branch probability information.
void setEdgeProbability(const BasicBlock *Src, const SmallVectorImpl< BranchProbability > &Probs)
Set the raw probabilities for all edges from the given block.
BranchProbability getEdgeProbability(const BasicBlock *Src, unsigned IndexInSuccessors) const
Get an edge's probability, relative to other out-edges of the Src.
void copyEdgeProbabilities(BasicBlock *Src, BasicBlock *Dst)
Copy outgoing edge probabilities from Src to Dst.
static BranchProbability getBranchProbability(uint64_t Numerator, uint64_t Denominator)
uint32_t getNumerator() const
BranchProbability getCompl() const
static void normalizeProbabilities(ProbabilityIter Begin, ProbabilityIter End)
Value * getArgOperand(unsigned i) const
This class represents a function call, abstracting a target machine's calling convention.
This is the base class for all instructions that perform data casts.
static CastInst * CreateBitOrPointerCast(Value *S, Type *Ty, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Create a BitCast, a PtrToInt, or an IntToPTr cast instruction.
This class is the base class for the comparison instructions.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Predicate getPredicate() const
Return the predicate for this instruction.
An abstraction over a floating-point predicate, and a pack of an integer predicate with samesign info...
static Constant * getNot(Constant *C)
This is the shared class of boolean and integer constants.
bool isOne() const
This is just a convenience method to make client code smaller for a common case.
static ConstantInt * getTrue(LLVMContext &Context)
bool isZero() const
This is just a convenience method to make client code smaller for a common code.
static ConstantInt * getFalse(LLVMContext &Context)
const APInt & getValue() const
Return the constant as an APInt value reference.
This class represents a range of values.
ConstantRange add(const ConstantRange &Other) const
Return a new range representing the possible values resulting from an addition of a value in this ran...
static ConstantRange makeExactICmpRegion(CmpInst::Predicate Pred, const APInt &Other)
Produce the exact range such that all values in the returned range satisfy the given predicate with a...
ConstantRange inverse() const
Return a new range that is the logical not of the current set.
bool contains(const APInt &Val) const
Return true if the specified value is in the set.
This is an important base class in LLVM.
void removeDeadConstantUsers() const
If there are any dead constant users dangling off of this constant, remove them.
This class represents an Operation in the Expression.
A parsed version of the target data layout string in and methods for querying it.
Per-instruction record of debug-info.
iterator_range< simple_ilist< DbgRecord >::iterator > cloneDebugInfoFrom(DbgMarker *From, std::optional< simple_ilist< DbgRecord >::iterator > FromHere, bool InsertAtHead=false)
Clone all DbgMarkers from From into this marker.
const BasicBlock * getParent() const
This represents the llvm.dbg.value instruction.
Record of a variable value-assignment, aka a non instruction representation of the dbg....
ValueT lookup(const_arg_type_t< KeyT > Val) const
lookup - Return the entry for the specified key, or a default constructed value if no such entry exis...
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Analysis pass which computes a DominatorTree.
static constexpr UpdateKind Delete
static constexpr UpdateKind Insert
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
bool isReachableFromEntry(const Use &U) const
Provide an overload for a Use.
This class represents a freeze function that returns random concrete value if an operand is either a ...
const BasicBlock & getEntryBlock() const
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
void flush()
Apply all pending updates to available trees and flush all BasicBlocks awaiting deletion.
Module * getParent()
Get the module that this global value is contained inside of...
This instruction compares its operands according to the predicate given to the constructor.
Indirect Branch Instruction.
void removeFromParent()
This method unlinks 'this' from the containing basic block, but does not delete it.
iterator_range< simple_ilist< DbgRecord >::iterator > cloneDebugInfoFrom(const Instruction *From, std::optional< simple_ilist< DbgRecord >::iterator > FromHere=std::nullopt, bool InsertAtHead=false)
Clone any debug-info attached to From onto this instruction.
unsigned getNumSuccessors() const LLVM_READONLY
Return the number of successors that this instruction has.
void insertBefore(Instruction *InsertPos)
Insert an unlinked instruction into a basic block immediately before the specified instruction.
const DebugLoc & getDebugLoc() const
Return the debug location for this node as a DebugLoc.
void setAAMetadata(const AAMDNodes &N)
Sets the AA metadata on this instruction from the AAMDNodes structure.
bool isAtomic() const LLVM_READONLY
Return true if this instruction has an AtomicOrdering of unordered or higher.
InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
BasicBlock * getSuccessor(unsigned Idx) const LLVM_READONLY
Return the specified successor. This instruction must be a terminator.
AAMDNodes getAAMetadata() const
Returns the AA metadata for this instruction.
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
void setDebugLoc(DebugLoc Loc)
Set the debug location information for this instruction.
void setSuccessor(unsigned Idx, BasicBlock *BB)
Update the specified successor to point at the provided block.
const DataLayout & getDataLayout() const
Get the data layout of the module this instruction belongs to.
bool isSpecialTerminator() const
InstListType::iterator insertInto(BasicBlock *ParentBB, InstListType::iterator It)
Inserts an unlinked instruction into ParentBB at position It and returns the iterator of the inserted...
A wrapper class for inspecting calls to intrinsic functions.
bool simplifyPartiallyRedundantLoad(LoadInst *LI)
simplifyPartiallyRedundantLoad - If LoadI is an obviously partially redundant load instruction,...
bool processBranchOnXOR(BinaryOperator *BO)
processBranchOnXOR - We have an otherwise unthreadable conditional branch on a xor instruction in the...
bool processGuards(BasicBlock *BB)
Try to propagate a guard from the current BB into one of its predecessors in case if another branch o...
void updateSSA(BasicBlock *BB, BasicBlock *NewBB, ValueToValueMapTy &ValueMapping)
Update the SSA form.
bool computeValueKnownInPredecessors(Value *V, BasicBlock *BB, jumpthreading::PredValueInfo &Result, jumpthreading::ConstantPreference Preference, Instruction *CxtI=nullptr)
void findLoopHeaders(Function &F)
findLoopHeaders - We do not want jump threading to turn proper loop structures into irreducible loops...
bool maybeMergeBasicBlockIntoOnlyPred(BasicBlock *BB)
Merge basic block BB into its sole predecessor if possible.
JumpThreadingPass(int T=-1)
void cloneInstructions(ValueToValueMapTy &ValueMapping, BasicBlock::iterator BI, BasicBlock::iterator BE, BasicBlock *NewBB, BasicBlock *PredBB)
Clone instructions in range [BI, BE) to NewBB.
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
bool runImpl(Function &F, FunctionAnalysisManager *FAM, TargetLibraryInfo *TLI, TargetTransformInfo *TTI, LazyValueInfo *LVI, AAResults *AA, std::unique_ptr< DomTreeUpdater > DTU, std::optional< BlockFrequencyInfo * > BFI, std::optional< BranchProbabilityInfo * > BPI)
Constant * evaluateOnPredecessorEdge(BasicBlock *BB, BasicBlock *PredPredBB, Value *cond, const DataLayout &DL)
bool processBranchOnPHI(PHINode *PN)
processBranchOnPHI - We have an otherwise unthreadable conditional branch on a PHI node (or freeze PH...
bool maybethreadThroughTwoBasicBlocks(BasicBlock *BB, Value *Cond)
Attempt to thread through two successive basic blocks.
bool computeValueKnownInPredecessorsImpl(Value *V, BasicBlock *BB, jumpthreading::PredValueInfo &Result, jumpthreading::ConstantPreference Preference, SmallPtrSet< Value *, 4 > &RecursionSet, Instruction *CxtI=nullptr)
computeValueKnownInPredecessors - Given a basic block BB and a value V, see if we can infer that the ...
void unfoldSelectInstr(BasicBlock *Pred, BasicBlock *BB, SelectInst *SI, PHINode *SIUse, unsigned Idx)
DomTreeUpdater * getDomTreeUpdater() const
bool processThreadableEdges(Value *Cond, BasicBlock *BB, jumpthreading::ConstantPreference Preference, Instruction *CxtI=nullptr)
bool processBlock(BasicBlock *BB)
processBlock - If there are any predecessors whose control can be threaded through to a successor,...
bool processImpliedCondition(BasicBlock *BB)
bool duplicateCondBranchOnPHIIntoPred(BasicBlock *BB, const SmallVectorImpl< BasicBlock * > &PredBBs)
duplicateCondBranchOnPHIIntoPred - PredBB contains an unconditional branch to BB which contains an i1...
void threadThroughTwoBasicBlocks(BasicBlock *PredPredBB, BasicBlock *PredBB, BasicBlock *BB, BasicBlock *SuccBB)
bool tryThreadEdge(BasicBlock *BB, const SmallVectorImpl< BasicBlock * > &PredBBs, BasicBlock *SuccBB)
tryThreadEdge - Thread an edge if it's safe and profitable to do so.
bool tryToUnfoldSelect(CmpInst *CondCmp, BasicBlock *BB)
tryToUnfoldSelect - Look for blocks of the form bb1: a = select br bb2
bool tryToUnfoldSelectInCurrBB(BasicBlock *BB)
tryToUnfoldSelectInCurrBB - Look for PHI/Select or PHI/CMP/Select in the same BB in the form bb: p = ...
void threadEdge(BasicBlock *BB, const SmallVectorImpl< BasicBlock * > &PredBBs, BasicBlock *SuccBB)
threadEdge - We have decided that it is safe and profitable to factor the blocks in PredBBs to one pr...
bool threadGuard(BasicBlock *BB, IntrinsicInst *Guard, BranchInst *BI)
Try to propagate the guard from BB which is the lower block of a diamond to one of its branches,...
This is an important class for using LLVM in a threaded context.
Analysis to compute lazy value information.
This pass computes, caches, and vends lazy value constraint information.
void eraseBlock(BasicBlock *BB)
Inform the analysis cache that we have erased a block.
void threadEdge(BasicBlock *PredBB, BasicBlock *OldSucc, BasicBlock *NewSucc)
Inform the analysis cache that we have threaded an edge from PredBB to OldSucc to be from PredBB to N...
Constant * getPredicateOnEdge(CmpInst::Predicate Pred, Value *V, Constant *C, BasicBlock *FromBB, BasicBlock *ToBB, Instruction *CxtI=nullptr)
Determine whether the specified value comparison with a constant is known to be true or false on the ...
Constant * getConstantOnEdge(Value *V, BasicBlock *FromBB, BasicBlock *ToBB, Instruction *CxtI=nullptr)
Determine whether the specified value is known to be a constant on the specified edge.
ConstantRange getConstantRangeOnEdge(Value *V, BasicBlock *FromBB, BasicBlock *ToBB, Instruction *CxtI=nullptr)
Return the ConstantRage constraint that is known to hold for the specified value on the specified edg...
Constant * getConstant(Value *V, Instruction *CxtI)
Determine whether the specified value is known to be a constant at the specified instruction.
void forgetValue(Value *V)
Remove information related to this value from the cache.
Constant * getPredicateAt(CmpInst::Predicate Pred, Value *V, Constant *C, Instruction *CxtI, bool UseBlockValue)
Determine whether the specified value comparison with a constant is known to be true or false at the ...
An instruction for reading from memory.
AtomicOrdering getOrdering() const
Returns the ordering constraint of this load instruction.
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this load instruction.
Align getAlign() const
Return the alignment of the access that is being performed.
static LocationSize precise(uint64_t Value)
This class implements a map that also provides access to all stored values in a deterministic order.
Representation for a specific memory location.
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
void setIncomingValue(unsigned i, Value *V)
Value * getIncomingValueForBlock(const BasicBlock *BB) const
BasicBlock * getIncomingBlock(unsigned i) const
Return incoming basic block number i.
Value * getIncomingValue(unsigned i) const
Return incoming value number x.
unsigned getNumIncomingValues() const
Return the number of incoming edges.
static PHINode * Create(Type *Ty, unsigned NumReservedValues, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Constructors - NumReservedValues is a hint for the number of incoming edges that this phi node will h...
static PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
void preserve()
Mark an analysis as preserved.
Helper class for SSA formation on a set of values defined in multiple blocks.
void RewriteUse(Use &U)
Rewrite a use of the symbolic value.
void Initialize(Type *Ty, StringRef Name)
Reset this object to get ready for a new set of SSA updates with type 'Ty'.
void UpdateDebugValues(Instruction *I)
Rewrite debug value intrinsics to conform to a new SSA form.
void AddAvailableValue(BasicBlock *BB, Value *V)
Indicate that a rewritten value is available in the specified block with the specified value.
This class represents the LLVM 'select' instruction.
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
SmallSet - This maintains a set of unique values, optimizing for the case when the set is small (less...
std::pair< const_iterator, bool > insert(const T &V)
insert - Insert an element into the set if it isn't already there.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void assign(size_type NumElts, ValueParamT Elt)
reference emplace_back(ArgTypes &&... Args)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Analysis pass providing the TargetTransformInfo.
Analysis pass providing the TargetLibraryInfo.
Provides information about what library functions are available for the current target.
The instances of the Type class are immutable: once they are created, they are never changed.
bool isVectorTy() const
True if this is an instance of VectorType.
bool isIntegerTy() const
True if this is an instance of IntegerType.
'undef' values are things that do not have specified contents.
static UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
A Use represents the edge between a Value definition and its users.
void setOperand(unsigned i, Value *Val)
Value * getOperand(unsigned i) const
iterator find(const KeyT &Val)
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
const Value * DoPHITranslation(const BasicBlock *CurBB, const BasicBlock *PredBB) const
Translate PHI node to its predecessor from the given basic block.
bool hasOneUse() const
Return true if there is exactly one use of this value.
void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
StringRef getName() const
Return a constant reference to the value's name.
void takeName(Value *V)
Transfer the name from V to this value.
const ParentTy * getParent() const
self_iterator getIterator()
NodeTy * getNextNode()
Get the next node, or nullptr for the list tail.
@ C
The default llvm calling convention, compatible with C.
Function * getDeclarationIfExists(Module *M, ID id, ArrayRef< Type * > Tys, FunctionType *FT=nullptr)
This version supports overloaded intrinsics.
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
class_match< Constant > m_Constant()
Match an arbitrary Constant and ignore it.
bool match(Val *V, const Pattern &P)
class_match< ConstantInt > m_ConstantInt()
Match an arbitrary ConstantInt and ignore it.
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
class_match< CmpInst > m_Cmp()
Matches any compare instruction and ignore it.
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
bool RemoveRedundantDbgInstrs(BasicBlock *BB)
Try to remove redundant dbg.value instructions from given basic block.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
bool ConstantFoldTerminator(BasicBlock *BB, bool DeleteDeadConditions=false, const TargetLibraryInfo *TLI=nullptr, DomTreeUpdater *DTU=nullptr)
If a terminator instruction is predicated on a constant value, convert it into an unconditional branc...
auto pred_end(const MachineBasicBlock *BB)
unsigned replaceNonLocalUsesWith(Instruction *From, Value *To)
auto successors(const MachineBasicBlock *BB)
MDNode * getBranchWeightMDNode(const Instruction &I)
Get the branch weights metadata node.
Value * findAvailablePtrLoadStore(const MemoryLocation &Loc, Type *AccessTy, bool AtLeastAtomic, BasicBlock *ScanBB, BasicBlock::iterator &ScanFrom, unsigned MaxInstsToScan, BatchAAResults *AA, bool *IsLoadCSE, unsigned *NumScanedInst)
Scan backwards to see if we have the value of the given pointer available locally within a small numb...
void remapDebugVariable(ValueToValueMapTy &Mapping, Instruction *Inst)
Remap the operands of the debug records attached to Inst, and the operands of Inst itself if it's a d...
Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
auto pred_size(const MachineBasicBlock *BB)
bool SimplifyInstructionsInBlock(BasicBlock *BB, const TargetLibraryInfo *TLI=nullptr)
Scan the specified basic block and try to simplify any instructions in it and recursively delete dead...
void DeleteDeadBlock(BasicBlock *BB, DomTreeUpdater *DTU=nullptr, bool KeepOneInputPHIs=false)
Delete the specified block, which must have no predecessors.
Value * FindAvailableLoadedValue(LoadInst *Load, BasicBlock *ScanBB, BasicBlock::iterator &ScanFrom, unsigned MaxInstsToScan=DefMaxInstsToScan, BatchAAResults *AA=nullptr, bool *IsLoadCSE=nullptr, unsigned *NumScanedInst=nullptr)
Scan backwards to see if we have the value of the given load available locally within a small number ...
bool hasBranchWeightOrigin(const Instruction &I)
Check if Branch Weight Metadata has an "expected" field from an llvm.expect* intrinsic.
BasicBlock * DuplicateInstructionsInSplitBetween(BasicBlock *BB, BasicBlock *PredBB, Instruction *StopAt, ValueToValueMapTy &ValueMapping, DomTreeUpdater &DTU)
Split edge between BB and PredBB and duplicate all non-Phi instructions from BB between its beginning...
void findDbgValues(SmallVectorImpl< DbgValueInst * > &DbgValues, Value *V, SmallVectorImpl< DbgVariableRecord * > *DbgVariableRecords=nullptr)
Finds the llvm.dbg.value intrinsics describing a value.
Value * simplifyInstruction(Instruction *I, const SimplifyQuery &Q)
See if we can compute a simplified version of this instruction.
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
bool isInstructionTriviallyDead(Instruction *I, const TargetLibraryInfo *TLI=nullptr)
Return true if the result produced by the instruction is not used, and the instruction will return.
bool isGuard(const User *U)
Returns true iff U has semantics of a guard expressed in a form of call of llvm.experimental....
bool TryToSimplifyUncondBranchFromEmptyBlock(BasicBlock *BB, DomTreeUpdater *DTU=nullptr)
BB is known to contain an unconditional branch, and contains no instructions other than PHI nodes,...
auto reverse(ContainerTy &&C)
void setBranchWeights(Instruction &I, ArrayRef< uint32_t > Weights, bool IsExpected)
Create a new branch_weights metadata node and add or overwrite a prof metadata reference to instructi...
bool hasValidBranchWeightMD(const Instruction &I)
Checks if an instructions has valid Branch Weight Metadata.
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
bool isSafeToSpeculativelyExecute(const Instruction *I, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr, bool UseVariableInfo=true)
Return true if the instruction does not have any effects besides calculating the result and does not ...
Constant * ConstantFoldCastOperand(unsigned Opcode, Constant *C, Type *DestTy, const DataLayout &DL)
Attempt to constant fold a cast with the specified operand.
void cloneNoAliasScopes(ArrayRef< MDNode * > NoAliasDeclScopes, DenseMap< MDNode *, MDNode * > &ClonedScopes, StringRef Ext, LLVMContext &Context)
Duplicate the specified list of noalias decl scopes.
cl::opt< unsigned > DefMaxInstsToScan
The default number of maximum instructions to scan in the block, used by FindAvailableLoadedValue().
void SplitLandingPadPredecessors(BasicBlock *OrigBB, ArrayRef< BasicBlock * > Preds, const char *Suffix, const char *Suffix2, SmallVectorImpl< BasicBlock * > &NewBBs, DomTreeUpdater *DTU=nullptr, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, bool PreserveLCSSA=false)
This method transforms the landing pad, OrigBB, by introducing two new basic blocks into the function...
Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
void combineMetadataForCSE(Instruction *K, const Instruction *J, bool DoesKMove)
Combine the metadata of two instructions so that K can replace J.
BasicBlock * SplitBlockPredecessors(BasicBlock *BB, ArrayRef< BasicBlock * > Preds, const char *Suffix, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, bool PreserveLCSSA=false)
This method introduces at least one new basic block into the function and moves some of the predecess...
void MergeBasicBlockIntoOnlyPred(BasicBlock *BB, DomTreeUpdater *DTU=nullptr)
BB is a block with one predecessor and its predecessor is known to have one successor (BB!...
auto lower_bound(R &&Range, T &&Value)
Provide wrappers to std::lower_bound which take ranges instead of having to pass begin/end explicitly...
void adaptNoAliasScopes(llvm::Instruction *I, const DenseMap< MDNode *, MDNode * > &ClonedScopes, LLVMContext &Context)
Adapt the metadata for the specified instruction according to the provided mapping.
auto max_element(R &&Range)
Provide wrappers to std::max_element which take ranges instead of having to pass begin/end explicitly...
Constant * ConstantFoldInstruction(Instruction *I, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldInstruction - Try to constant fold the specified instruction.
bool isGuaranteedNotToBeUndefOrPoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Return true if this function can prove that V does not have undef bits and is never poison.
bool isGuaranteedToTransferExecutionToSuccessor(const Instruction *I)
Return true if this function can prove that the instruction I will always transfer execution to one o...
bool extractBranchWeights(const MDNode *ProfileData, SmallVectorImpl< uint32_t > &Weights)
Extract branch weights from MD_prof metadata.
auto pred_begin(const MachineBasicBlock *BB)
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
auto predecessors(const MachineBasicBlock *BB)
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
bool pred_empty(const BasicBlock *BB)
Instruction * SplitBlockAndInsertIfThen(Value *Cond, BasicBlock::iterator SplitBefore, bool Unreachable, MDNode *BranchWeights=nullptr, DomTreeUpdater *DTU=nullptr, LoopInfo *LI=nullptr, BasicBlock *ThenBlock=nullptr)
Split the containing block at the specified instruction - everything before SplitBefore stays in the ...
Value * simplifyCmpInst(CmpPredicate Predicate, Value *LHS, Value *RHS, const SimplifyQuery &Q)
Given operands for a CmpInst, fold the result or return null.
void array_pod_sort(IteratorTy Start, IteratorTy End)
array_pod_sort - This sorts an array with the specified start and end extent.
void identifyNoAliasScopesToClone(ArrayRef< BasicBlock * > BBs, SmallVectorImpl< MDNode * > &NoAliasDeclScopes)
Find the 'llvm.experimental.noalias.scope.decl' intrinsics in the specified basic blocks and extract ...
BasicBlock * SplitEdge(BasicBlock *From, BasicBlock *To, DominatorTree *DT=nullptr, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, const Twine &BBName="")
Split the edge connecting the specified blocks, and return the newly created basic block between From...
static auto filterDbgVars(iterator_range< simple_ilist< DbgRecord >::iterator > R)
Filter the DbgRecord range to DbgVariableRecord types only and downcast.
void FindFunctionBackedges(const Function &F, SmallVectorImpl< std::pair< const BasicBlock *, const BasicBlock * > > &Result)
Analyze the specified function to find all of the loop backedges in the function and return them.
std::optional< bool > isImpliedCondition(const Value *LHS, const Value *RHS, const DataLayout &DL, bool LHSIsTrue=true, unsigned Depth=0)
Return true if RHS is known to be implied true by LHS.
A collection of metadata nodes that might be associated with a memory access used by the alias-analys...
Function object to check whether the second component of a container supported by std::get (like std:...