LLVM 20.0.0git
|
#include "llvm/Transforms/Utils/LoopPeel.h"
#include "llvm/ADT/DenseMap.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/Statistic.h"
#include "llvm/Analysis/Loads.h"
#include "llvm/Analysis/LoopInfo.h"
#include "llvm/Analysis/LoopIterator.h"
#include "llvm/Analysis/ScalarEvolution.h"
#include "llvm/Analysis/ScalarEvolutionExpressions.h"
#include "llvm/Analysis/TargetTransformInfo.h"
#include "llvm/IR/BasicBlock.h"
#include "llvm/IR/Dominators.h"
#include "llvm/IR/Function.h"
#include "llvm/IR/InstrTypes.h"
#include "llvm/IR/Instruction.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/LLVMContext.h"
#include "llvm/IR/MDBuilder.h"
#include "llvm/IR/PatternMatch.h"
#include "llvm/IR/ProfDataUtils.h"
#include "llvm/Support/Casting.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Support/Debug.h"
#include "llvm/Support/raw_ostream.h"
#include "llvm/Transforms/Utils/BasicBlockUtils.h"
#include "llvm/Transforms/Utils/Cloning.h"
#include "llvm/Transforms/Utils/LoopSimplify.h"
#include "llvm/Transforms/Utils/LoopUtils.h"
#include "llvm/Transforms/Utils/ValueMapper.h"
#include <algorithm>
#include <cassert>
#include <cstdint>
#include <optional>
Go to the source code of this file.
Classes | |
struct | WeightInfo |
Macros | |
#define | DEBUG_TYPE "loop-peel" |
Functions | |
STATISTIC (NumPeeled, "Number of loops peeled") | |
static unsigned | peelToTurnInvariantLoadsDerefencebale (Loop &L, DominatorTree &DT, AssumptionCache *AC) |
static unsigned | countToEliminateCompares (Loop &L, unsigned MaxPeelCount, ScalarEvolution &SE) |
static bool | violatesLegacyMultiExitLoopCheck (Loop *L) |
This "heuristic" exactly matches implicit behavior which used to exist inside getLoopEstimatedTripCount. | |
static void | updateBranchWeights (Instruction *Term, WeightInfo &Info) |
Update the branch weights of an exiting block of a peeled-off loop iteration. | |
static void | initBranchWeights (DenseMap< Instruction *, WeightInfo > &WeightInfos, Loop *L) |
Initialize the weights for all exiting blocks. | |
static void | cloneLoopBlocks (Loop *L, unsigned IterNumber, BasicBlock *InsertTop, BasicBlock *InsertBot, SmallVectorImpl< std::pair< BasicBlock *, BasicBlock * > > &ExitEdges, SmallVectorImpl< BasicBlock * > &NewBlocks, LoopBlocksDFS &LoopBlocks, ValueToValueMapTy &VMap, ValueToValueMapTy &LVMap, DominatorTree *DT, LoopInfo *LI, ArrayRef< MDNode * > LoopLocalNoAliasDeclScopes, ScalarEvolution &SE) |
Clones the body of the loop L, putting it between InsertTop and InsertBot . | |
Variables | |
static cl::opt< unsigned > | UnrollPeelCount ("unroll-peel-count", cl::Hidden, cl::desc("Set the unroll peeling count, for testing purposes")) |
static cl::opt< bool > | UnrollAllowPeeling ("unroll-allow-peeling", cl::init(true), cl::Hidden, cl::desc("Allows loops to be peeled when the dynamic " "trip count is known to be low.")) |
static cl::opt< bool > | UnrollAllowLoopNestsPeeling ("unroll-allow-loop-nests-peeling", cl::init(false), cl::Hidden, cl::desc("Allows loop nests to be peeled.")) |
static cl::opt< unsigned > | UnrollPeelMaxCount ("unroll-peel-max-count", cl::init(7), cl::Hidden, cl::desc("Max average trip count which will cause loop peeling.")) |
static cl::opt< unsigned > | UnrollForcePeelCount ("unroll-force-peel-count", cl::init(0), cl::Hidden, cl::desc("Force a peel count regardless of profiling information.")) |
static cl::opt< bool > | DisableAdvancedPeeling ("disable-advanced-peeling", cl::init(false), cl::Hidden, cl::desc("Disable advance peeling. Issues for convergent targets (D134803).")) |
static const char * | PeeledCountMetaData = "llvm.loop.peeled.count" |
#define DEBUG_TYPE "loop-peel" |
Definition at line 49 of file LoopPeel.cpp.
|
static |
Clones the body of the loop L, putting it between InsertTop
and InsertBot
.
IterNumber | The serial number of the iteration currently being peeled off. | |
ExitEdges | The exit edges of the original loop. | |
[out] | NewBlocks | A list of the blocks in the newly created clone |
[out] | VMap | The value map between the loop and the new clone. |
LoopBlocks | A helper for DFS-traversal of the loop. | |
LVMap | A value-map that maps instructions from the original loop to instructions in the last peeled-off iteration. |
Definition at line 748 of file LoopPeel.cpp.
References llvm::LoopBase< BlockT, LoopT >::addBasicBlockToLoop(), llvm::DominatorTreeBase< NodeT, IsPostDom >::addNewBlock(), llvm::LoopBlocksDFS::beginRPO(), llvm::DominatorTreeBase< NodeT, IsPostDom >::changeImmediateDominator(), llvm::cloneAndAdaptNoAliasScopes(), llvm::CloneBasicBlock(), llvm::cloneLoop(), llvm::LoopBlocksDFS::endRPO(), llvm::Instruction::eraseFromParent(), F, llvm::ScalarEvolution::forgetLcssaPhiWithNewPredecessor(), llvm::DomTreeNodeBase< NodeT >::getBlock(), llvm::DomTreeNodeBase< NodeT >::getIDom(), llvm::PHINode::getIncomingValueForBlock(), llvm::LoopInfoBase< BlockT, LoopT >::getLoopFor(), llvm::DominatorTreeBase< NodeT, IsPostDom >::getNode(), llvm::BasicBlock::getTerminator(), I, PHI, llvm::SmallVectorTemplateBase< T, bool >::push_back(), and llvm::Instruction::setSuccessor().
Referenced by llvm::peelLoop().
|
static |
Definition at line 341 of file LoopPeel.cpp.
References assert(), llvm::Depth, llvm::SCEVAddRecExpr::evaluateAtIteration(), llvm::ScalarEvolution::evaluatePredicate(), llvm::ScalarEvolution::getAddExpr(), llvm::ScalarEvolution::getConstant(), llvm::ScalarEvolution::getConstantMaxBackedgeTakenCount(), llvm::SCEVAddRecExpr::getLoop(), llvm::ScalarEvolution::getMonotonicPredicateType(), llvm::ScalarEvolution::getSCEV(), llvm::SCEVAddRecExpr::getStepRecurrence(), llvm::SCEV::getType(), llvm::Value::getType(), llvm::SCEVNAryExpr::hasNoSelfWrap(), I, llvm::SCEVAddRecExpr::isAffine(), llvm::ICmpInst::isEquality(), llvm::Type::isIntegerTy(), llvm::ScalarEvolution::isKnownNegative(), llvm::ScalarEvolution::isKnownPositive(), llvm::ScalarEvolution::isKnownPredicate(), LHS, llvm::PatternMatch::m_And(), llvm::PatternMatch::m_ICmp(), llvm::PatternMatch::m_Or(), llvm::PatternMatch::m_Value(), llvm::PatternMatch::match(), MaxDepth, RHS, and std::swap().
Referenced by llvm::computePeelCount().
|
static |
Initialize the weights for all exiting blocks.
Definition at line 695 of file LoopPeel.cpp.
References llvm::extractBranchWeights(), llvm::DenseMapBase< DerivedT, KeyT, ValueT, KeyInfoT, BucketT >::insert(), llvm::SmallVectorTemplateBase< T, bool >::push_back(), llvm::successors(), and llvm::zip().
Referenced by llvm::peelLoop().
|
static |
Definition at line 274 of file LoopPeel.cpp.
References llvm::any_of(), llvm::SmallPtrSetImpl< PtrType >::contains(), DL, llvm::DominatorTree::dominates(), llvm::SmallPtrSetImpl< PtrType >::end(), llvm::SmallPtrSetImpl< PtrType >::find(), llvm::BasicBlock::getTerminator(), I, llvm::SmallPtrSetImpl< PtrType >::insert(), llvm::isDereferenceablePointer(), and Ptr.
Referenced by llvm::computePeelCount().
STATISTIC | ( | NumPeeled | , |
"Number of loops peeled" | |||
) |
|
static |
Update the branch weights of an exiting block of a peeled-off loop iteration.
Let F is a weight of the edge to continue (fallthrough) into the loop. Let E is a weight of the edge to an exit. F/(F+E) is a probability to go to loop and E/(F+E) is a probability to go to exit. Then, Estimated ExitCount = F / E. For I-th (counting from 0) peeled off iteration we set the weights for the peeled exit as (EC - I, 1). It gives us reasonable distribution, The probability to go to exit 1/(EC-I) increases. At the same time the estimated exit count in the remainder loop reduces by I. To avoid dealing with division rounding we can just multiple both part of weights to E and use weight as (F - I * E, E).
Definition at line 680 of file LoopPeel.cpp.
References llvm::enumerate(), Idx, Info, and llvm::setBranchWeights().
Referenced by llvm::peelLoop().
This "heuristic" exactly matches implicit behavior which used to exist inside getLoopEstimatedTripCount.
It was added here to keep an improvement inside that API from causing peeling to become more aggressive. This should probably be removed.
Definition at line 514 of file LoopPeel.cpp.
References llvm::any_of(), assert(), llvm::BranchInst::getNumSuccessors(), llvm::BranchInst::getSuccessor(), llvm::BasicBlock::getTerminatingDeoptimizeCall(), and llvm::BasicBlock::getTerminator().
Referenced by llvm::computePeelCount().
|
static |
Referenced by llvm::canPeel().
Definition at line 80 of file LoopPeel.cpp.
Referenced by llvm::computePeelCount(), and llvm::peelLoop().
|
static |
Referenced by llvm::gatherPeelingPreferences().
|
static |
Referenced by llvm::gatherPeelingPreferences().
|
static |
Referenced by llvm::computePeelCount().
|
static |
Referenced by llvm::gatherPeelingPreferences().
|
static |
Referenced by llvm::computePeelCount().