74#define DEBUG_TYPE "consthoist"
76STATISTIC(NumConstantsHoisted,
"Number of constants hoisted");
77STATISTIC(NumConstantsRebased,
"Number of constants rebased");
81 cl::desc(
"Enable the use of the block frequency analysis to reduce the "
82 "chance to execute const materialization more frequently than "
83 "without hoisting."));
87 cl::desc(
"Try hoisting constant gep expressions"));
91 cl::desc(
"Do not rebase if number of dependent constants of a Base is less "
125char ConstantHoistingLegacyPass::ID = 0;
128 "Constant Hoisting",
false,
false)
137 return new ConstantHoistingLegacyPass();
141bool ConstantHoistingLegacyPass::runOnFunction(
Function &Fn) {
142 if (skipFunction(Fn))
145 LLVM_DEBUG(
dbgs() <<
"********** Begin Constant Hoisting **********\n");
149 Impl.runImpl(Fn, getAnalysis<TargetTransformInfoWrapperPass>().getTTI(Fn),
150 getAnalysis<DominatorTreeWrapperPass>().getDomTree(),
152 ? &getAnalysis<BlockFrequencyInfoWrapperPass>().getBFI()
155 &getAnalysis<ProfileSummaryInfoWrapperPass>().getPSI());
157 LLVM_DEBUG(
dbgs() <<
"********** End Constant Hoisting **********\n");
162void ConstantHoistingPass::collectMatInsertPts(
172 unsigned Idx)
const {
177 if (
auto CastInst = dyn_cast<Instruction>(Opnd))
183 if (!isa<PHINode>(Inst) && !Inst->
isEHPad())
188 assert(Entry != Inst->
getParent() &&
"PHI or landing pad in entry block!");
190 if (
Idx != ~0U && isa<PHINode>(Inst)) {
191 InsertionBlock = cast<PHINode>(Inst)->getIncomingBlock(
Idx);
192 if (!InsertionBlock->
isEHPad()) {
203 while (IDom->getBlock()->isEHPad()) {
204 assert(Entry != IDom->getBlock() &&
"eh pad in entry block");
205 IDom = IDom->getIDom();
208 return IDom->getBlock()->getTerminator()->getIterator();
217 assert(!BBs.
count(Entry) &&
"Assume Entry is not in BBs");
224 for (
auto *BB : BBs) {
241 "Entry doens't dominate current Node");
251 Candidates.
insert(Path.begin(), Path.end());
262 if (Candidates.
count(ChildDomNode->getBlock()))
263 Orders.
push_back(ChildDomNode->getBlock());
268 using InsertPtsCostPair =
277 auto &InsertPts = InsertPtsMap[
Node].first;
283 if (InsertPtsFreq > BFI.getBlockFreq(
Node) ||
284 (InsertPtsFreq == BFI.getBlockFreq(
Node) && InsertPts.size() > 1))
287 BBs.
insert(InsertPts.begin(), InsertPts.end());
294 auto &ParentInsertPts = InsertPtsMap[Parent].first;
304 (InsertPtsFreq > BFI.getBlockFreq(
Node) ||
305 (InsertPtsFreq == BFI.getBlockFreq(
Node) && InsertPts.size() > 1)))) {
307 ParentPtsFreq += BFI.getBlockFreq(
Node);
309 ParentInsertPts.insert(InsertPts.begin(), InsertPts.end());
310 ParentPtsFreq += InsertPtsFreq;
317ConstantHoistingPass::findConstantInsertionPoint(
326 BBs.
insert(MatInsertPt->getParent());
328 if (BBs.
count(Entry)) {
336 InsertPts.
insert(BB->getFirstInsertionPt());
340 while (BBs.size() >= 2) {
342 BB1 = BBs.pop_back_val();
343 BB2 = BBs.pop_back_val();
351 assert((BBs.size() == 1) &&
"Expected only one element.");
353 InsertPts.
insert(findMatInsertPt(&FirstInst));
363void ConstantHoistingPass::collectConstantCandidates(
372 if (
auto IntrInst = dyn_cast<IntrinsicInst>(Inst))
385 ConstPtrUnionType Cand = ConstInt;
386 std::tie(Itr, Inserted) = ConstCandMap.insert(std::make_pair(Cand, 0));
389 Itr->second = ConstIntCandVec.size() - 1;
393 <<
"Collect constant " << *ConstInt <<
" from " << *Inst
394 <<
" with cost " <<
Cost <<
'\n';
395 else dbgs() <<
"Collect constant " << *ConstInt
396 <<
" indirectly from " << *Inst <<
" via "
403void ConstantHoistingPass::collectConstantCandidates(
418 auto *GEPO = cast<GEPOperator>(ConstExpr);
424 if (!GEPO->isInBounds())
427 if (!GEPO->accumulateConstantOffset(*DL,
Offset))
440 ConstCandVecType &ExprCandVec = ConstGEPCandMap[BaseGV];
443 ConstPtrUnionType Cand = ConstExpr;
444 std::tie(Itr, Inserted) = ConstCandMap.insert(std::make_pair(Cand, 0));
449 Itr->second = ExprCandVec.size() - 1;
455void ConstantHoistingPass::collectConstantCandidates(
456 ConstCandMapType &ConstCandMap,
Instruction *Inst,
unsigned Idx) {
460 if (
auto ConstInt = dyn_cast<ConstantInt>(Opnd)) {
461 collectConstantCandidates(ConstCandMap, Inst,
Idx, ConstInt);
466 if (
auto CastInst = dyn_cast<Instruction>(Opnd)) {
475 collectConstantCandidates(ConstCandMap, Inst,
Idx, ConstInt);
481 if (
auto ConstExpr = dyn_cast<ConstantExpr>(Opnd)) {
484 collectConstantCandidates(ConstCandMap, Inst,
Idx, ConstExpr);
490 if (
auto ConstInt = dyn_cast<ConstantInt>(ConstExpr->
getOperand(0))) {
493 collectConstantCandidates(ConstCandMap, Inst,
Idx, ConstInt);
501void ConstantHoistingPass::collectConstantCandidates(
502 ConstCandMapType &ConstCandMap,
Instruction *Inst) {
515 collectConstantCandidates(ConstCandMap, Inst,
Idx);
522void ConstantHoistingPass::collectConstantCandidates(
Function &Fn) {
523 ConstCandMapType ConstCandMap;
530 collectConstantCandidates(ConstCandMap, &Inst);
558ConstantHoistingPass::maximizeConstantsInRange(ConstCandVecType::iterator S,
559 ConstCandVecType::iterator E,
560 ConstCandVecType::iterator &MaxCostItr) {
561 unsigned NumUses = 0;
563 if (!OptForSize || std::distance(S,E) > 100) {
564 for (
auto ConstCand = S; ConstCand != E; ++ConstCand) {
565 NumUses += ConstCand->Uses.size();
566 if (ConstCand->CumulativeCost > MaxCostItr->CumulativeCost)
567 MaxCostItr = ConstCand;
574 for (
auto ConstCand = S; ConstCand != E; ++ConstCand) {
575 auto Value = ConstCand->ConstInt->getValue();
576 Type *Ty = ConstCand->ConstInt->getType();
578 NumUses += ConstCand->Uses.size();
579 LLVM_DEBUG(
dbgs() <<
"= Constant: " << ConstCand->ConstInt->getValue()
582 for (
auto User : ConstCand->Uses) {
583 unsigned Opcode =
User.Inst->getOpcode();
584 unsigned OpndIdx =
User.OpndIdx;
589 for (
auto C2 = S; C2 != E; ++C2) {
590 APInt Diff = C2->ConstInt->getValue() - ConstCand->ConstInt->getValue();
595 <<
"has penalty: " << ImmCosts <<
"\n"
596 <<
"Adjusted cost: " <<
Cost <<
"\n");
600 if (
Cost > MaxCost) {
602 MaxCostItr = ConstCand;
603 LLVM_DEBUG(
dbgs() <<
"New candidate: " << MaxCostItr->ConstInt->getValue()
612void ConstantHoistingPass::findAndMakeBaseConstant(
613 ConstCandVecType::iterator S, ConstCandVecType::iterator E,
616 unsigned NumUses = maximizeConstantsInRange(S, E, MaxCostItr);
630 for (
auto ConstCand = S; ConstCand != E; ++ConstCand) {
631 APInt Diff = ConstCand->ConstInt->getValue() - ConstInt->
getValue();
632 Constant *
Offset = Diff == 0 ? nullptr : ConstantInt::get(Ty, Diff);
634 ConstCand->ConstExpr ? ConstCand->ConstExpr->getType() :
nullptr;
638 ConstInfoVec.
push_back(std::move(ConstInfo));
643void ConstantHoistingPass::findBaseConstants(
GlobalVariable *BaseGV) {
646 ConstCandVecType &ConstCandVec = BaseGV ?
647 ConstGEPCandMap[BaseGV] : ConstIntCandVec;
648 ConstInfoVecType &ConstInfoVec = BaseGV ?
649 ConstGEPInfoMap[BaseGV] : ConstIntInfoVec;
655 return LHS.ConstInt->getBitWidth() <
RHS.ConstInt->getBitWidth();
656 return LHS.ConstInt->getValue().ult(
RHS.ConstInt->getValue());
661 auto MinValItr = ConstCandVec.begin();
662 for (
auto CC = std::next(ConstCandVec.begin()), E = ConstCandVec.end();
664 if (MinValItr->ConstInt->getType() ==
CC->ConstInt->getType()) {
665 Type *MemUseValTy =
nullptr;
666 for (
auto &U :
CC->Uses) {
668 if (
LoadInst *LI = dyn_cast<LoadInst>(UI)) {
669 MemUseValTy = LI->getType();
671 }
else if (
StoreInst *SI = dyn_cast<StoreInst>(UI)) {
673 if (
SI->getPointerOperand() ==
SI->getOperand(
U.OpndIdx)) {
674 MemUseValTy =
SI->getValueOperand()->getType();
681 APInt Diff =
CC->ConstInt->getValue() - MinValItr->ConstInt->getValue();
693 findAndMakeBaseConstant(MinValItr,
CC, ConstInfoVec);
698 findAndMakeBaseConstant(MinValItr, ConstCandVec.end(), ConstInfoVec);
708 if (
auto PHI = dyn_cast<PHINode>(Inst)) {
716 for (
unsigned i = 0; i <
Idx; ++i) {
717 if (
PHI->getIncomingBlock(i) == IncomingBB) {
718 Value *IncomingVal =
PHI->getIncomingValue(i);
732 UserAdjustment *Adj) {
736 if (!Adj->Offset && Adj->Ty && Adj->Ty !=
Base->getType())
743 "mat_gep", Adj->MatInsertPt);
746 Adj->MatInsertPt->getIterator());
751 "const_mat", Adj->MatInsertPt->getIterator());
754 <<
" + " << *Adj->Offset <<
") in BB "
759 Value *Opnd = Adj->User.Inst->getOperand(Adj->User.OpndIdx);
762 if (isa<ConstantInt>(Opnd)) {
764 if (!
updateOperand(Adj->User.Inst, Adj->User.OpndIdx, Mat) && Adj->Offset)
771 if (
auto CastInst = dyn_cast<Instruction>(Opnd)) {
776 if (!ClonedCastInst) {
783 <<
"To : " << *ClonedCastInst <<
'\n');
787 updateOperand(Adj->User.Inst, Adj->User.OpndIdx, ClonedCastInst);
793 if (
auto ConstExpr = dyn_cast<ConstantExpr>(Opnd)) {
794 if (isa<GEPOperator>(ConstExpr)) {
801 assert(ConstExpr->
isCast() &&
"ConstExpr should be a cast");
807 ConstExprInst->
setDebugLoc(Adj->User.Inst->getDebugLoc());
809 LLVM_DEBUG(
dbgs() <<
"Create instruction: " << *ConstExprInst <<
'\n'
810 <<
"From : " << *ConstExpr <<
'\n');
812 if (!
updateOperand(Adj->User.Inst, Adj->User.OpndIdx, ConstExprInst)) {
824bool ConstantHoistingPass::emitBaseConstants(
GlobalVariable *BaseGV) {
825 bool MadeChange =
false;
827 BaseGV ? ConstGEPInfoMap[BaseGV] : ConstIntInfoVec;
832 findConstantInsertionPoint(ConstInfo, MatInsertPts);
837 unsigned UsesNum = 0;
838 unsigned ReBasesNum = 0;
839 unsigned NotRebasedNum = 0;
846 UsesNum += RCI.Uses.size();
847 for (
auto const &U : RCI.Uses) {
852 if (IPSet.size() == 1 ||
853 DT->
dominates(IP->getParent(), OrigMatInsertBB))
854 ToBeRebased.
emplace_back(RCI.Offset, RCI.Ty, MatInsertPt, U);
861 NotRebasedNum += ToBeRebased.
size();
869 assert(BaseGV &&
"A base constant expression must have an base GV");
877 Base->setDebugLoc(IP->getDebugLoc());
880 <<
") to BB " << IP->getParent()->
getName() <<
'\n'
884 for (UserAdjustment &R : ToBeRebased) {
885 emitBaseConstants(
Base, &R);
889 Base->getDebugLoc(),
R.User.Inst->getDebugLoc()));
891 assert(!
Base->use_empty() &&
"The use list is empty!?");
893 "All uses should be instructions.");
899 assert(UsesNum == (ReBasesNum + NotRebasedNum) &&
900 "Not all uses are rebased");
902 NumConstantsHoisted++;
915void ConstantHoistingPass::deleteDeadCastInst()
const {
916 for (
auto const &
I : ClonedCastMap)
917 if (
I.first->use_empty())
918 I.first->eraseFromParent();
930 this->Entry = &Entry;
936 collectConstantCandidates(Fn);
940 if (!ConstIntCandVec.empty())
941 findBaseConstants(
nullptr);
942 for (
const auto &MapEntry : ConstGEPCandMap)
943 if (!MapEntry.second.empty())
944 findBaseConstants(MapEntry.first);
948 bool MadeChange =
false;
949 if (!ConstIntInfoVec.
empty())
950 MadeChange = emitBaseConstants(
nullptr);
951 for (
const auto &MapEntry : ConstGEPInfoMap)
952 if (!MapEntry.second.empty())
953 MadeChange |= emitBaseConstants(MapEntry.first);
957 deleteDeadCastInst();
This file implements a class to represent arbitrary precision integral constant values and operations...
static bool updateOperand(Instruction *Inst, unsigned Idx, Instruction *Mat)
Updates the operand at Idx in instruction Inst with the result of instruction Mat.
static void findBestInsertionSet(DominatorTree &DT, BlockFrequencyInfo &BFI, BasicBlock *Entry, SetVector< BasicBlock * > &BBs)
Given BBs as input, find another set of BBs which collectively dominates BBs and have the minimal sum...
static cl::opt< unsigned > MinNumOfDependentToRebase("consthoist-min-num-to-rebase", cl::desc("Do not rebase if number of dependent constants of a Base is less " "than this number."), cl::init(0), cl::Hidden)
static cl::opt< bool > ConstHoistWithBlockFrequency("consthoist-with-block-frequency", cl::init(true), cl::Hidden, cl::desc("Enable the use of the block frequency analysis to reduce the " "chance to execute const materialization more frequently than " "without hoisting."))
static cl::opt< bool > ConstHoistGEP("consthoist-gep", cl::init(false), cl::Hidden, cl::desc("Try hoisting constant gep expressions"))
This file contains the declarations for the subclasses of Constant, which represent the different fla...
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
This file defines the DenseMap class.
static bool isCandidate(const MachineInstr *MI, Register &DefedReg, Register FrameReg)
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file defines the SmallPtrSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
Class for arbitrary precision integers.
unsigned getBitWidth() const
Return the number of bits in the APInt.
int64_t getSExtValue() const
Get sign extended value.
A container for analyses that lazily runs them and caches their results.
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Represent the analysis usage information of a pass.
AnalysisUsage & addRequired()
void setPreservesCFG()
This function should be called by the pass, iff they do not:
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
LLVM Basic Block Representation.
iterator begin()
Instruction iterator methods.
const Function * getParent() const
Return the enclosing method, or null if none.
InstListType::iterator iterator
Instruction iterators...
bool isEHPad() const
Return true if this basic block is an exception handling block.
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
static BinaryOperator * Create(BinaryOps Op, Value *S1, Value *S2, const Twine &Name=Twine(), InsertPosition InsertBefore=nullptr)
Construct a binary instruction, given the opcode and the two operands.
This class represents a no-op cast from one type to another.
Analysis pass which computes BlockFrequencyInfo.
Legacy analysis pass which computes BlockFrequencyInfo.
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Represents analyses that only rely on functions' control flow.
This is the base class for all instructions that perform data casts.
A constant value that is initialized with an expression using other constant values.
bool isCast() const
Return true if this is a convert constant expression.
Instruction * getAsInstruction() const
Returns an Instruction which implements the same operation as this ConstantExpr.
bool runImpl(Function &F, TargetTransformInfo &TTI, DominatorTree &DT, BlockFrequencyInfo *BFI, BasicBlock &Entry, ProfileSummaryInfo *PSI)
Optimize expensive integer constants in the given function.
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
This is the shared class of boolean and integer constants.
IntegerType * getIntegerType() const
Variant of the getType() method to always return an IntegerType, which reduces the amount of casting ...
const APInt & getValue() const
Return the constant as an APInt value reference.
This is an important base class in LLVM.
static DILocation * getMergedLocation(DILocation *LocA, DILocation *LocB)
When two instructions are combined into a single instruction we also need to combine the original loc...
IntegerType * getIndexType(LLVMContext &C, unsigned AddressSpace) const
Returns the type of a GEP index in AddressSpace.
TypeSize getTypeSizeInBits(Type *Ty) const
Size examples:
DenseMapIterator< KeyT, ValueT, KeyInfoT, BucketT > iterator
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
void reserve(size_type NumEntries)
Grow the densemap so that it can contain at least NumEntries items before resizing again.
iterator_range< iterator > children()
DomTreeNodeBase * getIDom() const
Analysis pass which computes a DominatorTree.
DomTreeNodeBase< NodeT > * getNode(const NodeT *BB) const
getNode - return the (Post)DominatorTree node for the specified basic block.
Legacy analysis pass which computes a DominatorTree.
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
bool isReachableFromEntry(const Use &U) const
Provide an overload for a Use.
Instruction * findNearestCommonDominator(Instruction *I1, Instruction *I2) const
Find the nearest instruction I that dominates both I1 and I2, in the sense that a result produced bef...
bool dominates(const BasicBlock *BB, const Use &U) const
Return true if the (end of the) basic block BB dominates the use U.
FunctionPass class - This class is used to implement most global optimizations.
virtual bool runOnFunction(Function &F)=0
runOnFunction - Virtual method overriden by subclasses to do the per-function processing of the pass.
const BasicBlock & getEntryBlock() const
const DataLayout & getDataLayout() const
Get the data layout of the module this function belongs to.
LLVMContext & getContext() const
getContext - Return a reference to the LLVMContext associated with this function.
static GetElementPtrInst * Create(Type *PointeeType, Value *Ptr, ArrayRef< Value * > IdxList, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
PointerType * getType() const
Global values are always pointers.
std::optional< CostType > getValue() const
This function is intended to be used as sparingly as possible, since the class provides the full rang...
Instruction * clone() const
Create a copy of 'this' instruction that is identical in all ways except the following:
void insertBefore(Instruction *InsertPos)
Insert an unlinked instruction into a basic block immediately before the specified instruction.
const DebugLoc & getDebugLoc() const
Return the debug location for this node as a DebugLoc.
bool isEHPad() const
Return true if the instruction is a variety of EH-block.
InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
void setDebugLoc(DebugLoc Loc)
Set the debug location information for this instruction.
void insertAfter(Instruction *InsertPos)
Insert an unlinked instruction into a basic block immediately after the specified instruction.
Class to represent integer types.
An instruction for reading from memory.
An analysis over an "inner" IR unit that provides access to an analysis manager over a "outer" IR uni...
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
virtual void getAnalysisUsage(AnalysisUsage &) const
getAnalysisUsage - This function should be overriden by passes that need analysis information to do t...
virtual StringRef getPassName() const
getPassName - Return a nice clean name for a pass.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
void preserveSet()
Mark an analysis set as preserved.
An analysis pass based on the new PM to deliver ProfileSummaryInfo.
An analysis pass based on legacy pass manager to deliver ProfileSummaryInfo.
Analysis providing profile information.
A vector that has set insertion semantics.
void clear()
Completely clear the SetVector.
size_type count(const key_type &key) const
Count the number of elements of a given key in the SetVector.
bool empty() const
Determine if the SetVector is empty or not.
bool insert(const value_type &X)
Insert a new element into the SetVector.
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
reference emplace_back(ArgTypes &&... Args)
void push_back(const T &Elt)
An instruction for storing to memory.
StringRef - Represent a constant reference to a string, i.e.
Analysis pass providing the TargetTransformInfo.
The instances of the Type class are immutable: once they are created, they are never changed.
bool isVectorTy() const
True if this is an instance of VectorType.
static IntegerType * getInt8Ty(LLVMContext &C)
static IntegerType * getInt32Ty(LLVMContext &C)
void setOperand(unsigned i, Value *Val)
Value * getOperand(unsigned i) const
unsigned getNumOperands() const
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
StringRef getName() const
Return a constant reference to the value's name.
const ParentTy * getParent() const
self_iterator getIterator()
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
void stable_sort(R &&Range)
FunctionPass * createConstantHoistingPass()
bool shouldOptimizeForSize(const MachineFunction *MF, ProfileSummaryInfo *PSI, const MachineBlockFrequencyInfo *BFI, PGSOQueryType QueryType=PGSOQueryType::Other)
Returns true if machine function MF is suggested to be size-optimized based on the profile.
auto reverse(ContainerTy &&C)
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
bool canReplaceOperandWithVariable(const Instruction *I, unsigned OpIdx)
Given an instruction, is it legal to set operand OpIdx to a non-constant value?
void initializeConstantHoistingLegacyPassPass(PassRegistry &)
Keeps track of a constant candidate and its uses.
A base constant and all its rebased constants.
RebasedConstantListType RebasedConstants
Keeps track of the user of a constant and the operand index where the constant is used.
This represents a constant that has been rebased with respect to a base constant.