52#define DEBUG_TYPE "pgo-icall-prom"
54STATISTIC(NumOfPGOICallPromotion,
"Number of indirect call promotions.");
55STATISTIC(NumOfPGOICallsites,
"Number of indirect call candidate sites.");
66 cl::desc(
"Disable indirect call promotion"));
74 cl::desc(
"Max number of promotions for this compilation"));
80 cl::desc(
"Skip Callsite up to this number for this compilation"));
85 cl::desc(
"Promote the target candidate even when the definition "
86 " is not available"));
92 cl::desc(
"Promote the target candidate only if it is a "
93 "hot function. Otherwise, warm functions can "
100 cl::desc(
"Continue with the remaining targets instead of exiting "
101 "when failing in a candidate"));
107 cl::desc(
"Run indirect-call promotion in LTO "
114 cl::desc(
"Run indirect-call promotion in SamplePGO mode"));
120 cl::desc(
"Run indirect-call promotion for call instructions "
127 cl::desc(
"Run indirect-call promotion for "
128 "invoke instruction only"));
134 cl::desc(
"Dump IR after transformation happens"));
140 cl::desc(
"The percentage threshold of vtable-count / function-count for "
141 "cost-benefit analysis."));
152 cl::desc(
"The maximum number of vtable for the last candidate."));
157 "A list of mangled vtable type info names. Classes specified by the "
158 "type info names and their derived ones will not be vtable-ICP'ed. "
159 "Useful when the profiled types and actual types in the optimized "
160 "binary could be different due to profiling limitations. Type info "
161 "names are those string literals used in LLVM type metadata"));
168using VTableAddressPointOffsetValMap =
172struct VirtualCallSiteInfo {
182using VirtualCallSiteTypeInfoMap =
193static std::optional<uint64_t>
197 VTableVar.
getMetadata(LLVMContext::MD_type, Types);
201 TypeId && TypeId->getString() == CompatibleType)
215 assert(AddressPointOffset < VTable->getGlobalSize(M.getDataLayout()) &&
216 "Out-of-bound access");
226 return PN->getIncomingBlock(U);
241 "Guaranteed by ICP transformation");
252 UserBB = getUserBasicBlock(
Use, UserInst);
255 if (UserBB != DestBB)
258 return UserBB !=
nullptr;
266 if (!isDestBBSuitableForSink(
I, DestBlock))
277 if (
C->isInlineAsm() ||
C->cannotMerge() ||
C->isConvergent())
281 if (
I->mayWriteToMemory())
286 if (
I->mayReadFromMemory()) {
289 E =
I->getParent()->end();
294 if (Scan->mayWriteToMemory())
300 I->moveBefore(*DestBlock, InsertPos);
311static int tryToSinkInstructions(
BasicBlock *OriginalBB,
320 if (tryToSinkInstruction(&
I, IndirectCallBB))
328class IndirectCallPromoter {
335 InstrProfSymtab *
const Symtab;
337 const bool SamplePGO;
340 const VirtualCallSiteTypeInfoMap &VirtualCSInfo;
342 VTableAddressPointOffsetValMap &VTableAddressPointOffsetVal;
344 OptimizationRemarkEmitter &ORE;
346 const DenseSet<StringRef> &IgnoredBaseTypes;
349 struct PromotionCandidate {
351 const uint64_t Count;
352 const uint32_t Index;
361 VTableGUIDCountsMap VTableGUIDAndCounts;
364 PromotionCandidate(Function *
F, uint64_t
C, uint32_t
I)
365 : TargetFunction(
F), Count(
C), Index(
I) {}
373 std::vector<PromotionCandidate> getPromotionCandidatesForCallSite(
375 uint64_t TotalCount, uint32_t NumCandidates);
380 bool tryToPromoteWithFuncCmp(
383 uint32_t NumCandidates, VTableGUIDCountsMap &VTableGUIDCounts);
388 bool tryToPromoteWithVTableCmp(
390 uint64_t TotalFuncCount, uint32_t NumCandidates,
392 VTableGUIDCountsMap &VTableGUIDCounts);
395 bool isProfitableToCompareVTables(
const CallBase &CB,
400 bool shouldSkipVTable(uint64_t VTableGUID);
409 Instruction *computeVTableInfos(
const CallBase *CB,
410 VTableGUIDCountsMap &VTableGUIDCounts,
411 std::vector<PromotionCandidate> &Candidates);
413 Constant *getOrCreateVTableAddressPointVar(GlobalVariable *GV,
414 uint64_t AddressPointOffset);
416 void updateFuncValueProfiles(CallBase &CB,
418 uint64_t Sum, uint32_t MaxMDCount);
420 void updateVPtrValueProfiles(Instruction *VPtr,
421 VTableGUIDCountsMap &VTableGUIDCounts);
423 bool isValidTarget(uint64_t, Function *,
const CallBase &, uint64_t);
426 IndirectCallPromoter(
427 Function &Func,
Module &M, InstrProfSymtab *Symtab,
bool SamplePGO,
428 const VirtualCallSiteTypeInfoMap &VirtualCSInfo,
429 VTableAddressPointOffsetValMap &VTableAddressPointOffsetVal,
430 const DenseSet<StringRef> &IgnoredBaseTypes,
431 OptimizationRemarkEmitter &ORE)
432 : F(
Func), M(M), Symtab(Symtab), SamplePGO(SamplePGO),
433 VirtualCSInfo(VirtualCSInfo),
434 VTableAddressPointOffsetVal(VTableAddressPointOffsetVal), ORE(ORE),
435 IgnoredBaseTypes(IgnoredBaseTypes) {}
436 IndirectCallPromoter(
const IndirectCallPromoter &) =
delete;
437 IndirectCallPromoter &operator=(
const IndirectCallPromoter &) =
delete;
455 if (TargetFunction ==
nullptr) {
458 return OptimizationRemarkMissed(
DEBUG_TYPE,
"UnableToFindTarget", &CB)
459 <<
"Cannot promote indirect call: target with md5sum "
460 <<
NV(
"target md5sum", Target)
461 <<
" not found (count=" <<
NV(
"Count",
Count) <<
")";
466 LLVM_DEBUG(
dbgs() <<
" Not promote: target definition is not available\n");
468 return OptimizationRemarkMissed(
DEBUG_TYPE,
"NoTargetDef", &CB)
469 <<
"Do not promote indirect call: target with md5sum "
470 <<
NV(
"target md5sum", Target)
471 <<
" definition not available (count=" <<
ore::NV(
"Count",
Count)
477 const char *Reason =
nullptr;
481 return OptimizationRemarkMissed(
DEBUG_TYPE,
"UnableToPromote", &CB)
482 <<
"Cannot promote indirect call to "
483 <<
NV(
"TargetFunction", TargetFunction)
484 <<
" (count=" <<
NV(
"Count",
Count) <<
"): " << Reason;
493std::vector<IndirectCallPromoter::PromotionCandidate>
494IndirectCallPromoter::getPromotionCandidatesForCallSite(
496 uint64_t TotalCount, uint32_t NumCandidates) {
497 std::vector<PromotionCandidate> Ret;
499 LLVM_DEBUG(
dbgs() <<
" \nWork on callsite #" << NumOfPGOICallsites << CB
500 <<
" Num_targets: " << ValueDataRef.
size()
501 <<
" Num_candidates: " << NumCandidates <<
"\n");
502 NumOfPGOICallsites++;
508 for (uint32_t
I = 0;
I < NumCandidates;
I++) {
509 uint64_t
Count = ValueDataRef[
I].Count;
512 uint64_t
Target = ValueDataRef[
I].Value;
514 <<
" Target_func: " << Target <<
"\n");
519 return OptimizationRemarkMissed(
DEBUG_TYPE,
"UserOptions", &CB)
520 <<
" Not promote: User options";
527 return OptimizationRemarkMissed(
DEBUG_TYPE,
"UserOptions", &CB)
528 <<
" Not promote: User options";
535 return OptimizationRemarkMissed(
DEBUG_TYPE,
"CutOffReached", &CB)
536 <<
" Not promote: Cutoff reached";
542 if (!isValidTarget(Target, TargetFunction, CB,
Count)) {
549 Ret.push_back(PromotionCandidate(TargetFunction,
Count,
I));
555Constant *IndirectCallPromoter::getOrCreateVTableAddressPointVar(
556 GlobalVariable *GV, uint64_t AddressPointOffset) {
558 VTableAddressPointOffsetVal[GV].try_emplace(AddressPointOffset,
nullptr);
560 Iter->second = getVTableAddressPointOffset(GV, AddressPointOffset);
564Instruction *IndirectCallPromoter::computeVTableInfos(
565 const CallBase *CB, VTableGUIDCountsMap &GUIDCountsMap,
566 std::vector<PromotionCandidate> &Candidates) {
594 auto Iter = VirtualCSInfo.find(CB);
595 if (Iter == VirtualCSInfo.end())
599 << NumOfPGOICallsites <<
"\n");
601 const auto &VirtualCallInfo = Iter->second;
604 SmallDenseMap<Function *, int, 4> CalleeIndexMap;
605 for (
size_t I = 0;
I < Candidates.size();
I++)
606 CalleeIndexMap[Candidates[
I].TargetFunction] =
I;
608 uint64_t TotalVTableCount = 0;
609 auto VTableValueDataArray =
612 if (VTableValueDataArray.empty())
616 for (
const auto &V : VTableValueDataArray) {
617 uint64_t VTableVal =
V.Value;
618 GUIDCountsMap[VTableVal] =
V.Count;
621 LLVM_DEBUG(
dbgs() <<
" Cannot find vtable definition for " << VTableVal
622 <<
"; maybe the vtable isn't imported\n");
626 std::optional<uint64_t> MaybeAddressPointOffset =
627 getAddressPointOffset(*VTableVar, VirtualCallInfo.CompatibleTypeStr);
628 if (!MaybeAddressPointOffset)
631 const uint64_t AddressPointOffset = *MaybeAddressPointOffset;
635 VTableVar, AddressPointOffset + VirtualCallInfo.FunctionOffset, M);
638 auto CalleeIndexIter = CalleeIndexMap.
find(Callee);
639 if (CalleeIndexIter == CalleeIndexMap.
end())
642 auto &Candidate = Candidates[CalleeIndexIter->second];
646 Candidate.VTableGUIDAndCounts[VTableVal] =
V.Count;
647 Candidate.AddressPoints.push_back(
648 getOrCreateVTableAddressPointVar(VTableVar, AddressPointOffset));
666 bool AttachProfToDirectCall,
672 if (AttachProfToDirectCall)
681 <<
"Promote indirect call to " << NV(
"DirectCallee", DirectCallee)
682 <<
" with count " << NV(
"Count",
Count) <<
" out of "
683 << NV(
"TotalCount", TotalCount);
689bool IndirectCallPromoter::tryToPromoteWithFuncCmp(
692 uint32_t NumCandidates, VTableGUIDCountsMap &VTableGUIDCounts) {
695 for (
const auto &
C : Candidates) {
699 assert(TotalCount >= FuncCount);
700 TotalCount -= FuncCount;
701 NumOfPGOICallPromotion++;
705 ICallProfDataRef[
C.Index].Count = 0;
714 for (
const auto &[GUID, VTableCount] :
C.VTableGUIDAndCounts)
715 SumVTableCount += VTableCount;
717 for (
const auto &[GUID, VTableCount] :
C.VTableGUIDAndCounts) {
718 APInt APFuncCount((
unsigned)128, FuncCount,
false );
719 APFuncCount *= VTableCount;
720 VTableGUIDCounts[GUID] -= APFuncCount.udiv(SumVTableCount).getZExtValue();
723 if (NumPromoted == 0)
726 assert(NumPromoted <= ICallProfDataRef.
size() &&
727 "Number of promoted functions should not be greater than the number "
728 "of values in profile metadata");
730 updateFuncValueProfiles(CB, ICallProfDataRef, TotalCount, NumCandidates);
731 updateVPtrValueProfiles(VPtr, VTableGUIDCounts);
735void IndirectCallPromoter::updateFuncValueProfiles(
737 uint64_t TotalCount, uint32_t MaxMDCount) {
743 const InstrProfValueData &
RHS) {
744 return LHS.Count >
RHS.Count;
750 [](uint64_t
Count,
const InstrProfValueData &ProfData) {
751 return ProfData.Count <= Count;
760void IndirectCallPromoter::updateVPtrValueProfiles(
761 Instruction *VPtr, VTableGUIDCountsMap &VTableGUIDCounts) {
766 std::vector<InstrProfValueData> VTableValueProfiles;
767 uint64_t TotalVTableCount = 0;
768 for (
auto [GUID,
Count] : VTableGUIDCounts) {
772 VTableValueProfiles.push_back({
GUID,
Count});
773 TotalVTableCount +=
Count;
776 [](
const InstrProfValueData &
LHS,
const InstrProfValueData &
RHS) {
777 return LHS.Count >
RHS.Count;
781 IPVK_VTableTarget, VTableValueProfiles.size());
784bool IndirectCallPromoter::tryToPromoteWithVTableCmp(
786 uint64_t TotalFuncCount, uint32_t NumCandidates,
788 VTableGUIDCountsMap &VTableGUIDCounts) {
791 for (
const auto &Candidate : Candidates) {
792 for (
auto &[GUID,
Count] : Candidate.VTableGUIDAndCounts)
800 CB, VPtr, Candidate.TargetFunction, Candidate.AddressPoints,
802 TotalFuncCount - Candidate.Count));
804 int SinkCount = tryToSinkInstructions(OriginalBB, CB.
getParent());
809 const auto &VTableGUIDAndCounts = Candidate.VTableGUIDAndCounts;
810 Remark <<
"Promote indirect call to "
811 <<
ore::NV(
"DirectCallee", Candidate.TargetFunction)
812 <<
" with count " <<
ore::NV(
"Count", Candidate.Count)
813 <<
" out of " <<
ore::NV(
"TotalCount", TotalFuncCount) <<
", sink "
814 <<
ore::NV(
"SinkCount", SinkCount)
815 <<
" instruction(s) and compare "
816 <<
ore::NV(
"VTable", VTableGUIDAndCounts.size())
820 std::set<uint64_t> GUIDSet;
821 for (
auto [GUID,
Count] : VTableGUIDAndCounts)
822 GUIDSet.insert(GUID);
823 for (
auto Iter = GUIDSet.begin(); Iter != GUIDSet.end(); Iter++) {
824 if (Iter != GUIDSet.begin())
834 PromotedFuncCount.
push_back({Candidate.Index, Candidate.Count});
836 assert(TotalFuncCount >= Candidate.Count &&
837 "Within one prof metadata, total count is the sum of counts from "
838 "individual <target, count> pairs");
842 TotalFuncCount -= std::min(TotalFuncCount, Candidate.Count);
843 NumOfPGOICallPromotion++;
846 if (PromotedFuncCount.
empty())
855 for (
size_t I = 0;
I < PromotedFuncCount.
size();
I++) {
856 uint32_t
Index = PromotedFuncCount[
I].first;
857 ICallProfDataRef[
Index].Count -=
858 std::max(PromotedFuncCount[
I].second, ICallProfDataRef[Index].
Count);
860 updateFuncValueProfiles(CB, ICallProfDataRef, TotalFuncCount, NumCandidates);
861 updateVPtrValueProfiles(VPtr, VTableGUIDCounts);
867bool IndirectCallPromoter::processFunction(ProfileSummaryInfo *PSI) {
869 ICallPromotionAnalysis ICallAnalysis;
871 uint32_t NumCandidates;
874 CB, TotalCount, NumCandidates);
880 LLVM_DEBUG(
dbgs() <<
"Don't promote the cold candidate: TotalCount="
881 << TotalCount <<
"\n");
886 LLVM_DEBUG(
dbgs() <<
"Don't promote the non-hot candidate: TotalCount="
887 << TotalCount <<
"\n");
892 auto PromotionCandidates = getPromotionCandidatesForCallSite(
893 *CB, ICallProfDataRef, TotalCount, NumCandidates);
895 VTableGUIDCountsMap VTableGUIDCounts;
897 computeVTableInfos(CB, VTableGUIDCounts, PromotionCandidates);
899 if (isProfitableToCompareVTables(*CB, PromotionCandidates))
900 Changed |= tryToPromoteWithVTableCmp(*CB, VPtr, PromotionCandidates,
901 TotalCount, NumCandidates,
902 ICallProfDataRef, VTableGUIDCounts);
904 Changed |= tryToPromoteWithFuncCmp(*CB, VPtr, PromotionCandidates,
905 TotalCount, ICallProfDataRef,
906 NumCandidates, VTableGUIDCounts);
913bool IndirectCallPromoter::isProfitableToCompareVTables(
917 LLVM_DEBUG(
dbgs() <<
"\nEvaluating vtable profitability for callsite #"
918 << NumOfPGOICallsites << CB <<
"\n");
919 const size_t CandidateSize = Candidates.
size();
920 for (
size_t I = 0;
I < CandidateSize;
I++) {
921 auto &Candidate = Candidates[
I];
922 auto &VTableGUIDAndCounts = Candidate.VTableGUIDAndCounts;
925 dbgs() <<
" Candidate " <<
I <<
" FunctionCount: " << Candidate.Count
926 <<
", VTableCounts:";
927 for (
const auto &[GUID,
Count] : VTableGUIDAndCounts)
933 uint64_t CandidateVTableCount = 0;
935 for (
auto &[GUID,
Count] : VTableGUIDAndCounts) {
936 CandidateVTableCount +=
Count;
938 if (shouldSkipVTable(GUID))
944 dbgs() <<
" function count " << Candidate.Count
945 <<
" and its vtable sum count " << CandidateVTableCount
946 <<
" have discrepancies. Bail out vtable comparison.\n");
956 int MaxNumVTable = 1;
957 if (
I == CandidateSize - 1)
960 if ((
int)Candidate.AddressPoints.size() > MaxNumVTable) {
961 LLVM_DEBUG(
dbgs() <<
" allow at most " << MaxNumVTable <<
" and got "
962 << Candidate.AddressPoints.size()
963 <<
" vtables. Bail out for vtable comparison.\n");
971bool IndirectCallPromoter::shouldSkipVTable(uint64_t VTableGUID) {
972 if (IgnoredBaseTypes.empty())
977 assert(VTableVar &&
"VTableVar must exist for GUID in VTableGUIDAndCounts");
980 VTableVar->
getMetadata(LLVMContext::MD_type, Types);
982 for (
auto *
Type : Types)
984 if (IgnoredBaseTypes.contains(TypeId->getString())) {
986 "out of vtable comparison.");
1000 VirtualCallSiteTypeInfoMap &VirtualCSInfo) {
1011 if (!TypeTestFunc || TypeTestFunc->
use_empty())
1027 if (!CompatibleTypeId)
1034 auto &DT = LookupDomTree(*CI->getFunction());
1037 for (
auto &DevirtCall : DevirtCalls) {
1045 VirtualCSInfo[&CB] = {DevirtCall.Offset, VTablePtr,
1046 CompatibleTypeId->getString()};
1058 std::string SymtabFailure =
toString(std::move(
E));
1059 M.getContext().emitError(
"Failed to create symtab: " + SymtabFailure);
1063 VirtualCallSiteTypeInfoMap VirtualCSInfo;
1080 VTableAddressPointOffsetValMap VTableAddressPointOffsetVal;
1083 if (
F.isDeclaration() ||
F.hasOptNone())
1090 IndirectCallPromoter CallPromoter(
F, M, &Symtab, SamplePGO, VirtualCSInfo,
1091 VTableAddressPointOffsetVal,
1092 IgnoredBaseTypes, ORE);
1093 bool FuncChanged = CallPromoter.processFunction(PSI);
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
This file defines the DenseMap class.
This header defines various interfaces for pass management in LLVM.
Machine Check Debug Module
static bool processFunction(Function &F, NVPTXTargetMachine &TM)
This file provides the interface for IR based instrumentation passes ( (profile-gen,...
FunctionAnalysisManager FAM
ModuleAnalysisManager MAM
This file contains the declarations for profiling metadata utility functions.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
Class for arbitrary precision integers.
Represent a constant reference to an array (0 or more elements consecutively in memory),...
size_t size() const
Get the array size.
bool empty() const
Check if the array is empty.
LLVM Basic Block Representation.
LLVM_ABI const_iterator getFirstInsertionPt() const
Returns an iterator to the first instruction in this block that is suitable for inserting a non-PHI i...
LLVM_ABI const BasicBlock * getUniquePredecessor() const
Return the predecessor of this block if it has a unique predecessor block.
InstListType::iterator iterator
Instruction iterators...
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction; assumes that the block is well-formed.
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
static Constant * getInBoundsPtrAdd(Constant *Ptr, Constant *Offset)
Create a getelementptr inbounds i8, ptr, offset constant expression.
This is an important base class in LLVM.
iterator find(const_arg_type_t< KeyT > Val)
Implements a dense probed hash-table based set.
Analysis pass which computes a DominatorTree.
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Lightweight error class with error context and mandatory checking.
MDNode * getMetadata(unsigned KindID) const
Get the metadata of given kind attached to this GlobalObject.
LLVM_ABI bool isDeclaration() const
Return true if the primary definition of this global value is outside of the current translation unit...
A symbol table used for function [IR]PGO name look-up with keys (such as pointers,...
GlobalVariable * getGlobalVariable(uint64_t MD5Hash) const
Return the global variable corresponding to md5 hash.
LLVM_ABI Error create(object::SectionRef &Section)
Create InstrProfSymtab from an object file section which contains function PGO names.
Function * getFunction(uint64_t FuncMD5Hash) const
Return function from the name's md5 hash. Return nullptr if not found.
LLVM_ABI bool isDebugOrPseudoInst() const LLVM_READONLY
Return true if the instruction is a DbgInfoIntrinsic or PseudoProbeInst.
LLVM_ABI unsigned getNumSuccessors() const LLVM_READONLY
Return the number of successors that this instruction has.
MDNode * getMetadata(unsigned KindID) const
Get the metadata of given kind attached to this Instruction.
LLVM_ABI void setMetadata(unsigned KindID, MDNode *Node)
Set the metadata of the specified kind to the specified node.
This is an important class for using LLVM in a threaded context.
LLVM_ABI MDNode * createBranchWeights(uint32_t TrueWeight, uint32_t FalseWeight, bool IsExpected=false)
Return metadata containing two branch weights.
A Module instance is used to store all the information related to an LLVM module.
Represent a mutable reference to an array (0 or more elements consecutively in memory),...
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
An analysis pass based on the new PM to deliver ProfileSummaryInfo.
Analysis providing profile information.
bool hasProfileSummary() const
Returns true if profile summary is available.
LLVM_ABI bool isColdCount(uint64_t C) const
Returns true if count C is considered cold.
LLVM_ABI bool isHotCount(uint64_t C) const
Returns true if count C is considered hot.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Represent a constant reference to a string, i.e.
Target - Wrapper for Target specific information.
The instances of the Type class are immutable: once they are created, they are never changed.
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
A Use represents the edge between a Value definition and its users.
User * getUser() const
Returns the User that contains this Use.
LLVMContext & getContext() const
All values hold a context through their type.
iterator_range< use_iterator > uses()
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
void insert_range(Range &&R)
const ParentTy * getParent() const
@ C
The default llvm calling convention, compatible with C.
@ BasicBlock
Various leaf nodes.
LLVM_ABI Function * getDeclarationIfExists(const Module *M, ID id)
Look up the Function declaration of the intrinsic id in the Module M and return it if it exists.
initializer< Ty > init(const Ty &Val)
Add a small namespace to avoid name clashes with the classes used in the streaming interface.
DiagnosticInfoOptimizationBase::Argument NV
LLVM_ABI CallBase & promoteIndirectCall(CallBase &CB, Function *F, uint64_t Count, uint64_t TotalCount, bool AttachProfToDirectCall, OptimizationRemarkEmitter *ORE)
NodeAddr< FuncNode * > Func
friend class Instruction
Iterator for Instructions in a `BasicBlock.
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
void stable_sort(R &&Range)
LLVM_ABI bool isLegalToPromote(const CallBase &CB, Function *Callee, const char **FailureReason=nullptr)
Return true if the given indirect call site can be made to call Callee.
std::vector< CallBase * > findIndirectCalls(Function &F)
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
LLVM_ABI CallBase & promoteCallWithIfThenElse(CallBase &CB, Function *Callee, MDNode *BranchWeights=nullptr)
Promote the given indirect call site to conditionally call Callee.
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
InnerAnalysisManagerProxy< FunctionAnalysisManager, Module > FunctionAnalysisManagerModuleProxy
Provide the FunctionAnalysisManager to Module proxy.
cl::opt< unsigned > MaxNumVTableAnnotations("icp-max-num-vtables", cl::init(6), cl::Hidden, cl::desc("Max number of vtables annotated for a vtable load instruction."))
auto upper_bound(R &&Range, T &&Value)
Provide wrappers to std::upper_bound which take ranges instead of having to pass begin/end explicitly...
cl::opt< bool > EnableVTableProfileUse("enable-vtable-profile-use", cl::init(false), cl::desc("If ThinLTO and WPD is enabled and this option is true, vtable " "profiles will be used by ICP pass for more efficient indirect " "call sequence. If false, type profiles won't be used."))
LLVM_ABI void annotateValueSite(Module &M, Instruction &Inst, const InstrProfRecord &InstrProfR, InstrProfValueKind ValueKind, uint32_t SiteIndx, uint32_t MaxMDCount=3)
Get the value profile data for value site SiteIdx from InstrProfR and annotate the instruction Inst w...
auto reverse(ContainerTy &&C)
void sort(IteratorTy Start, IteratorTy End)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
FunctionAddr VTableAddr Count
LLVM_ABI SmallVector< InstrProfValueData, 4 > getValueProfDataFromInst(const Instruction &Inst, InstrProfValueKind ValueKind, uint32_t MaxNumValueData, uint64_t &TotalC, bool GetNoICPValue=false)
Extract the value profile data from Inst and returns them if Inst is annotated with value profile dat...
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
MutableArrayRef(T &OneElt) -> MutableArrayRef< T >
ArrayRef(const T &OneElt) -> ArrayRef< T >
std::string toString(const APInt &I, unsigned Radix, bool Signed, bool formatAsCLiteral=false, bool UpperCase=true, bool InsertSeparators=false)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
uint32_t scaleBranchCount(uint64_t Count, uint64_t Scale)
Scale an individual branch count.
LLVM_ABI void setFittedBranchWeights(Instruction &I, ArrayRef< uint64_t > Weights, bool IsExpected, bool ElideAllZero=false)
Variant of setBranchWeights where the Weights will be fit first to uint32_t by shifting right.
uint64_t calculateCountScale(uint64_t MaxCount)
Calculate what to divide by to scale counts.
LLVM_ABI CallBase & promoteCallWithVTableCmp(CallBase &CB, Instruction *VPtr, Function *Callee, ArrayRef< Constant * > AddressPoints, MDNode *BranchWeights)
This is similar to promoteCallWithIfThenElse except that the condition to promote a virtual call is t...
LLVM_ABI void findDevirtualizableCallsForTypeTest(SmallVectorImpl< DevirtCallSite > &DevirtCalls, SmallVectorImpl< CallInst * > &Assumes, const CallInst *CI, DominatorTree &DT)
Given a call to the intrinsic @llvm.type.test, find all devirtualizable call sites based on the call ...
AnalysisManager< Module > ModuleAnalysisManager
Convenience typedef for the Module analysis manager.
LLVM_ABI std::pair< Function *, Constant * > getFunctionAtVTableOffset(GlobalVariable *GV, uint64_t Offset, Module &M)
Given a vtable and a specified offset, returns the function and the trivial pointer at the specified ...
static Instruction * tryGetVTableInstruction(CallBase *CB)