19#include "llvm/Config/config.h"
53#include <system_error>
60#define DEBUG_TYPE "instrprof"
64 cl::desc(
"Use full module build paths in the profile counter names for "
65 "static functions."));
77 cl::desc(
"Strip specified level of directory name from source path in "
78 "the profile counter name for static functions."));
81 const std::string &ErrMsg =
"") {
86 case instrprof_error::success:
89 case instrprof_error::eof:
92 case instrprof_error::unrecognized_format:
93 OS <<
"unrecognized instrumentation profile encoding format";
95 case instrprof_error::bad_magic:
96 OS <<
"invalid instrumentation profile data (bad magic)";
98 case instrprof_error::bad_header:
99 OS <<
"invalid instrumentation profile data (file header is corrupt)";
101 case instrprof_error::unsupported_version:
102 OS <<
"unsupported instrumentation profile format version";
104 case instrprof_error::unsupported_hash_type:
105 OS <<
"unsupported instrumentation profile hash type";
107 case instrprof_error::too_large:
108 OS <<
"too much profile data";
110 case instrprof_error::truncated:
111 OS <<
"truncated profile data";
113 case instrprof_error::malformed:
114 OS <<
"malformed instrumentation profile data";
116 case instrprof_error::missing_correlation_info:
117 OS <<
"debug info/binary for correlation is required";
119 case instrprof_error::unexpected_correlation_info:
120 OS <<
"debug info/binary for correlation is not necessary";
122 case instrprof_error::unable_to_correlate_profile:
123 OS <<
"unable to correlate profile";
125 case instrprof_error::invalid_prof:
126 OS <<
"invalid profile created. Please file a bug "
127 "at: " BUG_REPORT_URL
128 " and include the profraw files that caused this error.";
130 case instrprof_error::unknown_function:
131 OS <<
"no profile data available for function";
133 case instrprof_error::hash_mismatch:
134 OS <<
"function control flow change detected (hash mismatch)";
136 case instrprof_error::count_mismatch:
137 OS <<
"function basic block count change detected (counter mismatch)";
139 case instrprof_error::bitmap_mismatch:
140 OS <<
"function bitmap size change detected (bitmap size mismatch)";
142 case instrprof_error::counter_overflow:
143 OS <<
"counter overflow";
145 case instrprof_error::value_site_count_mismatch:
146 OS <<
"function value site count change detected (counter mismatch)";
148 case instrprof_error::compress_failed:
149 OS <<
"failed to compress data (zlib)";
151 case instrprof_error::uncompress_failed:
152 OS <<
"failed to uncompress data (zlib)";
154 case instrprof_error::empty_raw_profile:
155 OS <<
"empty raw profile file";
157 case instrprof_error::zlib_unavailable:
158 OS <<
"profile uses zlib compression but the profile reader was built "
159 "without zlib support";
161 case instrprof_error::raw_profile_version_mismatch:
162 OS <<
"raw profile version mismatch";
164 case instrprof_error::counter_value_too_large:
165 OS <<
"excessively large counter value suggests corrupted profile data";
171 OS <<
": " << ErrMsg;
181class InstrProfErrorCategoryType :
public std::error_category {
// Reports this error category's identifying name: the fixed string "llvm.instrprof".
182 const char *
name()
const noexcept
override {
return "llvm.instrprof"; }
184 std::string message(
int IE)
const override {
192 static InstrProfErrorCategoryType ErrorCategory;
193 return ErrorCategory;
198const char *InstrProfSectNameCommon[] = {
199#define INSTR_PROF_SECT_ENTRY(Kind, SectNameCommon, SectNameCoff, Prefix) \
204const char *InstrProfSectNameCoff[] = {
205#define INSTR_PROF_SECT_ENTRY(Kind, SectNameCommon, SectNameCoff, Prefix) \
210const char *InstrProfSectNamePrefix[] = {
211#define INSTR_PROF_SECT_ENTRY(Kind, SectNameCommon, SectNameCoff, Prefix) \
221 "enable-name-compression",
225 "enable-vtable-value-profiling",
cl::init(
false),
226 cl::desc(
"If true, the virtual table address will be instrumented to know "
227 "the types of a C++ pointer. The information is used in indirect "
228 "call promotion to do selective vtable-based comparison."));
231 "enable-vtable-profile-use",
cl::init(
false),
232 cl::desc(
"If ThinLTO and WPD is enabled and this option is true, vtable "
233 "profiles will be used by ICP pass for more efficient indirect "
234 "call sequence. If false, type profiles won't be used."));
238 bool AddSegmentInfo) {
239 std::string SectName;
242 SectName = InstrProfSectNamePrefix[IPSK];
245 SectName += InstrProfSectNameCoff[IPSK];
247 SectName += InstrProfSectNameCommon[IPSK];
249 if (OF ==
Triple::MachO && IPSK == IPSK_data && AddSegmentInfo)
250 SectName +=
",regular,live_support";
270 std::string NewName = std::string(
Name);
276 if (FileName.
empty())
277 NewName = NewName.insert(0,
"<unknown>:");
279 NewName = NewName.insert(0, FileName.
str() +
":");
290 for (
const auto &CI : PathNameStr) {
299 return PathNameStr.
substr(LastPos);
350 MDNode *PGONameMetadata) {
358 return *IRPGOFuncName;
405 if (MangledName.empty())
406 return std::make_pair(
StringRef(), IRPGOName);
407 return std::make_pair(FileName, MangledName);
411 if (FileName.
empty())
431 const char InvalidChars[] =
"-:;<>/\"'";
432 size_t FoundPos = VarName.find_first_of(InvalidChars);
433 while (FoundPos != std::string::npos) {
434 VarName[FoundPos] =
'_';
435 FoundPos = VarName.find_first_of(InvalidChars, FoundPos + 1);
441 const auto &
T =
Triple(M.getTargetTriple());
442 return T.isAMDGPU() ||
T.isNVPTX();
501 if (!
G.hasName() || !
G.hasMetadata(LLVMContext::MD_type))
518 bool Inserted =
true;
519 std::tie(std::ignore, Inserted) =
525 if (
Error E = NameToGUIDMap(VTablePGOName))
528 StringRef CanonicalName = getCanonicalName(VTablePGOName);
529 if (CanonicalName != VTablePGOName)
530 return NameToGUIDMap(CanonicalName);
549 const bool IsCompressed = (CompressedSize != 0);
557 UncompressedNameStrings,
563 NameStrings = toStringRef(UncompressedNameStrings);
566 StringRef(
reinterpret_cast<const char *
>(
P), UncompressedSize);
567 P += UncompressedSize;
576 while (
P < EndP && *
P == 0)
592 this, std::placeholders::_1)))
603 CompressedVTableStrings,
617 const std::string UniqSuffix =
".__uniq.";
618 size_t Pos = PGOName.
find(UniqSuffix);
620 Pos += UniqSuffix.length();
626 Pos = PGOName.
find(
'.', Pos);
628 return PGOName.
substr(0, Pos);
641 if (
Error E = NameToGUIDMap(PGOFuncName))
647 StringRef CanonicalFuncName = getCanonicalName(PGOFuncName);
648 if (CanonicalFuncName != PGOFuncName)
649 return NameToGUIDMap(CanonicalFuncName);
662 auto It =
partition_point(AddrToMD5Map, [=](std::pair<uint64_t, uint64_t>
A) {
669 if (It != AddrToMD5Map.end() && It->first ==
Address)
682 bool DoCompression, std::string &Result) {
683 assert(!NameStrs.
empty() &&
"No name data to emit");
686 std::string UncompressedNameStrings =
691 "PGO name is invalid (contains separator token)");
693 unsigned EncLen =
encodeULEB128(UncompressedNameStrings.length(),
P);
696 auto WriteStringToResult = [&](
size_t CompressedLen,
StringRef InputStr) {
699 char *HeaderStr =
reinterpret_cast<char *
>(&Header[0]);
700 unsigned HeaderLen =
P - &Header[0];
701 Result.append(HeaderStr, HeaderLen);
706 if (!DoCompression) {
707 return WriteStringToResult(0, UncompressedNameStrings);
712 CompressedNameStrings,
715 return WriteStringToResult(CompressedNameStrings.
size(),
716 toStringRef(CompressedNameStrings));
722 Arr->isCString() ? Arr->getAsCString() : Arr->getAsString();
727 std::string &Result,
bool DoCompression) {
728 std::vector<std::string> NameStrs;
729 for (
auto *NameVar : NameVars) {
737 std::string &Result,
bool DoCompression) {
738 std::vector<std::string> VTableNameStrs;
739 for (
auto *VTable : VTables)
740 VTableNameStrs.push_back(
getPGOName(*VTable));
753 for (
uint32_t VK = IPVK_First; VK <= IPVK_Last; ++VK) {
756 for (
size_t I = 0;
I < NumValueSites; ++
I) {
770 double Score = 0.0f, FuncLevelScore = 0.0f;
775 while (
I != IE && J != JE) {
776 if (
I->Value == J->Value) {
784 }
else if (
I->Value < J->Value) {
800 assert(ThisNumValueSites ==
Other.getNumValueSites(ValueKind));
801 if (!ThisNumValueSites)
804 std::vector<InstrProfValueSiteRecord> &ThisSiteRecords =
805 getOrCreateValueSitesForKind(ValueKind);
807 Other.getValueSitesForKind(ValueKind);
809 ThisSiteRecords[
I].
overlap(OtherSiteRecords[
I], ValueKind, Overlap,
819 bool Mismatch = (
Counts.size() !=
Other.Counts.size());
823 for (
uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind) {
826 if (ThisNumValueSites != OtherNumValueSites) {
838 for (
uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind)
844 for (
size_t I = 0, E =
Other.Counts.size();
I < E; ++
I) {
847 MaxCount = std::max(
Other.Counts[
I], MaxCount);
852 if (MaxCount >= ValueCutoff) {
853 double FuncScore = 0.0;
854 for (
size_t I = 0, E =
Other.Counts.size();
I < E; ++
I)
860 FuncLevelOverlap.
Valid =
true;
871 std::vector<InstrProfValueData> Merged;
873 for (
const InstrProfValueData &J : Input.
ValueData) {
874 while (
I != IE &&
I->Value < J.Value) {
875 Merged.push_back(*
I);
878 if (
I != IE &&
I->Value == J.Value) {
883 Merged.push_back(*
I);
889 Merged.insert(Merged.end(),
I, IE);
905void InstrProfRecord::mergeValueProfData(
909 uint32_t OtherNumValueSites = Src.getNumValueSites(ValueKind);
910 if (ThisNumValueSites != OtherNumValueSites) {
914 if (!ThisNumValueSites)
916 std::vector<InstrProfValueSiteRecord> &ThisSiteRecords =
917 getOrCreateValueSitesForKind(ValueKind);
919 Src.getValueSitesForKind(ValueKind);
921 ThisSiteRecords[
I].
merge(OtherSiteRecords[
I], Weight, Warn);
951 for (
size_t I = 0, E =
Other.Counts.size();
I < E; ++
I) {
972 for (
size_t I = 0, E =
Other.BitmapBytes.size();
I < E; ++
I) {
976 for (
uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind)
977 mergeValueProfData(Kind,
Other, Weight, Warn);
980void InstrProfRecord::scaleValueProfData(
983 for (
auto &R : getValueSitesForKind(ValueKind))
989 assert(
D != 0 &&
"D cannot be 0");
990 for (
auto &Count : this->
Counts) {
1000 for (
uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind)
1001 scaleValueProfData(Kind,
N,
D, Warn);
1010 if (ValueKind == IPVK_IndirectCallTarget)
1013 if (ValueKind == IPVK_VTableTarget)
1023 std::vector<InstrProfValueData> RemappedVD;
1024 RemappedVD.reserve(VData.
size());
1025 for (
const auto &V : VData) {
1027 RemappedVD.push_back({NewValue, V.Count});
1030 std::vector<InstrProfValueSiteRecord> &ValueSites =
1031 getOrCreateValueSitesForKind(ValueKind);
1032 assert(ValueSites.size() == Site);
1035 ValueSites.emplace_back(std::move(RemappedVD));
1040 bool RemoveOutlierUNs) {
1043 UtilityNodeT MaxUN = 0;
1049 for (
auto &
Trace : Traces) {
1050 size_t CutoffTimestamp = 1;
1056 It->getSecond() = std::min<size_t>(It->getSecond(),
Timestamp);
1063 for (
auto &[Id, FirstUN] : IdToFirstUN)
1064 for (
auto UN = FirstUN; UN <= MaxUN; ++UN)
1065 IdToUNs[Id].push_back(UN);
1067 IdToFirstUN.
clear();
1070 if (RemoveOutlierUNs) {
1072 for (
auto &[Id, UNs] : IdToUNs)
1073 for (
auto &UN : UNs)
1077 for (
auto &[Id, UNs] : IdToUNs)
1079 return UNFrequency[UN] <= 1 || 2 * UNFrequency[UN] > IdToUNs.
size();
1083 for (
auto &[Id, UNs] : IdToUNs)
1084 Nodes.emplace_back(Id, UNs);
1089 return std::make_pair(IdToFirstTimestamp[L.Id], L.Id) <
1090 std::make_pair(IdToFirstTimestamp[R.Id], R.Id);
1094#define INSTR_PROF_COMMON_API_IMPL
1108 ->getNumValueSites(VKind);
1113 ->getNumValueData(VKind);
1125 llvm::copy(IPR->getValueArrayForSite(K, S), Dst);
1130 (ValueProfData *)(
new (::operator
new(TotalSizeInBytes)) ValueProfData());
1131 memset(VD, 0, TotalSizeInBytes);
1148 Closure.Record = &
Record;
1149 return getValueProfDataSize(&Closure);
1153std::unique_ptr<ValueProfData>
1157 std::unique_ptr<ValueProfData> VPD(
1164 Record.reserveSites(Kind, NumValueSites);
1166 InstrProfValueData *ValueData = getValueProfRecordValueData(
this);
1167 for (
uint64_t VSite = 0; VSite < NumValueSites; ++VSite) {
1168 uint8_t ValueDataCount = this->SiteCountArray[VSite];
1170 Record.addValueData(Kind, VSite, VDs, SymTab);
1171 ValueData += ValueDataCount;
1179 using namespace support;
1185 sys::swapByteOrder<uint32_t>(NumValueSites);
1186 sys::swapByteOrder<uint32_t>(Kind);
1188 uint32_t ND = getValueProfRecordNumValueData(
this);
1189 InstrProfValueData *VD = getValueProfRecordValueData(
this);
1193 sys::swapByteOrder<uint64_t>(VD[
I].
Value);
1194 sys::swapByteOrder<uint64_t>(VD[
I].Count);
1197 sys::swapByteOrder<uint32_t>(NumValueSites);
1198 sys::swapByteOrder<uint32_t>(Kind);
1204 if (NumValueKinds == 0)
1207 ValueProfRecord *VR = getFirstValueProfRecord(
this);
1208 for (
uint32_t K = 0;
K < NumValueKinds;
K++) {
1209 VR->deserializeTo(
Record, SymTab);
1210 VR = getValueProfRecordNext(VR);
1215 return std::unique_ptr<ValueProfData>(
new (::operator
new(TotalSize))
1219Error ValueProfData::checkIntegrity() {
1220 if (NumValueKinds > IPVK_Last + 1)
1221 return make_error<InstrProfError>(
1225 return make_error<InstrProfError>(
1228 ValueProfRecord *VR = getFirstValueProfRecord(
this);
1229 for (
uint32_t K = 0; K < this->NumValueKinds; K++) {
1230 if (VR->Kind > IPVK_Last)
1232 "value kind is invalid");
1233 VR = getValueProfRecordNext(VR);
1234 if ((
char *)VR - (
char *)
this > (
ptrdiff_t)TotalSize)
1235 return make_error<InstrProfError>(
1237 "value profile address is greater than total size");
1243ValueProfData::getValueProfData(
const unsigned char *
D,
1244 const unsigned char *
const BufferEnd,
1246 using namespace support;
1248 if (
D +
sizeof(ValueProfData) > BufferEnd)
1251 const unsigned char *Header =
D;
1252 uint32_t TotalSize = endian::readNext<uint32_t>(Header, Endianness);
1254 if (
D + TotalSize > BufferEnd)
1258 memcpy(VPD.get(),
D, TotalSize);
1260 VPD->swapBytesToHost(Endianness);
1262 Error E = VPD->checkIntegrity();
1264 return std::move(E);
1266 return std::move(VPD);
1270 using namespace support;
1275 sys::swapByteOrder<uint32_t>(TotalSize);
1276 sys::swapByteOrder<uint32_t>(NumValueKinds);
1278 ValueProfRecord *VR = getFirstValueProfRecord(
this);
1279 for (
uint32_t K = 0;
K < NumValueKinds;
K++) {
1281 VR = getValueProfRecordNext(VR);
1286 using namespace support;
1291 ValueProfRecord *VR = getFirstValueProfRecord(
this);
1292 for (
uint32_t K = 0;
K < NumValueKinds;
K++) {
1293 ValueProfRecord *NVR = getValueProfRecordNext(VR);
1297 sys::swapByteOrder<uint32_t>(TotalSize);
1298 sys::swapByteOrder<uint32_t>(NumValueKinds);
1309 for (
const InstrProfValueData &V : VDs)
1334 for (
const auto &VD : VDs) {
1355 if (!
Tag ||
Tag->getString() !=
"VP")
1371 bool GetNoICPValue) {
1385 ValueData.
reserve((NOps - 3) / 2);
1386 for (
unsigned I = 3;
I < NOps;
I += 2) {
1387 if (ValueData.
size() >= MaxNumValueData)
1391 mdconst::dyn_extract<ConstantInt>(MD->
getOperand(
I + 1));
1392 if (!
Value || !Count) {
1399 InstrProfValueData V;
1400 V.Value =
Value->getZExtValue();
1463 M->getNamedGlobal(INSTR_PROF_QUOTE(INSTR_PROF_RAW_VERSION_VAR));
1476 auto *InitVal = dyn_cast_or_null<ConstantInt>(IRInstrVar->
getInitializer());
1479 return (InitVal->getZExtValue() & VARIANT_MASK_IR_PROF) != 0;
1484 if (
F.getName().empty())
1490 if (CheckAddressTaken &&
F.hasAddressTaken())
1498 if (!
F.hasComdat()) {
1507 if (InstrProfileOutput.
empty())
1513 ProfileNameConst, INSTR_PROF_QUOTE(INSTR_PROF_PROFILE_NAME_VAR));
1515 Triple TT(M.getTargetTriple());
1516 if (TT.supportsCOMDAT()) {
1518 ProfileNameVar->
setComdat(M.getOrInsertComdat(
1519 StringRef(INSTR_PROF_QUOTE(INSTR_PROF_PROFILE_NAME_VAR))));
1524 const std::string &TestFilename,
1526 auto GetProfileSum = [IsCS](
const std::string &Filename,
1532 if (
Error E = ReaderOrErr.takeError()) {
1535 auto Reader = std::move(ReaderOrErr.get());
1536 Reader->accumulateCounts(Sum, IsCS);
1554 for (
unsigned I = 0;
I < IPVK_Last - IPVK_First + 1;
I++) {
1564 for (
unsigned I = 0;
I < IPVK_Last - IPVK_First + 1;
I++) {
1574 const char *EntryName =
1575 (Level ==
ProgramLevel ?
"functions" :
"edge counters");
1577 OS <<
"Profile overlap infomation for base_profile: " << *
BaseFilename
1578 <<
" and test_profile: " << *
TestFilename <<
"\nProgram level:\n";
1580 OS <<
"Function level:\n"
1589 OS <<
" # of " << EntryName
1595 OS <<
" Mismatched count percentage (Edge): "
1598 OS <<
" Percentage of Edge profile only in test_profile: "
1605 for (
unsigned I = 0;
I < IPVK_Last - IPVK_First + 1;
I++) {
1608 char ProfileKindName[20] = {0};
1610 case IPVK_IndirectCallTarget:
1611 strncpy(ProfileKindName,
"IndirectCall", 19);
1613 case IPVK_MemOPSize:
1614 strncpy(ProfileKindName,
"MemOP", 19);
1616 case IPVK_VTableTarget:
1617 strncpy(ProfileKindName,
"VTable", 19);
1620 snprintf(ProfileKindName, 19,
"VP[%d]",
I);
1623 OS <<
" " << ProfileKindName
1627 OS <<
" Mismatched count percentage (" << ProfileKindName
1630 OS <<
" Percentage of " << ProfileKindName
1631 <<
" profile only in test_profile: "
1633 OS <<
" " << ProfileKindName
1636 <<
" " << ProfileKindName
1642namespace IndexedInstrProf {
1644 using namespace support;
1645 static_assert(std::is_standard_layout_v<Header>,
1646 "Use standard layout for Header for simplicity");
1649 H.Magic = endian::readNext<uint64_t, llvm::endianness::little>(Buffer);
1655 H.Version = endian::readNext<uint64_t, llvm::endianness::little>(Buffer);
1656 if (
H.getIndexedProfileVersion() >
1661 "Please update the reader as needed when a new field is added "
1662 "or when indexed profile version gets bumped.");
1665 H.HashType = endian::readNext<uint64_t, llvm::endianness::little>(Buffer);
1666 H.HashOffset = endian::readNext<uint64_t, llvm::endianness::little>(Buffer);
1667 if (
H.getIndexedProfileVersion() >= 8)
1669 endian::readNext<uint64_t, llvm::endianness::little>(Buffer);
1670 if (
H.getIndexedProfileVersion() >= 9)
1672 endian::readNext<uint64_t, llvm::endianness::little>(Buffer);
1674 if (
H.getIndexedProfileVersion() >= 10)
1675 H.TemporalProfTracesOffset =
1676 endian::readNext<uint64_t, llvm::endianness::little>(Buffer);
1677 if (
H.getIndexedProfileVersion() >= 12)
1678 H.VTableNamesOffset =
1679 endian::readNext<uint64_t, llvm::endianness::little>(Buffer);
1694 "Please update the size computation below if a new field has "
1695 "been added to the header; for a version bump without new "
1696 "fields, add a case statement to fall through to the latest version.");
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
#define LLVM_ATTRIBUTE_UNUSED
This file contains the declarations for the subclasses of Constant, which represent the different fla...
Module.h This file contains the declarations for the Module class.
static cl::opt< bool > StaticFuncFullModulePrefix("static-func-full-module-prefix", cl::init(true), cl::Hidden, cl::desc("Use full module build paths in the profile counter names for " "static functions."))
static cl::opt< unsigned > StaticFuncStripDirNamePrefix("static-func-strip-dirname-prefix", cl::init(0), cl::Hidden, cl::desc("Strip specified level of directory name from source path in " "the profile counter name for static functions."))
static std::string getInstrProfErrString(instrprof_error Err, const std::string &ErrMsg="")
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file defines the SmallVector class.
Defines the virtual file system interface vfs::FileSystem.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
size_t size() const
size - Get the array size.
bool empty() const
empty - Check if the array is empty.
static Constant * getString(LLVMContext &Context, StringRef Initializer, bool AddNull=true)
This method constructs a CDS and initializes it with a text string.
This is the shared class of boolean and integer constants.
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
This is an important base class in LLVM.
std::pair< iterator, bool > try_emplace(KeyT &&Key, Ts &&...Args)
Lightweight error class with error context and mandatory checking.
static ErrorSuccess success()
Create a success value.
Tagged union holding either a T or an Error.
void setMetadata(unsigned KindID, MDNode *Node)
Set a particular kind of metadata attachment.
void setComdat(Comdat *C)
MDNode * getMetadata(unsigned KindID) const
Get the current metadata attachments for the given kind, if any.
static bool isLocalLinkage(LinkageTypes Linkage)
bool isDeclaration() const
Return true if the primary definition of this global value is outside of the current translation unit...
LinkageTypes getLinkage() const
bool hasLocalLinkage() const
void setLinkage(LinkageTypes LT)
GUID getGUID() const
Return a 64-bit global unique ID constructed from global value name (i.e.
Module * getParent()
Get the module that this global value is contained inside of...
bool isDiscardableIfUnused() const
@ HiddenVisibility
The GV is hidden.
@ ProtectedVisibility
The GV is protected.
void setVisibility(VisibilityTypes V)
std::string getGlobalIdentifier() const
Return the modified name for this global value suitable to be used as the key for a global lookup (e....
LinkageTypes
An enumeration for the kinds of linkage for global values.
@ PrivateLinkage
Like Internal, but omit from symbol table.
@ InternalLinkage
Rename collisions when linking (static functions).
@ LinkOnceAnyLinkage
Keep one copy of function when linking (inline)
@ ExternalLinkage
Externally visible function.
@ WeakAnyLinkage
Keep one copy of named function when linking (weak)
@ AvailableExternallyLinkage
Available for inspection, not emission.
@ ExternalWeakLinkage
ExternalWeak linkage description.
@ LinkOnceODRLinkage
Same, but only replaced by something equivalent.
const Constant * getInitializer() const
getInitializer - Return the initializer for this global variable.
bool hasInitializer() const
Definitions have initializers, declarations don't.
std::string message() const override
Return the error message as a string.
static Expected< std::unique_ptr< InstrProfReader > > create(const Twine &Path, vfs::FileSystem &FS, const InstrProfCorrelator *Correlator=nullptr, const object::BuildIDFetcher *BIDFetcher=nullptr, const InstrProfCorrelator::ProfCorrelatorKind BIDFetcherCorrelatorKind=InstrProfCorrelator::ProfCorrelatorKind::NONE, std::function< void(Error)> Warn=nullptr)
Factory method to create an appropriately typed reader for the given instrprof file.
A symbol table used for function [IR]PGO name look-up with keys (such as pointers,...
uint64_t getFunctionHashFromAddress(uint64_t Address)
Return a function's hash, or 0, if the function isn't in this SymTab.
Error addSymbolName(StringRef SymbolName)
uint64_t getVTableHashFromAddress(uint64_t Address)
Return a vtable's hash, or 0 if the vtable doesn't exist in this SymTab.
Error addVTableName(StringRef VTableName)
Adds VTableName as a known symbol, and inserts it to a map that tracks all vtable names.
void dumpNames(raw_ostream &OS) const
Dump the symbols in this table.
Error create(object::SectionRef &Section)
Create InstrProfSymtab from an object file section which contains function PGO names.
Error addFuncName(StringRef FuncName)
The method name is kept since there are many callers.
Error initVTableNamesFromCompressedStrings(StringRef CompressedVTableNames)
Initialize 'this' with the set of vtable names encoded in CompressedVTableNames.
MDNode * getMetadata(unsigned KindID) const
Get the metadata of given kind attached to this Instruction.
void setMetadata(unsigned KindID, MDNode *Node)
Set the metadata of the specified kind to the specified node.
ValT lookup(KeyT x, ValT NotFound=ValT()) const
lookup - Return the mapped value at x or NotFound.
This is an important class for using LLVM in a threaded context.
ConstantAsMetadata * createConstant(Constant *C)
Return the given constant as metadata.
MDString * createString(StringRef Str)
Return the given string as metadata.
const MDOperand & getOperand(unsigned I) const
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
unsigned getNumOperands() const
Return number of MDNode operands.
static MDString * get(LLVMContext &Context, StringRef Str)
A Module instance is used to store all the information related to an LLVM module.
const std::string & getSourceFileName() const
Get the module's original source file name.
MutableArrayRef - Represent a mutable reference to an array (0 or more elements consecutively in memo...
void reserve(size_type N)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
iterator_range< StringMapKeyIterator< ValueTy > > keys() const
StringRef - Represent a constant reference to a string, i.e.
std::pair< StringRef, StringRef > split(char Separator) const
Split into two substrings around the first occurrence of a separator character.
std::string str() const
str - Get the contents as an std::string.
const unsigned char * bytes_end() const
constexpr StringRef substr(size_t Start, size_t N=npos) const
Return a reference to the substring from [Start, Start + N).
bool starts_with(StringRef Prefix) const
Check if this string starts with the given Prefix.
constexpr bool empty() const
empty - Check if the string is empty.
StringRef drop_front(size_t N=1) const
Return a StringRef equal to 'this' but with the first N elements dropped.
constexpr size_t size() const
size - Get the string size.
size_t find(char C, size_t From=0) const
Search for the first character C in the string.
static constexpr size_t npos
const unsigned char * bytes_begin() const
Triple - Helper class for working with autoconf configuration names.
bool supportsCOMDAT() const
Tests whether the target supports comdat.
static IntegerType * getInt32Ty(LLVMContext &C)
static IntegerType * getInt64Ty(LLVMContext &C)
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
LLVMContext & getContext() const
All values hold a context through their type.
StringRef getName() const
Return a constant reference to the value's name.
An efficient, type-erasing, non-owning reference to a callable.
A raw_ostream that writes to a file descriptor.
This class implements an extremely fast bulk output stream that can only output to a stream.
A raw_ostream that writes to an std::string.
@ C
The default llvm calling convention, compatible with C.
initializer< Ty > init(const Ty &Val)
void compress(ArrayRef< uint8_t > Input, SmallVectorImpl< uint8_t > &CompressedBuffer, int Level=DefaultCompression)
Error decompress(ArrayRef< uint8_t > Input, uint8_t *Output, size_t &UncompressedSize)
constexpr int BestSizeCompression
bool is_separator(char value, Style style=Style::native)
Check whether the given char is a path separator on the host OS.
IntrusiveRefCntPtr< FileSystem > getRealFileSystem()
Gets a vfs::FileSystem for the 'real' file system, as seen by the operating system.
This is an optimization pass for GlobalISel generic memory operations.
StringRef getInstrProfNameVarPrefix()
Return the name prefix of variables containing instrumented function names.
std::string getPGOFuncName(const Function &F, bool InLTO=false, uint64_t Version=INSTR_PROF_INDEX_VERSION)
Please use getIRPGOFuncName for LLVM IR instrumentation.
void createPGOFuncNameMetadata(Function &F, StringRef PGOFuncName)
Create the PGOFuncName meta data if PGOFuncName is different from function's raw name.
std::string getIRPGOFuncName(const Function &F, bool InLTO=false)
StringRef getPGOFuncNameMetadataName()
void getValueForSiteInstrProf(const void *R, InstrProfValueData *Dst, uint32_t K, uint32_t S)
cl::opt< bool > DoInstrProfNameCompression
StringRef getFuncNameWithoutPrefix(StringRef PGOFuncName, StringRef FileName="<unknown>")
Given a PGO function name, remove the filename prefix and return the original (static) function name.
auto partition_point(R &&Range, Predicate P)
Binary search for the first iterator in a range where a predicate is false.
uint64_t decodeULEB128(const uint8_t *p, unsigned *n=nullptr, const uint8_t *end=nullptr, const char **error=nullptr)
Utility function to decode a ULEB128 value.
void createPGONameMetadata(GlobalObject &GO, StringRef PGOName)
Create the PGOName metadata if a global object's PGO name is different from its mangled name.
std::pair< StringRef, StringRef > getParsedIRPGOName(StringRef IRPGOName)
MDNode * getPGOFuncNameMetadata(const Function &F)
Return the PGOFuncName meta data associated with a function.
static std::unique_ptr< ValueProfData > allocValueProfData(uint32_t TotalSize)
MDNode * mayHaveValueProfileOfKind(const Instruction &Inst, InstrProfValueKind ValueKind)
std::string getInstrProfSectionName(InstrProfSectKind IPSK, Triple::ObjectFormatType OF, bool AddSegmentInfo=true)
Return the name of the profile section corresponding to IPSK.
cl::opt< bool > EnableVTableProfileUse("enable-vtable-profile-use", cl::init(false), cl::desc("If ThinLTO and WPD is enabled and this option is true, vtable " "profiles will be used by ICP pass for more efficient indirect " "call sequence. If false, type profiles won't be used."))
uint64_t getInstrMaxCountValue()
Return the max count value. We reserve a few large values for special use.
bool needsComdatForCounter(const GlobalObject &GV, const Module &M)
Check if we can use Comdat for profile variables.
std::string getPGOName(const GlobalVariable &V, bool InLTO=false)
GlobalVariable * createPGOFuncNameVar(Function &F, StringRef PGOFuncName)
Create and return the global variable for function name used in PGO instrumentation.
void annotateValueSite(Module &M, Instruction &Inst, const InstrProfRecord &InstrProfR, InstrProfValueKind ValueKind, uint32_t SiteIndx, uint32_t MaxMDCount=3)
Get the value profile data for value site SiteIdx from InstrProfR and annotate the instruction Inst w...
Error collectPGOFuncNameStrings(ArrayRef< GlobalVariable * > NameVars, std::string &Result, bool doCompression=true)
Produce Result string with the same format described above.
void sort(IteratorTy Start, IteratorTy End)
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
StringRef getPGOFuncNameVarInitializer(GlobalVariable *NameVar)
Return the initializer in string of the PGO name var NameVar.
std::enable_if_t< std::is_unsigned_v< T >, T > SaturatingMultiplyAdd(T X, T Y, T A, bool *ResultOverflowed=nullptr)
Multiply two unsigned integers, X and Y, and add the unsigned integer, A to the product.
StringRef getInstrProfNameSeparator()
Return the marker used to separate PGO names during serialization.
SmallVector< InstrProfValueData, 4 > getValueProfDataFromInst(const Instruction &Inst, InstrProfValueKind ValueKind, uint32_t MaxNumValueData, uint64_t &TotalC, bool GetNoICPValue=false)
Extract the value profile data from Inst and return them if Inst is annotated with value profile dat...
format_object< Ts... > format(const char *Fmt, const Ts &... Vals)
These are helper functions used to produce formatted output.
static std::string getIRPGOObjectName(const GlobalObject &GO, bool InLTO, MDNode *PGONameMetadata)
@ value_site_count_mismatch
std::enable_if_t< std::is_unsigned_v< T >, T > SaturatingMultiply(T X, T Y, bool *ResultOverflowed=nullptr)
Multiply two unsigned integers, X and Y, of type T.
const std::error_category & instrprof_category()
Error collectVTableStrings(ArrayRef< GlobalVariable * > VTables, std::string &Result, bool doCompression)
auto count(R &&Range, const E &Element)
Wrapper function around std::count to count the number of times an element Element occurs in the give...
static StringRef getStrippedSourceFileName(const GlobalObject &GO)
uint32_t getNumValueSitesInstrProf(const void *Record, uint32_t VKind)
OutputIt copy(R &&Range, OutputIt Out)
bool canRenameComdatFunc(const Function &F, bool CheckAddressTaken=false)
Check if we can safely rename this Comdat function.
void createProfileFileNameVar(Module &M, StringRef InstrProfileOutput)
constexpr char GlobalIdentifierDelimiter
Error collectGlobalObjectNameStrings(ArrayRef< std::string > NameStrs, bool doCompression, std::string &Result)
Given a vector of strings (names of global objects like functions or virtual tables) NameStrs,...
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
void setPGOFuncVisibility(Module &M, GlobalVariable *FuncNameVar)
unsigned encodeULEB128(uint64_t Value, raw_ostream &OS, unsigned PadTo=0)
Utility function to encode a ULEB128 value to an output stream.
uint32_t getNumValueDataForSiteInstrProf(const void *R, uint32_t VK, uint32_t S)
static ValueProfRecordClosure InstrProfRecordClosure
static Error readAndDecodeStrings(StringRef NameStrings, std::function< Error(StringRef)> NameCallback)
NameStrings is a string composed of one or more possibly encoded sub-strings.
std::string getPGOFuncNameVarName(StringRef FuncName, GlobalValue::LinkageTypes Linkage)
Return the name of the global variable used to store a function name in PGO instrumentation.
static StringRef stripDirPrefix(StringRef PathNameStr, uint32_t NumPrefix)
static std::optional< std::string > lookupPGONameFromMetadata(MDNode *MD)
std::enable_if_t< std::is_unsigned_v< T >, T > SaturatingAdd(T X, T Y, bool *ResultOverflowed=nullptr)
Add two unsigned integers, X and Y, of type T.
bool isGPUProfTarget(const Module &M)
Determines whether the module targets a GPU eligible for PGO instrumentation.
bool isIRPGOFlagSet(const Module *M)
Check if INSTR_PROF_RAW_VERSION_VAR is defined.
StringRef getPGONameMetadataName()
void consumeError(Error Err)
Consume an Error without doing anything.
const uint64_t NOMORE_ICP_MAGICNUM
Magic number in the value profile metadata showing a target has been promoted for the instruction and...
uint32_t getNumValueKindsInstrProf(const void *Record)
ValueProfRecordClosure Interface implementation for InstrProfRecord class.
ValueProfData * allocValueProfDataInstrProf(size_t TotalSizeInBytes)
uint32_t getNumValueDataInstrProf(const void *Record, uint32_t VKind)
static std::string getIRPGONameForGlobalObject(const GlobalObject &GO, GlobalValue::LinkageTypes Linkage, StringRef FileName)
cl::opt< bool > EnableVTableValueProfiling("enable-vtable-value-profiling", cl::init(false), cl::desc("If true, the virtual table address will be instrumented to know " "the types of a C++ pointer. The information is used in indirect " "call promotion to do selective vtable-based comparison."))
std::array< double, IPVK_Last - IPVK_First+1 > ValueCounts
Profiling information for a single function.
void overlapValueProfData(uint32_t ValueKind, InstrProfRecord &Src, OverlapStats &Overlap, OverlapStats &FuncLevelOverlap)
Compute the overlap of value profile counts.
std::vector< uint64_t > Counts
ArrayRef< InstrProfValueData > getValueArrayForSite(uint32_t ValueKind, uint32_t Site) const
Return the array of profiled values at Site.
CountPseudoKind getCountPseudoKind() const
void accumulateCounts(CountSumOrPercent &Sum) const
Compute the sums of all counts and store in Sum.
uint32_t getNumValueSites(uint32_t ValueKind) const
Return the number of instrumented sites for ValueKind.
void setPseudoCount(CountPseudoKind Kind)
void merge(InstrProfRecord &Other, uint64_t Weight, function_ref< void(instrprof_error)> Warn)
Merge the counts in Other into this one.
void addValueData(uint32_t ValueKind, uint32_t Site, ArrayRef< InstrProfValueData > VData, InstrProfSymtab *SymTab)
Add ValueData for ValueKind at value Site.
void overlap(InstrProfRecord &Other, OverlapStats &Overlap, OverlapStats &FuncLevelOverlap, uint64_t ValueCutoff)
Compute the overlap between this InstrProfRecord and Other.
std::vector< uint8_t > BitmapBytes
void scale(uint64_t N, uint64_t D, function_ref< void(instrprof_error)> Warn)
Scale up profile counts (including value profile data) by a factor of (N / D).
void sortByTargetValues()
Sort ValueData ascending by Value.
std::vector< InstrProfValueData > ValueData
Value profiling data pairs at a given value site.
void merge(InstrProfValueSiteRecord &Input, uint64_t Weight, function_ref< void(instrprof_error)> Warn)
Merge data from another InstrProfValueSiteRecord. Optionally scale merged counts by Weight.
void overlap(InstrProfValueSiteRecord &Input, uint32_t ValueKind, OverlapStats &Overlap, OverlapStats &FuncLevelOverlap)
Compute the overlap between this record and the Input record.
void scale(uint64_t N, uint64_t D, function_ref< void(instrprof_error)> Warn)
Scale up value profile data counts by N (Numerator) / D (Denominator).
void addOneMismatch(const CountSumOrPercent &MismatchFunc)
static double score(uint64_t Val1, uint64_t Val2, double Sum1, double Sum2)
Error accumulateCounts(const std::string &BaseFilename, const std::string &TestFilename, bool IsCS)
void dump(raw_fd_ostream &OS) const
CountSumOrPercent Overlap
void addOneUnique(const CountSumOrPercent &UniqueFunc)
const std::string * BaseFilename
const std::string * TestFilename
CountSumOrPercent Mismatch
static void createBPFunctionNodes(ArrayRef< TemporalProfTraceTy > Traces, std::vector< BPFunctionNode > &Nodes, bool RemoveOutlierUNs=true)
Use a set of temporal profile traces to create a list of balanced partitioning function nodes used by...