32#define DEBUG_TYPE "ctx-instr-lower"
37 "A function name, assumed to be global, which will be treated as the "
38 "root of an interesting graph, which will be profiled independently "
39 "from other similar graphs."));
48static auto StartCtx =
"__llvm_ctx_profile_start_context";
49static auto ReleaseCtx =
"__llvm_ctx_profile_release_context";
50static auto GetCtx =
"__llvm_ctx_profile_get_context";
57class CtxInstrumentationLowerer final {
60 Type *ContextNodeTy =
nullptr;
69 Constant *CannotBeRootInitializer =
nullptr;
81std::pair<uint32_t, uint32_t> getNumCountersAndCallsites(
const Function &
F) {
83 uint32_t NumCallsites = 0;
84 for (
const auto &BB :
F) {
85 for (
const auto &
I : BB) {
88 static_cast<uint32_t
>(Incr->getNumCounters()->getZExtValue());
90 "expected all llvm.instrprof.increment[.step] intrinsics to "
91 "have the same total nr of counters parameter");
95 static_cast<uint32_t
>(CSIntr->getNumCounters()->getZExtValue());
96 assert((!NumCallsites || V == NumCallsites) &&
97 "expected all llvm.instrprof.callsite intrinsics to have the "
98 "same total nr of callsites parameter");
111 F.getContext().emitError(
"[ctxprof] The function " +
F.getName() +
112 " was indicated as context root but " + Reason +
113 ", which is not supported.");
120CtxInstrumentationLowerer::CtxInstrumentationLowerer(
Module &M,
123 auto *
PointerTy = PointerType::get(
M.getContext(), 0);
124 auto *SanitizerMutexType = Type::getInt8Ty(
M.getContext());
125 auto *I32Ty = Type::getInt32Ty(
M.getContext());
126 auto *I64Ty = Type::getInt64Ty(
M.getContext());
128#define _PTRDECL(_, __) PointerTy,
129#define _VOLATILE_PTRDECL(_, __) PointerTy,
130#define _CONTEXT_ROOT PointerTy,
131#define _MUTEXDECL(_) SanitizerMutexType,
134 M.getContext(), {CTXPROF_FUNCTION_DATA(_PTRDECL, _CONTEXT_ROOT,
135 _VOLATILE_PTRDECL, _MUTEXDECL)});
138#undef _VOLATILE_PTRDECL
141#define _PTRDECL(_, __) Constant::getNullValue(PointerTy),
142#define _VOLATILE_PTRDECL(_, __) _PTRDECL(_, __)
143#define _MUTEXDECL(_) Constant::getNullValue(SanitizerMutexType),
144#define _CONTEXT_ROOT \
145 Constant::getIntegerValue( \
147 APInt(M.getDataLayout().getPointerTypeSizeInBits(PointerTy), 1U)),
153#undef _VOLATILE_PTRDECL
167 if (
const auto *
F =
M.getFunction(Fname)) {
168 if (
F->isDeclaration())
170 ContextRootSet.insert(
F);
171 for (
const auto &BB : *
F)
172 for (
const auto &
I : BB)
174 if (CB->isMustTailCall())
175 emitUnsupportedRootError(*
F,
"it features musttail calls");
181 M.getOrInsertFunction(
201 FunctionType::get(Type::getVoidTy(
M.getContext()),
212 CallsiteInfoTLS->setThreadLocal(
true);
223 CtxInstrumentationLowerer Lowerer(M,
MAM);
226 Changed |= Lowerer.lowerFunction(
F);
230bool CtxInstrumentationLowerer::lowerFunction(
Function &
F) {
231 if (
F.isDeclaration())
241 if (ContextRootSet.contains(&
F))
242 emitUnsupportedRootError(
F,
"it does not return");
250 auto [
NumCounters, NumCallsites] = getNumCountersAndCallsites(
F);
252 Value *Context =
nullptr;
253 Value *RealContext =
nullptr;
256 Value *TheRootFuctionData =
nullptr;
257 Value *ExpectedCalleeTLSAddr =
nullptr;
258 Value *CallsiteInfoTLSAddr =
nullptr;
259 const bool HasMusttail = [&
F]() {
263 if (CB->isMustTailCall())
268 if (HasMusttail && ContextRootSet.contains(&
F)) {
269 F.getContext().emitError(
270 "[ctx_prof] A function with musttail calls was explicitly requested as "
271 "root. That is not supported because we cannot instrument a return "
272 "instruction to release the context: " +
276 auto &Head =
F.getEntryBlock();
277 for (
auto &
I : Head) {
280 assert(Mark->getIndex()->isZero());
283 Guid = Builder.getInt64(
290 {ContextNodeTy, ArrayType::get(Builder.getInt64Ty(), NumCounters),
291 ArrayType::get(Builder.getPtrTy(), NumCallsites)});
305 HasMusttail ? CannotBeRootInitializer
308 if (ContextRootSet.contains(&
F)) {
311 Builder.getInt32(NumCallsites)});
315 Context = Builder.CreateCall(GetCtx, {TheRootFuctionData, &
F,
Guid,
317 Builder.getInt32(NumCallsites)});
323 auto *CtxAsInt = Builder.CreatePtrToInt(
Context, Builder.getInt64Ty());
324 if (NumCallsites > 0) {
327 auto *
Index = Builder.CreateAnd(CtxAsInt, Builder.getInt64(1));
329 ExpectedCalleeTLSAddr = Builder.CreateGEP(
331 Builder.CreateThreadLocalAddress(ExpectedCalleeTLS), {Index});
332 CallsiteInfoTLSAddr = Builder.CreateGEP(
333 Builder.getInt32Ty(),
334 Builder.CreateThreadLocalAddress(CallsiteInfoTLS), {Index});
341 RealContext = Builder.CreateIntToPtr(
342 Builder.CreateAnd(CtxAsInt, Builder.getInt64(-2)),
351 <<
"Function doesn't have instrumentation, skipping";
356 bool ContextWasReleased =
false;
361 switch (
Instr->getIntrinsicID()) {
362 case llvm::Intrinsic::instrprof_increment:
363 case llvm::Intrinsic::instrprof_increment_step: {
367 auto *
GEP = Builder.CreateGEP(
368 ThisContextType, RealContext,
369 {Builder.getInt32(0), Builder.getInt32(1), AsStep->getIndex()});
371 Builder.CreateAdd(Builder.CreateLoad(Builder.getInt64Ty(),
GEP),
375 case llvm::Intrinsic::instrprof_callsite:
380 Builder.CreateStore(CSIntrinsic->getCallee(), ExpectedCalleeTLSAddr,
392 Builder.CreateGEP(ThisContextType,
Context,
393 {Builder.getInt32(0), Builder.getInt32(2),
394 CSIntrinsic->getIndex()}),
395 CallsiteInfoTLSAddr,
true);
402 Builder.CreateCall(ReleaseCtx, {TheRootFuctionData});
403 ContextWasReleased =
true;
407 if (!HasMusttail && !ContextWasReleased)
409 "[ctx_prof] A function that doesn't have musttail calls was "
410 "instrumented but it has no `ret` "
411 "instructions above which to release the context: " +
420 if (
F.isDeclaration())
422 if (
F.hasFnAttribute(Attribute::NoInline))
424 if (!
F.isWeakForLinker())
427 if (
F.hasFnAttribute(Attribute::AlwaysInline))
428 F.removeFnAttr(Attribute::AlwaysInline);
430 F.addFnAttr(Attribute::NoInline);
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
This file contains the declarations for the subclasses of Constant, which represent the different fla...
#define CTXPROF_FUNCTION_DATA(PTRDECL, CONTEXT_PTR, VOLATILE_PTRDECL, MUTEXDECL)
The internal structure of FunctionData.
Module.h This file contains the declarations for the Module class.
This header defines various interfaces for pass management in LLVM.
#define _VOLATILE_PTRDECL(_, __)
static cl::list< std::string > ContextRoots("profile-context-root", cl::Hidden, cl::desc("A function name, assumed to be global, which will be treated as the " "root of an interesting graph, which will be profiled independently " "from other similar graphs."))
FunctionAnalysisManager FAM
ModuleAnalysisManager MAM
static LLVM_ABI uint64_t getGUID(const Function &F)
static LLVM_ABI Constant * get(StructType *T, ArrayRef< Constant * > V)
This is an important base class in LLVM.
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
Implements a dense probed hash-table based set.
@ HiddenVisibility
The GV is hidden.
@ InternalLinkage
Rename collisions when linking (static functions).
@ ExternalLinkage
Externally visible function.
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
LLVM_ABI void emitError(const Instruction *I, const Twine &ErrorStr)
emitError - Emit an error message to the currently installed error handler with optional location inf...
A Module instance is used to store all the information related to an LLVM module.
PreservedAnalyses run(Module &M, ModuleAnalysisManager &MAM)
PreservedAnalyses run(Module &M, ModuleAnalysisManager &MAM)
static bool isCtxIRPGOInstrEnabled()
static PointerType * getUnqual(Type *ElementType)
This constructs a pointer to an object of the specified type in the default address space (address sp...
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
StringRef - Represent a constant reference to a string, i.e.
Class to represent struct types.
static LLVM_ABI StructType * get(LLVMContext &Context, ArrayRef< Type * > Elements, bool isPacked=false)
This static method is the primary way to create a literal StructType.
The instances of the Type class are immutable: once they are created, they are never changed.
LLVM Value Representation.
LLVM_ABI LLVMContext & getContext() const
All values hold a context through their type.
Pass manager infrastructure for declaring and invalidating analyses.
static auto ExpectedCalleeTLS
NodeAddr< InstrNode * > Instr
This is an optimization pass for GlobalISel generic memory operations.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
InnerAnalysisManagerProxy< FunctionAnalysisManager, Module > FunctionAnalysisManagerModuleProxy
Provide the FunctionAnalysisManager to Module proxy.
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
AnalysisManager< Module > ModuleAnalysisManager
Convenience typedef for the Module analysis manager.
LLVM_ABI bool canReturn(const Function &F)
Return true if there is at least a path through which F can return, false if there is no such path.