LLVM 20.0.0git
AlwaysInliner.cpp
Go to the documentation of this file.
1//===- AlwaysInliner.cpp - Code to inline always_inline functions ----------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements a custom inliner that handles only functions that
10// are marked as "always inline".
11//
12//===----------------------------------------------------------------------===//
13
15#include "llvm/ADT/SetVector.h"
22#include "llvm/IR/Module.h"
26
27using namespace llvm;
28
29#define DEBUG_TYPE "inline"
30
31namespace {
32
// Shared implementation used by both the legacy and the new pass-manager
// entry points in this file.
//
// For every function F in M that is not a presplit coroutine, has a body and
// passes isInlineViable(), this inlines each direct call to F for which
// CB->hasFnAttr(Attribute::AlwaysInline) holds and whose own attribute list
// does not carry NoInline. Afterwards, functions marked AlwaysInline that
// have become trivially dead are erased from the module.
//
// M                  - module to transform.
// InsertLifetime     - forwarded unchanged to InlineFunction().
// PSI                - profile summary handed to InlineFunctionInfo.
// GetAssumptionCache - callback handed to InlineFunctionInfo.
// GetAAR             - callback yielding alias-analysis results; it is
//                      invoked on the callee F.
//
// Returns true if at least one call was inlined or one function was erased.
//
// NOTE(review): this listing skips original lines 37-38. `GetBFI` and `Calls`
// are used below but their declarations are not visible here; presumably
// GetBFI is the final (nullable) callback parameter and Calls is a local
// SetVector of CallBase pointers -- confirm against the full file.
33bool AlwaysInlineImpl(
34 Module &M, bool InsertLifetime, ProfileSummaryInfo &PSI,
35 function_ref<AssumptionCache &(Function &)> GetAssumptionCache,
36 function_ref<AAResults &(Function &)> GetAAR,
39 bool Changed = false;
// Dead always_inline functions that live in a comdat are parked here and
// handled in one batch after the main loop.
40 SmallVector<Function *, 16> InlinedComdatFunctions;
41
// Early-increment iteration: F may be erased from the module at the bottom
// of the loop body.
42 for (Function &F : make_early_inc_range(M)) {
43 if (F.isPresplitCoroutine())
44 continue;
45
// Nothing to inline from a declaration or from a body that is not viable
// for inlining.
46 if (F.isDeclaration() || !isInlineViable(F).isSuccess())
47 continue;
48
49 Calls.clear();
50
// Gather the qualifying call sites first; the inlining loop below then works
// from this snapshot instead of walking F.users() directly. Users that are
// not calls, or calls whose called function is not F itself, are ignored.
51 for (User *U : F.users())
52 if (auto *CB = dyn_cast<CallBase>(U))
53 if (CB->getCalledFunction() == &F &&
54 CB->hasFnAttr(Attribute::AlwaysInline) &&
55 !CB->getAttributes().hasFnAttr(Attribute::NoInline))
56 Calls.insert(CB);
57
58 for (CallBase *CB : Calls) {
59 Function *Caller = CB->getCaller();
60 OptimizationRemarkEmitter ORE(Caller);
// Capture location and parent block up front; both are used by the remarks
// emitted after the InlineFunction() call.
61 DebugLoc DLoc = CB->getDebugLoc();
62 BasicBlock *Block = CB->getParent();
63
// GetBFI is optional: when it is null no block-frequency info is supplied
// for either the caller or the callee.
64 InlineFunctionInfo IFI(GetAssumptionCache, &PSI,
65 GetBFI ? &GetBFI(*Caller) : nullptr,
66 GetBFI ? &GetBFI(F) : nullptr);
67
68 InlineResult Res = InlineFunction(*CB, IFI, /*MergeAttributes=*/true,
69 &GetAAR(F), InsertLifetime);
// On failure, report a missed-optimization remark carrying the callee, the
// caller and the failure reason, then move on to the next call site.
70 if (!Res.isSuccess()) {
71 ORE.emit([&]() {
72 return OptimizationRemarkMissed(DEBUG_TYPE, "NotInlined", DLoc, Block)
73 << "'" << ore::NV("Callee", &F) << "' is not inlined into '"
74 << ore::NV("Caller", Caller)
75 << "': " << ore::NV("Reason", Res.getFailureReason());
76 });
77 continue;
78 }
79
// NOTE(review): the head of this call (original line 80) is missing from the
// listing; the argument list looks like a call to emitInlinedIntoBasedOnCost()
// reporting the successful inline -- confirm against the full file.
81 ORE, DLoc, Block, F, *Caller,
82 InlineCost::getAlways("always inline attribute"),
83 /*ForProfileContext=*/false, DEBUG_TYPE);
84
85 Changed = true;
86 }
87
// Drop dead constant users before testing whether F is trivially dead. Only
// functions that themselves carry AlwaysInline are candidates for deletion.
88 F.removeDeadConstantUsers();
89 if (F.hasFnAttribute(Attribute::AlwaysInline) && F.isDefTriviallyDead()) {
90 // Remember to try and delete this function afterward. This lets us call
91 // filterDeadComdatFunctions() only once.
92 if (F.hasComdat()) {
93 InlinedComdatFunctions.push_back(&F);
94 } else {
95 M.getFunctionList().erase(F);
96 Changed = true;
97 }
98 }
99 }
100
101 if (!InlinedComdatFunctions.empty()) {
102 // Now we just have the comdat functions. Filter out the ones whose comdats
103 // are not actually dead.
104 filterDeadComdatFunctions(InlinedComdatFunctions);
105 // The remaining functions are actually dead.
106 for (Function *F : InlinedComdatFunctions) {
107 M.getFunctionList().erase(F);
108 Changed = true;
109 }
110 }
111
112 return Changed;
113}
114
// Legacy pass-manager wrapper: a ModulePass that fetches the analyses it
// needs and forwards to AlwaysInlineImpl().
115struct AlwaysInlinerLegacyPass : public ModulePass {
// Passed straight through to AlwaysInlineImpl() in runOnModule().
116 bool InsertLifetime;
117
// The default constructor delegates with InsertLifetime = true.
118 AlwaysInlinerLegacyPass()
119 : AlwaysInlinerLegacyPass(/*InsertLifetime*/ true) {}
120
// NOTE(review): the constructor body (original line 123) is missing from this
// listing; presumably it registers the pass with the PassRegistry -- confirm.
121 AlwaysInlinerLegacyPass(bool InsertLifetime)
122 : ModulePass(ID), InsertLifetime(InsertLifetime) {
124 }
125
// NOTE(review): the skipSCC() remark below looks stale for a ModulePass --
// confirm whether it still applies.
126 /// Main run interface method. We override here to avoid calling skipSCC().
127 bool runOnModule(Module &M) override {
128
// Profile summary comes from the module-level wrapper pass; alias analysis
// and the assumption cache are looked up lazily per function through the
// callbacks below.
129 auto &PSI = getAnalysis<ProfileSummaryInfoWrapperPass>().getPSI();
130 auto GetAAR = [&](Function &F) -> AAResults & {
131 return getAnalysis<AAResultsWrapperPass>(F).getAAResults();
132 };
133 auto GetAssumptionCache = [&](Function &F) -> AssumptionCache & {
134 return getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F);
135 };
136
// No block-frequency callback is supplied on this path (GetBFI is null).
137 return AlwaysInlineImpl(M, InsertLifetime, PSI, GetAssumptionCache, GetAAR,
138 /*GetBFI*/ nullptr);
139 }
140
141 static char ID; // Pass identification, replacement for typeid
142
// NOTE(review): the body (original lines 144-146) is missing from this
// listing; presumably it declares the three analyses used in runOnModule()
// as required -- confirm against the full file.
143 void getAnalysisUsage(AnalysisUsage &AU) const override {
147 }
148};
149
150} // namespace
151
// Out-of-class definition of the pass identifier, followed by the legacy
// pass registration under the command-line argument "always-inline". The two
// trailing `false` arguments fill the macro's `cfg` and `analysis` slots.
// NOTE(review): original lines 155-157 between BEGIN and END are missing from
// this listing; presumably INITIALIZE_PASS_DEPENDENCY entries -- confirm.
152char AlwaysInlinerLegacyPass::ID = 0;
153INITIALIZE_PASS_BEGIN(AlwaysInlinerLegacyPass, "always-inline",
154 "Inliner for always_inline functions", false, false)
158INITIALIZE_PASS_END(AlwaysInlinerLegacyPass, "always-inline",
159 "Inliner for always_inline functions", false, false)
160
// Heap-allocates a legacy always-inliner pass configured with InsertLifetime
// and hands the raw pointer back to the caller.
// NOTE(review): the signature (original line 161) is missing from this
// listing; presumably this is the body of createAlwaysInlinerLegacyPass(bool)
// -- confirm against the full file.
162 return new AlwaysInlinerLegacyPass(InsertLifetime);
163}
164
// New pass-manager entry point: builds per-function analysis callbacks, runs
// AlwaysInlineImpl(), and reports which analyses survive.
// NOTE(review): the function signature and the definition of FAM (original
// lines 165-168), as well as the bodies of the first two lambdas (lines 170
// and 173), are missing from this listing; presumably they fetch the
// corresponding results from FAM the same way GetAAR does -- confirm.
169 auto GetAssumptionCache = [&](Function &F) -> AssumptionCache & {
171 };
172 auto GetBFI = [&](Function &F) -> BlockFrequencyInfo & {
174 };
175 auto GetAAR = [&](Function &F) -> AAResults & {
176 return FAM.getResult<AAManager>(F);
177 };
178 auto &PSI = MAM.getResult<ProfileSummaryAnalysis>(M);
179
// Unlike the legacy path, a block-frequency callback is supplied here.
180 bool Changed = AlwaysInlineImpl(M, InsertLifetime, PSI, GetAssumptionCache,
181 GetAAR, GetBFI);
182
// Any change to the module is reported as preserving no analyses; an
// untouched module preserves everything.
183 return Changed ? PreservedAnalyses::none() : PreservedAnalyses::all();
184}
for(const MachineOperand &MO :llvm::drop_begin(OldMI.operands(), Desc.getNumOperands()))
always Inliner for always_inline functions
always inline
#define DEBUG_TYPE
Provides passes for inlining "always_inline" functions.
#define F(x, y, z)
Definition: MD5.cpp:55
Module.h This file contains the declarations for the Module class.
FunctionAnalysisManager FAM
ModuleAnalysisManager MAM
#define INITIALIZE_PASS_DEPENDENCY(depName)
Definition: PassSupport.h:55
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:57
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:52
This file implements a set that has insertion order iteration characteristics.
A manager for alias analyses.
A wrapper pass to provide the legacy pass manager access to a suitably prepared AAResults object.
PreservedAnalyses run(Module &M, ModuleAnalysisManager &)
A container for analyses that lazily runs them and caches their results.
Definition: PassManager.h:253
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Definition: PassManager.h:405
Represent the analysis usage information of a pass.
AnalysisUsage & addRequired()
A function analysis which provides an AssumptionCache.
An immutable pass that tracks lazily created AssumptionCache objects.
A cache of @llvm.assume calls within a function.
LLVM Basic Block Representation.
Definition: BasicBlock.h:61
Analysis pass which computes BlockFrequencyInfo.
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition: InstrTypes.h:1236
A debug info location.
Definition: DebugLoc.h:33
static InlineCost getAlways(const char *Reason, std::optional< CostBenefitPair > CostBenefit=std::nullopt)
Definition: InlineCost.h:126
This class captures the data input to the InlineFunction call, and records the auxiliary results prod...
Definition: Cloning.h:203
InlineResult is basically true or false.
Definition: InlineCost.h:180
bool isSuccess() const
Definition: InlineCost.h:189
const char * getFailureReason() const
Definition: InlineCost.h:190
An analysis over an "outer" IR unit that provides access to an analysis manager over an "inner" IR un...
Definition: PassManager.h:563
ModulePass class - This class is used to implement unstructured interprocedural optimizations and ana...
Definition: Pass.h:251
virtual bool runOnModule(Module &M)=0
runOnModule - Virtual method overridden by subclasses to process the module being operated on.
A Module instance is used to store all the information related to an LLVM module.
Definition: Module.h:65
The optimization diagnostic interface.
void emit(DiagnosticInfoOptimizationBase &OptDiag)
Output the remark via the diagnostic handler and to the optimization record file.
Diagnostic information for missed-optimization remarks.
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
Pass interface - Implemented by all 'passes'.
Definition: Pass.h:94
virtual void getAnalysisUsage(AnalysisUsage &) const
getAnalysisUsage - This function should be overridden by passes that need analysis information to do t...
Definition: Pass.cpp:98
A set of analyses that are preserved following a run of a transformation pass.
Definition: Analysis.h:111
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
Definition: Analysis.h:114
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: Analysis.h:117
An analysis pass based on the new PM to deliver ProfileSummaryInfo.
An analysis pass based on legacy pass manager to deliver ProfileSummaryInfo.
Analysis providing profile information.
void clear()
Completely clear the SetVector.
Definition: SetVector.h:273
bool insert(const value_type &X)
Insert a new element into the SetVector.
Definition: SetVector.h:162
A SetVector that performs no allocations if smaller than a certain size.
Definition: SetVector.h:370
bool empty() const
Definition: SmallVector.h:94
void push_back(const T &Elt)
Definition: SmallVector.h:426
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1209
An efficient, type-erasing, non-owning reference to a callable.
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
Definition: CallingConv.h:24
DiagnosticInfoOptimizationBase::Argument NV
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
Definition: STLExtras.h:656
InlineResult isInlineViable(Function &Callee)
Minimal filter to detect invalid constructs for inlining.
void emitInlinedIntoBasedOnCost(OptimizationRemarkEmitter &ORE, DebugLoc DLoc, const BasicBlock *Block, const Function &Callee, const Function &Caller, const InlineCost &IC, bool ForProfileContext=false, const char *PassName=nullptr)
Emit ORE message based on cost (default heuristic).
Pass * createAlwaysInlinerLegacyPass(bool InsertLifetime=true)
Create a legacy pass manager instance of a pass to inline and remove functions marked as "always_inli...
InlineResult InlineFunction(CallBase &CB, InlineFunctionInfo &IFI, bool MergeAttributes=false, AAResults *CalleeAAR=nullptr, bool InsertLifetime=true, Function *ForwardVarArgsTo=nullptr)
This function inlines the called function into the basic block of the caller.
void filterDeadComdatFunctions(SmallVectorImpl< Function * > &DeadComdatFunctions)
Filter out potentially dead comdat functions where other entries keep the entire comdat group alive.
void initializeAlwaysInlinerLegacyPassPass(PassRegistry &)